risingwave_storage/
opts.rs

1// Copyright 2025 RisingWave Labs
2//
3// Licensed under the Apache License, Version 2.0 (the "License");
4// you may not use this file except in compliance with the License.
5// You may obtain a copy of the License at
6//
7//     http://www.apache.org/licenses/LICENSE-2.0
8//
9// Unless required by applicable law or agreed to in writing, software
10// distributed under the License is distributed on an "AS IS" BASIS,
11// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12// See the License for the specific language governing permissions and
13// limitations under the License.
14
15use risingwave_common::config::{
16    EvictionConfig, ObjectStoreConfig, RwConfig, StorageMemoryConfig, extract_storage_memory_config,
17};
18use risingwave_common::system_param::reader::{SystemParamsRead, SystemParamsReader};
19use risingwave_common::system_param::system_params_for_test;
20
21#[derive(Clone, Debug)]
22pub struct StorageOpts {
23    /// The size of parallel task for one compact/flush job.
24    pub parallel_compact_size_mb: u32,
25    /// Target size of the Sstable.
26    pub sstable_size_mb: u32,
27    /// Minimal target size of the Sstable to store data of different state-table in independent files as soon as possible.
28    pub min_sstable_size_mb: u32,
29    /// Size of each block in bytes in SST.
30    pub block_size_kb: u32,
31    /// False positive probability of bloom filter.
32    pub bloom_false_positive: f64,
33    /// parallelism while syncing share buffers into L0 SST. Should NOT be 0.
34    pub share_buffers_sync_parallelism: u32,
35    /// Worker threads number of dedicated tokio runtime for share buffer compaction. 0 means use
36    /// tokio's default value (number of CPU core).
37    pub share_buffer_compaction_worker_threads_number: u32,
38    /// Maximum shared buffer size, writes attempting to exceed the capacity will stall until there
39    /// is enough space.
40    pub shared_buffer_capacity_mb: usize,
41    /// The shared buffer will start flushing data to object when the ratio of memory usage to the
42    /// shared buffer capacity exceed such ratio.
43    pub shared_buffer_flush_ratio: f32,
44    /// The minimum total flush size of shared buffer spill. When a shared buffer spill is trigger,
45    /// the total flush size across multiple epochs should be at least higher than this size.
46    pub shared_buffer_min_batch_flush_size_mb: usize,
47    /// Remote directory for storing data and metadata objects.
48    pub data_directory: String,
49    /// Whether to enable write conflict detection
50    pub write_conflict_detection_enabled: bool,
51    /// Capacity of sstable block cache.
52    pub block_cache_capacity_mb: usize,
53    /// the number of block-cache shard. Less shard means that more concurrent-conflict.
54    pub block_cache_shard_num: usize,
55    /// Eviction config for block cache.
56    pub block_cache_eviction_config: EvictionConfig,
57    /// Capacity of sstable meta cache.
58    pub meta_cache_capacity_mb: usize,
59    /// the number of meta-cache shard. Less shard means that more concurrent-conflict.
60    pub meta_cache_shard_num: usize,
61    /// Eviction config for meta cache.
62    pub meta_cache_eviction_config: EvictionConfig,
63    /// max memory usage for large query.
64    pub prefetch_buffer_capacity_mb: usize,
65
66    pub max_cached_recent_versions_number: usize,
67
68    pub max_prefetch_block_number: usize,
69
70    pub disable_remote_compactor: bool,
71    /// Number of tasks shared buffer can upload in parallel.
72    pub share_buffer_upload_concurrency: usize,
73    /// Capacity of sstable meta cache.
74    pub compactor_memory_limit_mb: usize,
75    /// compactor streaming iterator recreate timeout.
76    /// deprecated
77    pub compact_iter_recreate_timeout_ms: u64,
78    /// Number of SST ids fetched from meta per RPC
79    pub sstable_id_remote_fetch_number: u32,
80    /// Whether to enable streaming upload for sstable.
81    pub min_sst_size_for_streaming_upload: u64,
82    pub max_concurrent_compaction_task_number: u64,
83    pub max_version_pinning_duration_sec: u64,
84    pub compactor_iter_max_io_retry_times: usize,
85
86    pub data_file_cache_dir: String,
87    pub data_file_cache_capacity_mb: usize,
88    pub data_file_cache_file_capacity_mb: usize,
89    pub data_file_cache_flushers: usize,
90    pub data_file_cache_reclaimers: usize,
91    pub data_file_cache_recover_mode: foyer::RecoverMode,
92    pub data_file_cache_recover_concurrency: usize,
93    pub data_file_cache_indexer_shards: usize,
94    pub data_file_cache_compression: foyer::Compression,
95    pub data_file_cache_flush_buffer_threshold_mb: usize,
96    pub data_file_cache_fifo_probation_ratio: f64,
97    pub data_file_cache_runtime_config: foyer::RuntimeOptions,
98    pub data_file_cache_throttle: foyer::Throttle,
99
100    pub cache_refill_data_refill_levels: Vec<u32>,
101    pub cache_refill_timeout_ms: u64,
102    pub cache_refill_concurrency: usize,
103    pub cache_refill_recent_filter_layers: usize,
104    pub cache_refill_recent_filter_rotate_interval_ms: usize,
105    pub cache_refill_unit: usize,
106    pub cache_refill_threshold: f64,
107
108    pub meta_file_cache_dir: String,
109    pub meta_file_cache_capacity_mb: usize,
110    pub meta_file_cache_file_capacity_mb: usize,
111    pub meta_file_cache_flushers: usize,
112    pub meta_file_cache_reclaimers: usize,
113    pub meta_file_cache_recover_mode: foyer::RecoverMode,
114    pub meta_file_cache_recover_concurrency: usize,
115    pub meta_file_cache_indexer_shards: usize,
116    pub meta_file_cache_compression: foyer::Compression,
117    pub meta_file_cache_flush_buffer_threshold_mb: usize,
118    pub meta_file_cache_fifo_probation_ratio: f64,
119    pub meta_file_cache_runtime_config: foyer::RuntimeOptions,
120    pub meta_file_cache_throttle: foyer::Throttle,
121
122    /// The storage url for storing backups.
123    pub backup_storage_url: String,
124    /// The storage directory for storing backups.
125    pub backup_storage_directory: String,
126    /// max time which wait for preload. 0 represent do not do any preload.
127    pub max_preload_wait_time_mill: u64,
128
129    pub compactor_max_sst_key_count: u64,
130    pub compactor_max_task_multiplier: f32,
131    pub compactor_max_sst_size: u64,
132    /// enable `FastCompactorRunner`.
133    pub enable_fast_compaction: bool,
134    pub check_compaction_result: bool,
135    pub max_preload_io_retry_times: usize,
136    pub compactor_fast_max_compact_delete_ratio: u32,
137    pub compactor_fast_max_compact_task_size: u64,
138
139    pub mem_table_spill_threshold: usize,
140
141    pub compactor_concurrent_uploading_sst_count: Option<usize>,
142
143    pub compactor_max_overlap_sst_count: usize,
144
145    /// The maximum number of meta files that can be preloaded.
146    pub compactor_max_preload_meta_file_count: usize,
147
148    pub object_store_config: ObjectStoreConfig,
149    pub time_travel_version_cache_capacity: u64,
150
151    pub iceberg_compaction_target_file_size_mb: u32,
152    pub iceberg_compaction_enable_validate: bool,
153    pub iceberg_compaction_max_record_batch_rows: usize,
154    pub iceberg_compaction_write_parquet_max_row_group_rows: usize,
155    pub iceberg_compaction_min_size_per_partition_mb: u32,
156    pub iceberg_compaction_max_file_count_per_partition: u32,
157}
158
159impl Default for StorageOpts {
160    fn default() -> Self {
161        let c = RwConfig::default();
162        let p = system_params_for_test();
163        let s = extract_storage_memory_config(&c);
164        Self::from((&c, &p.into(), &s))
165    }
166}
167
168impl From<(&RwConfig, &SystemParamsReader, &StorageMemoryConfig)> for StorageOpts {
169    fn from((c, p, s): (&RwConfig, &SystemParamsReader, &StorageMemoryConfig)) -> Self {
170        let mut data_file_cache_throttle = c.storage.data_file_cache.throttle.clone();
171        if data_file_cache_throttle.write_throughput.is_none() {
172            data_file_cache_throttle = data_file_cache_throttle.with_write_throughput(
173                c.storage.data_file_cache.insert_rate_limit_mb * 1024 * 1024,
174            );
175        }
176        let mut meta_file_cache_throttle = c.storage.meta_file_cache.throttle.clone();
177        if meta_file_cache_throttle.write_throughput.is_none() {
178            meta_file_cache_throttle = meta_file_cache_throttle.with_write_throughput(
179                c.storage.meta_file_cache.insert_rate_limit_mb * 1024 * 1024,
180            );
181        }
182
183        Self {
184            parallel_compact_size_mb: p.parallel_compact_size_mb(),
185            sstable_size_mb: p.sstable_size_mb(),
186            min_sstable_size_mb: c.storage.min_sstable_size_mb,
187            block_size_kb: p.block_size_kb(),
188            bloom_false_positive: p.bloom_false_positive(),
189            share_buffers_sync_parallelism: c.storage.share_buffers_sync_parallelism,
190            share_buffer_compaction_worker_threads_number: c
191                .storage
192                .share_buffer_compaction_worker_threads_number,
193            shared_buffer_capacity_mb: s.shared_buffer_capacity_mb,
194            shared_buffer_flush_ratio: c.storage.shared_buffer_flush_ratio,
195            shared_buffer_min_batch_flush_size_mb: c.storage.shared_buffer_min_batch_flush_size_mb,
196            data_directory: p.data_directory().to_owned(),
197            write_conflict_detection_enabled: c.storage.write_conflict_detection_enabled,
198            block_cache_capacity_mb: s.block_cache_capacity_mb,
199            block_cache_shard_num: s.block_cache_shard_num,
200            block_cache_eviction_config: s.block_cache_eviction_config.clone(),
201            meta_cache_capacity_mb: s.meta_cache_capacity_mb,
202            meta_cache_shard_num: s.meta_cache_shard_num,
203            meta_cache_eviction_config: s.meta_cache_eviction_config.clone(),
204            prefetch_buffer_capacity_mb: s.prefetch_buffer_capacity_mb,
205            max_cached_recent_versions_number: c.storage.max_cached_recent_versions_number,
206            max_prefetch_block_number: c.storage.max_prefetch_block_number,
207            disable_remote_compactor: c.storage.disable_remote_compactor,
208            share_buffer_upload_concurrency: c.storage.share_buffer_upload_concurrency,
209            compactor_memory_limit_mb: s.compactor_memory_limit_mb,
210            sstable_id_remote_fetch_number: c.storage.sstable_id_remote_fetch_number,
211            min_sst_size_for_streaming_upload: c.storage.min_sst_size_for_streaming_upload,
212            max_concurrent_compaction_task_number: c.storage.max_concurrent_compaction_task_number,
213            max_version_pinning_duration_sec: c.storage.max_version_pinning_duration_sec,
214            data_file_cache_dir: c.storage.data_file_cache.dir.clone(),
215            data_file_cache_capacity_mb: c.storage.data_file_cache.capacity_mb,
216            data_file_cache_file_capacity_mb: c.storage.data_file_cache.file_capacity_mb,
217            data_file_cache_flushers: c.storage.data_file_cache.flushers,
218            data_file_cache_reclaimers: c.storage.data_file_cache.reclaimers,
219            data_file_cache_recover_mode: c.storage.data_file_cache.recover_mode,
220            data_file_cache_recover_concurrency: c.storage.data_file_cache.recover_concurrency,
221            data_file_cache_indexer_shards: c.storage.data_file_cache.indexer_shards,
222            data_file_cache_compression: c.storage.data_file_cache.compression,
223            data_file_cache_flush_buffer_threshold_mb: s.block_file_cache_flush_buffer_threshold_mb,
224            data_file_cache_fifo_probation_ratio: c.storage.data_file_cache.fifo_probation_ratio,
225            data_file_cache_runtime_config: c.storage.data_file_cache.runtime_config.clone(),
226            data_file_cache_throttle,
227            meta_file_cache_dir: c.storage.meta_file_cache.dir.clone(),
228            meta_file_cache_capacity_mb: c.storage.meta_file_cache.capacity_mb,
229            meta_file_cache_file_capacity_mb: c.storage.meta_file_cache.file_capacity_mb,
230            meta_file_cache_flushers: c.storage.meta_file_cache.flushers,
231            meta_file_cache_reclaimers: c.storage.meta_file_cache.reclaimers,
232            meta_file_cache_recover_mode: c.storage.meta_file_cache.recover_mode,
233            meta_file_cache_recover_concurrency: c.storage.meta_file_cache.recover_concurrency,
234            meta_file_cache_indexer_shards: c.storage.meta_file_cache.indexer_shards,
235            meta_file_cache_compression: c.storage.meta_file_cache.compression,
236            meta_file_cache_flush_buffer_threshold_mb: s.meta_file_cache_flush_buffer_threshold_mb,
237            meta_file_cache_fifo_probation_ratio: c.storage.meta_file_cache.fifo_probation_ratio,
238            meta_file_cache_runtime_config: c.storage.meta_file_cache.runtime_config.clone(),
239            meta_file_cache_throttle,
240            cache_refill_data_refill_levels: c.storage.cache_refill.data_refill_levels.clone(),
241            cache_refill_timeout_ms: c.storage.cache_refill.timeout_ms,
242            cache_refill_concurrency: c.storage.cache_refill.concurrency,
243            cache_refill_recent_filter_layers: c.storage.cache_refill.recent_filter_layers,
244            cache_refill_recent_filter_rotate_interval_ms: c
245                .storage
246                .cache_refill
247                .recent_filter_rotate_interval_ms,
248            cache_refill_unit: c.storage.cache_refill.unit,
249            cache_refill_threshold: c.storage.cache_refill.threshold,
250            max_preload_wait_time_mill: c.storage.max_preload_wait_time_mill,
251            compact_iter_recreate_timeout_ms: c.storage.compact_iter_recreate_timeout_ms,
252
253            max_preload_io_retry_times: c.storage.max_preload_io_retry_times,
254            backup_storage_url: p.backup_storage_url().to_owned(),
255            backup_storage_directory: p.backup_storage_directory().to_owned(),
256            compactor_max_sst_key_count: c.storage.compactor_max_sst_key_count,
257            compactor_max_task_multiplier: c.storage.compactor_max_task_multiplier,
258            compactor_max_sst_size: c.storage.compactor_max_sst_size,
259            enable_fast_compaction: c.storage.enable_fast_compaction,
260            check_compaction_result: c.storage.check_compaction_result,
261            mem_table_spill_threshold: c.storage.mem_table_spill_threshold,
262            object_store_config: c.storage.object_store.clone(),
263            compactor_fast_max_compact_delete_ratio: c
264                .storage
265                .compactor_fast_max_compact_delete_ratio,
266            compactor_fast_max_compact_task_size: c.storage.compactor_fast_max_compact_task_size,
267            compactor_iter_max_io_retry_times: c.storage.compactor_iter_max_io_retry_times,
268            compactor_concurrent_uploading_sst_count: c
269                .storage
270                .compactor_concurrent_uploading_sst_count,
271            time_travel_version_cache_capacity: c.storage.time_travel_version_cache_capacity,
272            compactor_max_overlap_sst_count: c.storage.compactor_max_overlap_sst_count,
273            compactor_max_preload_meta_file_count: c.storage.compactor_max_preload_meta_file_count,
274
275            iceberg_compaction_target_file_size_mb: c
276                .storage
277                .iceberg_compaction_target_file_size_mb,
278            iceberg_compaction_enable_validate: c.storage.iceberg_compaction_enable_validate,
279            iceberg_compaction_max_record_batch_rows: c
280                .storage
281                .iceberg_compaction_max_record_batch_rows,
282            iceberg_compaction_write_parquet_max_row_group_rows: c
283                .storage
284                .iceberg_compaction_write_parquet_max_row_group_rows,
285            iceberg_compaction_min_size_per_partition_mb: c
286                .storage
287                .iceberg_compaction_min_size_per_partition_mb,
288            iceberg_compaction_max_file_count_per_partition: c
289                .storage
290                .iceberg_compaction_max_file_count_per_partition,
291        }
292    }
293}