@@ -113,32 +113,13 @@ impl GarbageCollector {
113113 counters : GarbageCollectorCounters :: default ( ) ,
114114 }
115115 }
116- // if !deleted_file_entries.is_empty() {
117- // let num_deleted_splits = deleted_file_entries.len();
118- // let num_deleted_bytes = deleted_file_entries
119- // .iter()
120- // .map(|entry| entry.file_size_bytes.as_u64() as usize)
121- // .sum::<usize>();
122- // let deleted_files: HashSet<&Path> = deleted_file_entries
123- // .iter()
124- // .map(|deleted_entry| deleted_entry.file_name.as_path())
125- // .take(5)
126- // .collect();
127- // info!(
128- // num_deleted_splits = num_deleted_splits,
129- // "Janitor deleted {:?} and {} other splits.", deleted_files, num_deleted_splits,
130- // );
131- // self.counters.num_deleted_files += num_deleted_splits;
132- // self.counters.num_deleted_bytes += num_deleted_bytes;
133116
134117 fn record_gc_result ( & mut self , result : & GcRunResult , split_type : & str ) {
135118 self . counters . num_failed_splits += result. num_failed ;
136119 if result. num_deleted_splits > 0 {
137120 info ! (
138121 "Janitor deleted {:?} and {} other {} splits." ,
139- result. sample_deleted_files,
140- result. num_deleted_splits,
141- split_type,
122+ result. sample_deleted_files, result. num_deleted_splits, split_type,
142123 ) ;
143124 self . counters . num_deleted_files += result. num_deleted_splits ;
144125 self . counters . num_deleted_bytes += result. num_deleted_bytes ;
@@ -222,22 +203,40 @@ impl GarbageCollector {
222203 . await ;
223204
224205 let tantivy_run_duration = tantivy_start. elapsed ( ) . as_secs ( ) ;
225- JANITOR_METRICS . gc_seconds_total . with_label_values ( [ "tantivy" ] ) . inc_by ( tantivy_run_duration) ;
206+ JANITOR_METRICS
207+ . gc_seconds_total
208+ . with_label_values ( [ "tantivy" ] )
209+ . inc_by ( tantivy_run_duration) ;
226210
227211 let result = match gc_res {
228212 Ok ( removal_info) => {
229213 self . counters . num_successful_gc_run += 1 ;
230- JANITOR_METRICS . gc_runs . with_label_values ( [ "success" , "tantivy" ] ) . inc ( ) ;
214+ JANITOR_METRICS
215+ . gc_runs
216+ . with_label_values ( [ "success" , "tantivy" ] )
217+ . inc ( ) ;
231218 GcRunResult {
232219 num_deleted_splits : removal_info. removed_split_entries . len ( ) ,
233- num_deleted_bytes : removal_info. removed_split_entries . iter ( ) . map ( |e| e. file_size_bytes . as_u64 ( ) as usize ) . sum ( ) ,
220+ num_deleted_bytes : removal_info
221+ . removed_split_entries
222+ . iter ( )
223+ . map ( |e| e. file_size_bytes . as_u64 ( ) as usize )
224+ . sum ( ) ,
234225 num_failed : removal_info. failed_splits . len ( ) ,
235- sample_deleted_files : removal_info. removed_split_entries . iter ( ) . take ( 5 ) . map ( |e| e. file_name . display ( ) . to_string ( ) ) . collect ( ) ,
226+ sample_deleted_files : removal_info
227+ . removed_split_entries
228+ . iter ( )
229+ . take ( 5 )
230+ . map ( |e| e. file_name . display ( ) . to_string ( ) )
231+ . collect ( ) ,
236232 }
237233 }
238234 Err ( error) => {
239235 self . counters . num_failed_gc_run += 1 ;
240- JANITOR_METRICS . gc_runs . with_label_values ( [ "error" , "tantivy" ] ) . inc ( ) ;
236+ JANITOR_METRICS
237+ . gc_runs
238+ . with_label_values ( [ "error" , "tantivy" ] )
239+ . inc ( ) ;
241240 error ! ( error=?error, "failed to run garbage collection" ) ;
242241 GcRunResult :: failed ( )
243242 }
@@ -260,22 +259,36 @@ impl GarbageCollector {
260259 . await ;
261260
262261 let parquet_run_duration = parquet_start. elapsed ( ) . as_secs ( ) ;
263- JANITOR_METRICS . gc_seconds_total . with_label_values ( [ "parquet" ] ) . inc_by ( parquet_run_duration) ;
262+ JANITOR_METRICS
263+ . gc_seconds_total
264+ . with_label_values ( [ "parquet" ] )
265+ . inc_by ( parquet_run_duration) ;
264266
265267 let result = match gc_res {
266268 Ok ( removal_info) => {
267269 self . counters . num_successful_gc_run += 1 ;
268- JANITOR_METRICS . gc_runs . with_label_values ( [ "success" , "parquet" ] ) . inc ( ) ;
270+ JANITOR_METRICS
271+ . gc_runs
272+ . with_label_values ( [ "success" , "parquet" ] )
273+ . inc ( ) ;
269274 GcRunResult {
270275 num_deleted_splits : removal_info. removed_split_count ( ) ,
271276 num_deleted_bytes : removal_info. removed_bytes ( ) as usize ,
272277 num_failed : removal_info. failed_split_count ( ) ,
273- sample_deleted_files : removal_info. removed_parquet_splits_entries . iter ( ) . take ( 5 ) . map ( |e| format ! ( "{}.parquet" , e. split_id) ) . collect ( ) ,
278+ sample_deleted_files : removal_info
279+ . removed_parquet_splits_entries
280+ . iter ( )
281+ . take ( 5 )
282+ . map ( |e| format ! ( "{}.parquet" , e. split_id) )
283+ . collect ( ) ,
274284 }
275285 }
276286 Err ( error) => {
277287 self . counters . num_failed_gc_run += 1 ;
278- JANITOR_METRICS . gc_runs . with_label_values ( [ "error" , "parquet" ] ) . inc ( ) ;
288+ JANITOR_METRICS
289+ . gc_runs
290+ . with_label_values ( [ "error" , "parquet" ] )
291+ . inc ( ) ;
279292 error ! ( error=?error, "failed to run parquet garbage collection" ) ;
280293 GcRunResult :: failed ( )
281294 }
@@ -865,15 +878,13 @@ mod tests {
865878 let storage_resolver = StorageResolver :: unconfigured ( ) ;
866879 let mut mock = MockMetastoreService :: new ( ) ;
867880
868- mock. expect_list_indexes_metadata ( )
869- . times ( 1 )
870- . returning ( |_| {
871- let indexes = vec ! [ IndexMetadata :: for_test(
872- "otel-metrics-v0_1" ,
873- "ram://indexes/otel-metrics-v0_1" ,
874- ) ] ;
875- Ok ( ListIndexesMetadataResponse :: for_test ( indexes) )
876- } ) ;
881+ mock. expect_list_indexes_metadata ( ) . times ( 1 ) . returning ( |_| {
882+ let indexes = vec ! [ IndexMetadata :: for_test(
883+ "otel-metrics-v0_1" ,
884+ "ram://indexes/otel-metrics-v0_1" ,
885+ ) ] ;
886+ Ok ( ListIndexesMetadataResponse :: for_test ( indexes) )
887+ } ) ;
877888
878889 let marked_split = MetricsSplitRecord {
879890 state : MetricsSplitState :: MarkedForDeletion ,
@@ -903,10 +914,8 @@ mod tests {
903914 Ok ( EmptyResponse { } )
904915 } ) ;
905916
906- let garbage_collect_actor = GarbageCollector :: new (
907- MetastoreServiceClient :: from_mock ( mock) ,
908- storage_resolver,
909- ) ;
917+ let garbage_collect_actor =
918+ GarbageCollector :: new ( MetastoreServiceClient :: from_mock ( mock) , storage_resolver) ;
910919 let universe = Universe :: with_accelerated_time ( ) ;
911920 let ( _mailbox, handle) = universe. spawn_builder ( ) . spawn ( garbage_collect_actor) ;
912921
0 commit comments