Constellation, Spacedust, Slingshot, UFOs: atproto crates and services for microcosm

split out an interval for more rw tasks

and sketch out record trimming
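
The refactor replaces the single `sleep(0.1)`-driven loop with three staggered `tokio::time` intervals multiplexed through one `tokio::select!`, each arm pushing its blocking DB work onto `spawn_blocking`. Here is a minimal, self-contained sketch of that pattern; the names, periods, and the `do_blocking_work` stand-in are illustrative only, not the real ufos types:

```rust
use std::time::Duration;
use tokio::time::{interval_at, Instant, MissedTickBehavior};

// stand-in for the blocking storage work done off the async runtime
fn do_blocking_work(name: &'static str) {
    std::thread::sleep(Duration::from_millis(10));
    println!("{name} done");
}

#[tokio::main]
async fn main() -> anyhow::Result<()> {
    let now = Instant::now();
    // staggered start offsets keep the tickers from firing at the same moment
    let mut fast = interval_at(now, Duration::from_millis(51));
    let mut slow = interval_at(now + Duration::from_millis(400), Duration::from_millis(900));
    // if a task overruns its period, drop the missed ticks instead of
    // firing them in a catch-up burst afterwards
    fast.set_missed_tick_behavior(MissedTickBehavior::Skip);
    slow.set_missed_tick_behavior(MissedTickBehavior::Skip);

    loop {
        tokio::select! {
            _ = fast.tick() => {
                // one ? here for the JoinError; tasks that themselves return
                // a Result get the .await?? seen in the diff
                tokio::task::spawn_blocking(|| do_blocking_work("fast")).await?;
            }
            _ = slow.tick() => {
                tokio::task::spawn_blocking(|| do_blocking_work("slow")).await?;
            }
        }
    }
}
```

Because each arm awaits its blocking task before `select!` is polled again, a long stall (like the L0 compaction blocking noted in consumer.rs) delays the other tickers rather than queueing a backlog; `MissedTickBehavior::Skip` is what keeps that delay from turning into a burst of immediate ticks.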

Changed files
+111 -57
ufos
+1 -1
ufos/src/consumer.rs
···
const MAX_BATCH_SPAN_SECS: f64 = 60.; // hard limit of duration from oldest to latest event cursor within a batch, in seconds.
const SEND_TIMEOUT_S: f64 = 60.;
-const BATCH_QUEUE_SIZE: usize = 1024; // 4096 got OOM'd
+const BATCH_QUEUE_SIZE: usize = 512; // 4096 got OOM'd. update: 1024 also got OOM'd during L0 compaction blocking
#[derive(Debug)]
struct Batcher {
+110 -56
ufos/src/store.rs
···
use std::path::{Path, PathBuf};
use std::time::{Duration, Instant};
use tokio::sync::mpsc::Receiver;
-use tokio::time::sleep;
+use tokio::time::{interval_at, sleep};
/// Commit the RW batch immediately if this number of events have been read off the mod queue
const MAX_BATCHED_RW_EVENTS: usize = 18;
···
    /// Read-write loop reads from the queue for record-modifying events and does rollups
    pub async fn rw_loop(&self) -> anyhow::Result<()> {
        // TODO: lock so that only one rw loop can possibly be run. or even better, take a mutable resource thing to enforce at compile time.
-        loop {
-            sleep(Duration::from_secs_f64(0.1)).await; // todo: interval rate-limit instead
-            let db = &self.db;
-            let keyspace = db.keyspace.clone();
-            let partition = db.partition.clone();
+        let now = tokio::time::Instant::now();
+        let mut time_to_update_events = interval_at(now, Duration::from_secs_f64(0.051));
+        let mut time_to_trim_surplus = interval_at(
+            now + Duration::from_secs_f64(1.0),
+            Duration::from_secs_f64(3.3),
+        );
+        let mut time_to_roll_up = interval_at(
+            now + Duration::from_secs_f64(0.4),
+            Duration::from_secs_f64(0.9),
+        );
-            log::trace!("rw: spawn blocking for batch...");
-            tokio::task::spawn_blocking(move || -> anyhow::Result<()> {
-                log::trace!("rw: getting rw cursor...");
-                let mod_cursor = get_static::<ModCursorKey, ModCursorValue>(&partition)?
-                    .unwrap_or(Cursor::from_start());
-                let range = ModQueueItemKey::new(mod_cursor.clone()).range_to_prefix_end()?;
+        time_to_update_events.set_missed_tick_behavior(tokio::time::MissedTickBehavior::Skip);
+        time_to_trim_surplus.set_missed_tick_behavior(tokio::time::MissedTickBehavior::Skip);
+        time_to_roll_up.set_missed_tick_behavior(tokio::time::MissedTickBehavior::Skip);
-                let mut db_batch = keyspace.batch();
-                let mut batched_rw_items = 0;
-                let mut any_tasks_found = false;
+        loop {
+            let keyspace = self.db.keyspace.clone();
+            let partition = self.db.partition.clone();
+            tokio::select! {
+                _ = time_to_update_events.tick() => {
+                    log::debug!("beginning event update task");
+                    tokio::task::spawn_blocking(move || Self::update_events(keyspace, partition)).await??;
+                    log::debug!("finished event update task");
+                }
+                _ = time_to_trim_surplus.tick() => {
+                    log::debug!("beginning record trim task");
+                    tokio::task::spawn_blocking(move || Self::trim_old_events(keyspace, partition)).await??;
+                    log::debug!("finished record trim task");
+                }
+                _ = time_to_roll_up.tick() => {
+                    log::debug!("beginning rollup task");
+                    tokio::task::spawn_blocking(move || Self::roll_up_counts(keyspace, partition)).await??;
+                    log::debug!("finished rollup task");
+                },
+            }
+        }
+    }
-                log::trace!("rw: iterating newer rw items...");
+    fn update_events(keyspace: Keyspace, partition: PartitionHandle) -> anyhow::Result<()> {
+        // TODO: lock this to prevent concurrent rw
-                for (i, pair) in partition.range(range.clone()).enumerate() {
-                    log::trace!("rw: iterating {i}");
-                    any_tasks_found = true;
+        log::trace!("rw: getting rw cursor...");
+        let mod_cursor =
+            get_static::<ModCursorKey, ModCursorValue>(&partition)?.unwrap_or(Cursor::from_start());
+        let range = ModQueueItemKey::new(mod_cursor.clone()).range_to_prefix_end()?;
-                    if i >= MAX_BATCHED_RW_EVENTS {
-                        break;
-                    }
+        let mut db_batch = keyspace.batch();
+        let mut batched_rw_items = 0;
+        let mut any_tasks_found = false;
-                    let (key_bytes, val_bytes) = pair?;
-                    let mod_key = match db_complete::<ModQueueItemKey>(&key_bytes) {
-                        Ok(k) => k,
-                        Err(EncodingError::WrongStaticPrefix(_, _)) => {
-                            panic!("wsp: mod queue empty.");
-                        }
-                        otherwise => otherwise?,
-                    };
+        log::trace!("rw: iterating newer rw items...");
-                    let mod_value: ModQueueItemValue =
-                        db_complete::<ModQueueItemStringValue>(&val_bytes)?.try_into()?;
+        for (i, pair) in partition.range(range.clone()).enumerate() {
+            log::trace!("rw: iterating {i}");
+            any_tasks_found = true;
-                    log::trace!("rw: iterating {i}: sending to batcher {mod_key:?} => {mod_value:?}");
-                    batched_rw_items += DBWriter {
-                        keyspace: keyspace.clone(),
-                        partition: partition.clone(),
-                    }
-                    .write_rw(&mut db_batch, mod_key, mod_value)?;
-                    log::trace!("rw: iterating {i}: back from batcher.");
+            if i >= MAX_BATCHED_RW_EVENTS {
+                break;
+            }
-                    if batched_rw_items >= MAX_BATCHED_RW_ITEMS {
-                        log::trace!("rw: iterating {i}: batch big enough, breaking out.");
-                        break;
-                    }
+            let (key_bytes, val_bytes) = pair?;
+            let mod_key = match db_complete::<ModQueueItemKey>(&key_bytes) {
+                Ok(k) => k,
+                Err(EncodingError::WrongStaticPrefix(_, _)) => {
+                    panic!("wsp: mod queue empty.");
                }
+                otherwise => otherwise?,
+            };
+
+            let mod_value: ModQueueItemValue =
+                db_complete::<ModQueueItemStringValue>(&val_bytes)?.try_into()?;
-                if !any_tasks_found {
-                    log::trace!("rw: skipping batch commit since apparently no items were added (this is normal, skipping is new)");
-                    return Ok(());
-                }
+            log::trace!("rw: iterating {i}: sending to batcher {mod_key:?} => {mod_value:?}");
+            batched_rw_items += DBWriter {
+                keyspace: keyspace.clone(),
+                partition: partition.clone(),
+            }
+            .write_rw(&mut db_batch, mod_key, mod_value)?;
+            log::trace!("rw: iterating {i}: back from batcher.");
-                log::info!("rw: committing rw batch with {batched_rw_items} items (items != total inserts/deletes)...");
-                let r = db_batch.commit();
-                log::info!("rw: commit result: {r:?}");
-                r?;
-                Ok(())
-            })
-            .await??;
-            log::trace!("rw: back from blocking for rw...");
+            if batched_rw_items >= MAX_BATCHED_RW_ITEMS {
+                log::trace!("rw: iterating {i}: batch big enough, breaking out.");
+                break;
+            }
        }
-        // log::warn!("exited rw loop (rw task)");
+
+        if !any_tasks_found {
+            log::trace!("rw: skipping batch commit since apparently no items were added (this is normal, skipping is new)");
+            // TODO: is this missing a chance to update the cursor?
+            return Ok(());
+        }
+
+        log::info!("rw: committing rw batch with {batched_rw_items} items (items != total inserts/deletes)...");
+        let r = db_batch.commit();
+        log::info!("rw: commit result: {r:?}");
+        r?;
+        Ok(())
+    }
+
+    fn trim_old_events(_keyspace: Keyspace, _partition: PartitionHandle) -> anyhow::Result<()> {
+        // we *could* keep a collection dirty list in memory to reduce the amount of searching here
+        // actually can we use seen_by_js_cursor_collection??
+        // * ["seen_by_js_cursor_collection"|js_cursor|collection] => u64
+        // -> the rollup cursor could handle trims.
+
+        // key structure:
+        // * ["by_collection"|collection|js_cursor] => [did|rkey|record]
+
+        // *new* strategy:
+        // 1. collect `collection`s seen during rollup
+        // 2. for each collected collection:
+        // 3. set up prefix iterator
+        // 4. reverse and try to walk back MAX_RETAINED steps
+        // 5. if we didn't end iteration yet, start deleting records (and their forward links) until we get to the end
+
+        // ... we can probably do even better with cursor ranges too, since we'll have a cursor range from rollup and it's in the by_collection key
+
+        Ok(())
+    }
+
+    fn roll_up_counts(_keyspace: Keyspace, _partition: PartitionHandle) -> anyhow::Result<()> {
+        Ok(())
    }

    pub async fn get_collection_records(
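
The strategy comments in `trim_old_events` (reverse a per-collection prefix iterator, keep the newest `MAX_RETAINED` entries, delete everything older) could be fleshed out roughly like this. A sketch under assumptions: `MAX_RETAINED` and `by_collection_prefix` are hypothetical, and the double-ended `prefix()` iterator assumes a fjall-style API consistent with the `Keyspace`/`PartitionHandle`/`batch()` calls in the diff:

```rust
use fjall::{Keyspace, PartitionHandle};

const MAX_RETAINED: usize = 1000; // assumed per-collection retention limit

// hypothetical encoder for the ["by_collection"|collection|...] key prefix
fn by_collection_prefix(collection: &str) -> Vec<u8> {
    let mut prefix = b"by_collection\0".to_vec();
    prefix.extend_from_slice(collection.as_bytes());
    prefix.push(0);
    prefix
}

/// Delete all but the newest MAX_RETAINED records of one collection.
/// Key structure: ["by_collection"|collection|js_cursor] => [did|rkey|record]
fn trim_collection(
    keyspace: &Keyspace,
    partition: &PartitionHandle,
    collection: &str,
) -> anyhow::Result<usize> {
    let prefix = by_collection_prefix(collection);
    let mut batch = keyspace.batch();
    let mut deleted = 0;

    // js_cursor sorts ascending within the prefix, so iterating in reverse
    // walks newest-first: the first MAX_RETAINED entries are the keepers
    for (i, pair) in partition.prefix(&prefix).rev().enumerate() {
        let (key, _value) = pair?;
        if i < MAX_RETAINED {
            continue; // still inside the retention window
        }
        // past the window: delete the record (step 5 would also delete its
        // forward links, decoded from the [did|rkey|record] value)
        batch.remove(partition, key);
        deleted += 1;
    }

    batch.commit()?;
    Ok(deleted)
}
```

Collecting the dirty `collection` list during rollup (step 1) would then bound how many of these prefix scans run per trim tick.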