wasmcloud_host/wasmbus/
config.rs

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
//! Module with structs for use in managing and accessing config used by various wasmCloud entities
use std::{collections::HashMap, fmt::Debug, sync::Arc};

use anyhow::{bail, Context};
use async_nats::jetstream::kv::{Operation, Store};
use futures::{future::AbortHandle, stream::Abortable, TryStreamExt};
use tokio::sync::{
    watch::{self, Receiver, Sender},
    RwLock, RwLockReadGuard,
};
use tracing::{error, warn, Instrument};

type LockedConfig = Arc<RwLock<HashMap<String, String>>>;
/// A cache of named config mapped to an existing receiver
type WatchCache = Arc<RwLock<HashMap<String, Receiver<HashMap<String, String>>>>>;

/// A struct used for mapping a config name to a receiver for logging/tracing purposes
struct ConfigReceiver {
    pub name: String,
    pub receiver: Receiver<HashMap<String, String>>,
}

/// Helper struct that aborts on drop so we don't abort them when something is cloned in an arc. It
/// will only abort after the last arc has been dropped.
#[derive(Default)]
struct AbortHandles {
    handles: Vec<AbortHandle>,
}

impl Drop for AbortHandles {
    fn drop(&mut self) {
        for handle in &self.handles {
            handle.abort();
        }
    }
}

/// A merged bundle of configuration for use with components that watches for updates to all named
/// configs specified.
///
/// There are two main ways to get config from this struct:
///
/// 1. You can call [`get_config`](ConfigBundle::get_config) which will return a reference to the
///    merged config. This is mainly for use in components, which will fetch needed config on demand
/// 2. You can call [`changed`](ConfigBundle::changed) which will return a reference to the merged
///    config. This is for use in situations where you want to be notified when a config changes,
///    such as for a provider that needs to be notified when a config changes
pub struct ConfigBundle {
    /// A live view of the configuration that is being managed/updated by this bundle
    merged_config: LockedConfig,
    /// Names of named config that contribute to this bundle
    config_names: Vec<String>,
    /// A receiver that fires when changes are made to the bundle
    changed_receiver: Receiver<()>,
    /// Abort handles to the tasks that are watching for updates
    ///
    /// These are `drop()`ed when the bundle is dropped
    _handles: Arc<AbortHandles>,
    /// The sender that is used to notify the receiver that the config has changed, this
    /// must not be dropped until the receiver is dropped so we ensure it's kept alive
    _changed_notifier: Arc<Sender<()>>,
}

impl Clone for ConfigBundle {
    fn clone(&self) -> Self {
        // Cloning marks the value in the new receiver as seen, so we mark it as unseen, even if it
        // was already viewed before cloning. This ensures that the newly cloned bundle will return
        // the current config rather than needing to wait for a change.
        let mut changed_receiver = self.changed_receiver.clone();
        changed_receiver.mark_changed();
        ConfigBundle {
            merged_config: self.merged_config.clone(),
            config_names: self.config_names.clone(),
            changed_receiver,
            _changed_notifier: self._changed_notifier.clone(),
            _handles: self._handles.clone(),
        }
    }
}

impl Debug for ConfigBundle {
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        f.debug_struct("ConfigBundle")
            .field("merged_config", &self.merged_config)
            .finish()
    }
}

impl ConfigBundle {
    /// Create a new config bundle.
    ///
    /// It takes an ordered list of receivers that should match the
    /// order of config given by the user.
    ///
    /// This is only called internally.
    #[must_use]
    async fn new(receivers: Vec<ConfigReceiver>) -> Self {
        // Generate the initial abort handles so we can construct the bundle
        let (abort_handles, mut registrations): (Vec<_>, Vec<_>) =
            std::iter::repeat_with(AbortHandle::new_pair)
                .take(receivers.len())
                .unzip();
        // Now that we've set initial config, create the bundle and update the merged config with the latest values
        let (changed_notifier, changed_receiver) = watch::channel(());
        let changed_notifier = Arc::new(changed_notifier);
        let mut bundle = ConfigBundle {
            merged_config: Arc::default(),
            config_names: receivers.iter().map(|r| r.name.clone()).collect(),
            changed_receiver,
            _changed_notifier: changed_notifier.clone(),
            _handles: Arc::new(AbortHandles {
                handles: abort_handles,
            }),
        };
        let ordered_configs: Arc<Vec<Receiver<HashMap<String, String>>>> =
            Arc::new(receivers.iter().map(|r| r.receiver.clone()).collect());
        update_merge(&bundle.merged_config, &changed_notifier, &ordered_configs).await;
        // Move all the receivers into spawned tasks to update the config
        for ConfigReceiver { name, mut receiver } in receivers {
            // SAFETY: We know we have the right amount of registrations because we just created
            // them using the len above
            let reg = registrations
                .pop()
                .expect("missing registration, this is developer error");
            let cloned_name = name.clone();
            let ordered_receivers = ordered_configs.clone();
            let merged_config = bundle.merged_config.clone();
            let notifier = changed_notifier.clone();
            tokio::spawn(
                Abortable::new(
                    async move {
                        loop {
                            match receiver.changed().await {
                                Ok(()) => {
                                    update_merge(&merged_config, &notifier, &ordered_receivers)
                                        .await;
                                }
                                Err(e) => {
                                    warn!(error = %e, %name, "config sender dropped, updates will not be delivered");
                                    return;
                                }
                            }
                        }
                    },
                    reg,
                )
                .instrument(tracing::trace_span!("config_update", name = %cloned_name)),
            );
        }
        // More likely than not, there will be a new value in the watch channel because we always
        // read the latest value from the store before putting it here. But just in case, this
        // ensures that the newly create bundle will return the current config rather than needing
        // to wait for a change.
        bundle.changed_receiver.mark_changed();
        bundle
    }

    /// Returns a reference to the merged config behind a lock guard. This guard must be dropped
    /// when you are no longer consuming the config
    pub async fn get_config(&self) -> RwLockReadGuard<'_, HashMap<String, String>> {
        self.merged_config.read().await
    }

    /// Waits for the config to change and returns a reference to the merged config behind a lock
    /// guard. This guard must be dropped when you are no longer consuming the config.
    ///
    /// Please note that this requires a mutable borrow in order to manage underlying notification
    /// acknowledgement.
    pub async fn changed(
        &mut self,
    ) -> anyhow::Result<RwLockReadGuard<'_, HashMap<String, String>>> {
        // NOTE(thomastaylor312): We use a watch channel here because we want everything to get
        // notified individually (including clones) if config changes. Notify doesn't quite work
        // because we have to have a permit existing when we create otherwise the notify_watchers
        // won't actually get picked up (that only happens with notify_one).
        if let Err(e) = self.changed_receiver.changed().await {
            // If we get here, it likely means that a whole bunch of stuff has failed above it.
            // Might be worth changing this to a panic
            error!(error = %e, "Config changed receiver errored, this means that the config sender has dropped and the whole bundle has failed");
            bail!("failed to read receiver: {e}");
        }
        Ok(self.merged_config.read().await)
    }

    /// Returns a reference to the ordered list of config names handled by this bundle
    #[must_use]
    pub fn config_names(&self) -> &Vec<String> {
        &self.config_names
    }
}

/// A struct used for generating a config bundle given a list of named configs
#[derive(Clone)]
pub struct BundleGenerator {
    store: Store,
    watch_cache: WatchCache,
    watch_handles: Arc<RwLock<AbortHandles>>,
}

impl BundleGenerator {
    /// Create a new bundle generator
    #[must_use]
    pub fn new(store: Store) -> Self {
        Self {
            store,
            watch_cache: Arc::default(),
            watch_handles: Arc::default(),
        }
    }

    /// Generate a new config bundle. Will return an error if any of the configs do not exist or if
    /// there was an error fetching the initial config
    pub async fn generate(&self, config_names: Vec<String>) -> anyhow::Result<ConfigBundle> {
        let receivers: Vec<ConfigReceiver> =
            futures::future::join_all(config_names.into_iter().map(|name| self.get_receiver(name)))
                .await
                .into_iter()
                .collect::<anyhow::Result<_>>()?;
        Ok(ConfigBundle::new(receivers).await)
    }

    async fn get_receiver(&self, name: String) -> anyhow::Result<ConfigReceiver> {
        // First check the cache to see if we already have a receiver for this config
        if let Some(receiver) = self.watch_cache.read().await.get(&name) {
            return Ok(ConfigReceiver {
                name,
                receiver: receiver.clone(),
            });
        }

        // We need to actually try and fetch the config here. If we don't do this, then a watch will
        // just blindly watch even if the key doesn't exist. We should return an error if the config
        // doesn't exist or has data issues. It also allows us to set the intitial value
        let config: HashMap<String, String> = match self.store.get(&name).await {
            Ok(Some(data)) => serde_json::from_slice(&data)
                .context("Data corruption error, unable to decode data from store")?,
            Ok(None) => return Err(anyhow::anyhow!("Config {} does not exist", name)),
            Err(e) => return Err(anyhow::anyhow!("Error fetching config {}: {}", name, e)),
        };

        // Otherwise we need to setup the watcher. We start by setting up the watch so we don't miss
        // any events after we query the initial config
        let (tx, rx) = watch::channel(config);
        let (done, wait) = tokio::sync::oneshot::channel();
        let (handle, reg) = AbortHandle::new_pair();
        tokio::task::spawn(Abortable::new(
            watcher_loop(self.store.clone(), name.clone(), tx, done),
            reg,
        ));

        wait.await
            .context("Error waiting for watcher to start")?
            .context("Error waiting for watcher to start")?;

        // NOTE(thomastaylor312): We should probably find a way to clear out this cache. The Sender
        // part of the channel can tell you how many receivers it has, but we pass that along to the
        // watcher, so there would need to be more work to expose that, probably via a struct. We
        // could also do something with a resource counter and track that way with a cleanup task.
        // But for now going the easy route as we already cache everything anyway
        self.watch_handles.write().await.handles.push(handle);
        self.watch_cache
            .write()
            .await
            .insert(name.clone(), rx.clone());

        Ok(ConfigReceiver { name, receiver: rx })
    }
}

async fn watcher_loop(
    store: Store,
    name: String,
    tx: watch::Sender<HashMap<String, String>>,
    done: tokio::sync::oneshot::Sender<anyhow::Result<()>>,
) {
    // We need to watch with history so we can get the initial config.
    let mut watcher = match store.watch(&name).await {
        Ok(watcher) => {
            done.send(Ok(())).expect(
                "Receiver for watcher setup should not have been dropped. This is programmer error",
            );
            watcher
        }
        Err(e) => {
            done.send(Err(anyhow::anyhow!(
                "Error setting up watcher for {}: {}",
                name,
                e
            )))
            .expect(
                "Receiver for watcher setup should not have been dropped. This is programmer error",
            );
            return;
        }
    };
    loop {
        match watcher.try_next().await {
            Ok(Some(entry)) if matches!(entry.operation, Operation::Delete | Operation::Purge) => {
                // NOTE(thomastaylor312): We should probably do something and notify something up
                // the chain if we get a delete or purge event of a config that is still being used.
                // For now we just zero it out
                tx.send_replace(HashMap::new());
            }
            Ok(Some(entry)) => {
                let config: HashMap<String, String> = match serde_json::from_slice(&entry.value) {
                    Ok(config) => config,
                    Err(e) => {
                        error!(%name, error = %e, "Error decoding config from store during watch");
                        continue;
                    }
                };
                tx.send_if_modified(|current| {
                    if current == &config {
                        false
                    } else {
                        *current = config;
                        true
                    }
                });
            }
            Ok(None) => {
                error!(%name, "Watcher for config has closed");
                return;
            }
            Err(e) => {
                error!(%name, error = %e, "Error reading from watcher for config. Will wait for next entry");
                continue;
            }
        }
    }
}

async fn update_merge(
    merged_config: &RwLock<HashMap<String, String>>,
    changed_notifier: &Sender<()>,
    ordered_receivers: &[Receiver<HashMap<String, String>>],
) {
    // We get a write lock to start so nothing else can update the merged config while we merge
    // in the other configs (e.g. when one of the ordered configs is write locked)
    let mut hashmap = merged_config.write().await;
    hashmap.clear();

    // NOTE(thomastaylor312): There is a possible optimization here where we could just create a
    // temporary hashmap of borrowed strings and then after extending everything we could
    // into_iter it and clone it into the final hashmap. This would avoid extra allocations at
    // the cost of a few more iterations
    for recv in ordered_receivers {
        hashmap.extend(recv.borrow().clone());
    }
    // Send a notification that the config has changed
    changed_notifier.send_replace(());
}

#[cfg(test)]
mod tests {
    use super::*;
    use std::time::Duration;

    use tokio::sync::watch;

    #[tokio::test]
    async fn test_config_bundle() {
        let (foo_tx, foo_rx) =
            watch::channel(HashMap::from([("foo".to_string(), "bar".to_string())]));
        let (bar_tx, bar_rx) = watch::channel(HashMap::new());
        let (baz_tx, baz_rx) = watch::channel(HashMap::new());

        let mut bundle = ConfigBundle::new(vec![
            ConfigReceiver {
                name: "foo".to_string(),
                receiver: foo_rx,
            },
            ConfigReceiver {
                name: "bar".to_string(),
                receiver: bar_rx,
            },
            ConfigReceiver {
                name: "baz".to_string(),
                receiver: baz_rx,
            },
        ])
        .await;

        // We should be able to get the initial config before sending anything
        assert_eq!(
            *bundle.get_config().await,
            HashMap::from([("foo".to_string(), "bar".to_string())])
        );

        // Should also be able to get a value from the changed method immediately
        let _ = tokio::time::timeout(Duration::from_millis(50), bundle.changed())
            .await
            .expect("Should have received a config");

        // Update the bar config to overwrite the foo config
        bar_tx.send_replace(HashMap::from([("foo".to_string(), "baz".to_string())]));
        // Wait for the new config to come. This calls the same underlying method as get_config
        let conf = tokio::time::timeout(Duration::from_millis(50), bundle.changed())
            .await
            .expect("conf should have been present")
            .expect("Should have received a config");
        assert_eq!(
            *conf,
            HashMap::from([("foo".to_string(), "baz".to_string())])
        );
        drop(conf);

        // Update the baz config with additional data
        baz_tx.send_replace(HashMap::from([("star".to_string(), "wars".to_string())]));
        let conf = tokio::time::timeout(Duration::from_millis(50), bundle.changed())
            .await
            .expect("conf should have been present")
            .expect("Should have received a config");
        assert_eq!(
            *conf,
            HashMap::from([
                ("foo".to_string(), "baz".to_string()),
                ("star".to_string(), "wars".to_string())
            ])
        );
        drop(conf);

        // Update foo config with additional data
        foo_tx.send_replace(HashMap::from([
            ("starship".to_string(), "troopers".to_string()),
            ("foo".to_string(), "bar".to_string()),
        ]));
        let conf = tokio::time::timeout(Duration::from_millis(50), bundle.changed())
            .await
            .expect("conf should have been present")
            .expect("Should have received a config");
        // Check that the config merged correctly
        assert_eq!(
            *conf,
            HashMap::from([
                ("foo".to_string(), "baz".to_string()),
                ("star".to_string(), "wars".to_string()),
                ("starship".to_string(), "troopers".to_string())
            ]),
        );
    }
}