-
Notifications
You must be signed in to change notification settings - Fork 102
/
topic_matcher.rs
678 lines (594 loc) · 21.3 KB
/
topic_matcher.rs
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
// topic_matcher.rs
//
// Code to match MQTT topics to filters that may contain wildcards.
//
// This file is part of the Eclipse Paho MQTT Rust Client library.
//
/*******************************************************************************
* Copyright (c) 2021-2024 Frank Pagliughi <[email protected]>
* Copyright (c) 2024 Altair Bueno <[email protected]>
*
* All rights reserved. This program and the accompanying materials
* are made available under the terms of the Eclipse Public License v2.0
* and Eclipse Distribution License v1.0 which accompany this distribution.
*
* The Eclipse Public License is available at
* http://www.eclipse.org/legal/epl-v20.html
* and the Eclipse Distribution License is available at
* http://www.eclipse.org/org/documents/edl-v10.php.
*
* Contributors:
* Frank Pagliughi - TopicFilter trie collection
* Altair Bueno - TopicFilterExt trait and topic matches functions
*******************************************************************************/
//! Code to match MQTT topics to filters that may contain wildcards.
use std::{collections::HashMap, str::Split};
/////////////////////////////////////////////////////////////////////////////
// Utility functions
/// Checks if a filter matches a given topic.
///
/// # Example
///
/// ```
/// # use paho_mqtt::topic_matcher::topic_matches;
/// assert!(topic_matches("a/+/c", "a/b/c"));
/// assert!(topic_matches("a/#", "a/b/d"));
/// ```
pub fn topic_matches(filter: &str, topic: &str) -> bool {
topic_matches_iter(filter.split('/'), topic.split('/'))
}
/// Checks if a split filter matches a given split topic.
///
/// # Example
///
/// ```
/// # use paho_mqtt::topic_matcher::topic_matches_iter;
/// assert!(topic_matches_iter(["a", "+", "c"], ["a", "b", "c"]));
/// assert!(topic_matches_iter(["a", "#"], ["a", "b", "d"]));
/// ```
pub fn topic_matches_iter<'a>(
filter: impl IntoIterator<Item = &'a str>,
topic: impl IntoIterator<Item = &'a str>,
) -> bool {
let mut filter = filter.into_iter().peekable();
let mut topic = topic.into_iter().peekable();
// Topics starting with '$' don't match a wildcard in the first field.
// See https://docs.oasis-open.org/mqtt/mqtt/v5.0/os/mqtt-v5.0-os.html#_Toc3901246
if matches!(filter.peek(), Some(&"#" | &"+"))
&& matches!(topic.peek(), Some(x) if x.starts_with('$'))
{
return false;
}
loop {
let filter_level = filter.next();
let topic_level = topic.next();
match (filter_level, topic_level) {
// Exhausted both filter and topic
(None, None) => return true,
// Wildcard on filter
(Some("#"), _) => return true,
// Single level wildcard on filter
(Some("+"), Some(_)) => continue,
// Equal levels
(Some(filter), Some(topic)) if filter == topic => continue,
// Otherwise, no match
_ => return false,
}
}
}
/// Extension trait for map types and tuple iterators that allows to filter
/// entries by matching a MQTT topic.
///
/// # Example
///
/// ```
/// # use std::collections::{HashMap, HashSet};
/// # use paho_mqtt::topic_matcher::TopicMatcherExt as _;
///
/// let mut matcher = HashMap::<&str, &str>::new();
/// matcher.insert("00:00:00:00:00:00/+/+/rpc", "_/device_type/systemid/_");
/// matcher.insert("00:00:00:00:00:00/+/+/+/rpc", "_/device_type/systemid/zoneid/_");
/// matcher.insert("00:00:00:00:00:00/+/rpc", "_/device_type/_");
/// matcher.insert("00:00:00:00:00:00/rpc", "");
///
/// let topic = "00:00:00:00:00:00/humidifier/1/rpc";
/// let matches: HashSet<_> = matcher.matches(topic).collect();
/// assert_eq!(
/// matches,
/// HashSet::from([("00:00:00:00:00:00/+/+/rpc", "_/device_type/systemid/_")])
/// );
/// ```
pub trait TopicMatcherExt {
/// The key type returned by the iterator.
type Key;
/// The value type returned by the iterator.
type Value;
/// Matches the given topic against the keys of the map and returns an
/// iterator over the matching entries. Keys of the map are expected to
/// be MQTT topic filter patterns and may contain wildcards.
fn matches<'topic>(
self,
topic: &'topic str,
) -> impl Iterator<Item = (Self::Key, Self::Value)> + 'topic
where
Self: 'topic;
}
impl<K, V, C> TopicMatcherExt for C
where
C: IntoIterator<Item = (K, V)>,
K: AsRef<str>,
{
type Key = K;
type Value = V;
fn matches<'topic>(
self,
topic: &'topic str,
) -> impl Iterator<Item = (Self::Key, Self::Value)> + 'topic
where
Self: 'topic,
{
self.into_iter()
.filter(move |(pattern, _)| topic_matches(pattern.as_ref(), topic))
}
}
/////////////////////////////////////////////////////////////////////////////
// Node (for TopicMatcher)
/// A single node in the topic matcher trie collection.
///
/// A terminal (leaf) node has some `content`, whereas intermediate nodes
/// do not. We also cache the full topic at the leaf. This should allow for
/// more efficient searches through the collection, so that the iterators
/// don't have to keep the stack of keys that lead down to the final leaf.
///
#[derive(Debug)]
struct Node<T> {
/// The value that matches the topic at this node, if any.
/// This includes a cached value of the filter to this node.
value: Option<(String, T)>,
/// The explicit, non-wildcard child nodes mapped by the next field
/// of the topic.
children: HashMap<Box<str>, Node<T>>,
}
impl<T> Node<T> {
/// Determines if the node does not contain a value.
fn is_empty(&self) -> bool {
self.value.is_none() && self.children.is_empty()
}
/// Gets an iterator for the node and all its children.
fn iter(&self) -> NodeIter<T> {
Box::new(
self.value
.iter()
.map(|(k, v)| (k.as_str(), v))
.chain(self.children.values().flat_map(|n| n.iter())),
)
}
/// Gets a mutable iterator for the node and all its children.
fn iter_mut(&mut self) -> NodeIterMut<T> {
Box::new(
self.value
.iter_mut()
.map(|(k, v)| (k.as_str(), v))
.chain(self.children.values_mut().flat_map(|n| n.iter_mut())),
)
}
/// Removes empty child nodes.
fn prune(&mut self) {
// Recursively prune children
for node in &mut self.children.values_mut() {
node.shrink_to_fit();
}
// Remove empty children and shrink the has hmaps
self.children.retain(|_, node| !node.is_empty());
}
/// Removes empty child nodes and shrinks the capacity of the
/// collection as much as possible.
fn shrink_to_fit(&mut self) {
// Recursively shrink children
for node in self.children.values_mut() {
node.shrink_to_fit();
}
// Remove empty children and shrink the has hmaps
self.children.retain(|_, node| !node.is_empty());
self.children.shrink_to_fit();
}
}
// We manually implement Default, otherwise the derived one
// would require T: Default.
impl<T> Default for Node<T> {
/// Creates a default, empty node.
fn default() -> Self {
Node {
value: None,
children: HashMap::new(),
}
}
}
/// An iterator type to visit all values in a node and its children.
type NodeIter<'a, T> = Box<dyn Iterator<Item = (&'a str, &'a T)> + 'a>;
/// A mutable iterator type to visit all values in a node and its children.
type NodeIterMut<'a, T> = Box<dyn Iterator<Item = (&'a str, &'a mut T)> + 'a>;
/////////////////////////////////////////////////////////////////////////////
// TopicMatcher
/// A trie collection of topic filters to arbitrary objects.
///
/// This can be used to get an iterator to all items that have a filter that
/// matches a topic. To test against a single filter, see
/// [`TopicFilter`](crate::TopicFilter). This collection is more commonly
/// used when there are a nuber of filters and each needs to be associated
/// with a particular action or piece of data. A single incoming topic could
/// match against several items in the collection.
///
/// For example, the topic:
/// ```text
/// data/temperature/engine
/// ```
/// Could match against the filters:
/// ```text
/// data/temperature/engine
/// data/temperature/#
/// data/+/engine
/// ```
///
/// Thus, the collection gives an iterator for the items matching a topic.
///
/// A common use for this would be to store callbacks to proces incoming
/// messages based on topics, but note that there might be an issue with
/// overlapped subscriptions where callbacks are invoked multiple times for
/// a message that matches more than one subscription.
///
/// This code was adapted from the Eclipse Python `MQTTMatcher` class:
/// <https://github.com/eclipse/paho.mqtt.python/blob/master/src/paho/mqtt/matcher.py>
///
/// which use a prefix tree (trie) to store the values.
///
///
/// When using MQTT v5, subscription identifiers would be more efficient
/// and also solve the problem of multiple overlapped callbacks. See:
/// <https://github.com/eclipse/paho.mqtt.rust/blob/master/examples/sync_consume_v5.rs>
///
#[derive(Debug)]
pub struct TopicMatcher<T> {
root: Node<T>,
}
impl<T> TopicMatcher<T> {
/// Creates a new, empty, topic matcher collection.
pub fn new() -> Self {
Self::default()
}
/// Determines if the collection contains no values.
pub fn is_empty(&self) -> bool {
self.root.is_empty()
}
/// Clears all the entries in the collection
pub fn clear(&mut self) {
self.root = Node::default();
}
/// Inserts a new topic filter into the collection.
pub fn insert<S>(&mut self, filter: S, val: T)
where
S: Into<String>,
{
let filter = filter.into();
let mut curr = &mut self.root;
for field in filter.split('/') {
curr = curr.children.entry(field.into()).or_default()
}
curr.value = Some((filter, val));
}
/// Returns a reference to a value from the collection using an exact
/// filter match.
pub fn get(&self, topic: &str) -> Option<&T> {
let mut curr = &self.root;
for field in topic.split('/') {
curr = match curr.children.get(field) {
Some(node) => node,
None => return None,
};
}
curr.value.as_ref().map(|(_, v)| v)
}
/// Gets a mutable mutable reference to a value from the collection
/// using an exact filter match.
pub fn get_mut(&mut self, topic: &str) -> Option<&mut T> {
let mut curr = &mut self.root;
for field in topic.split('/') {
curr = match curr.children.get_mut(field) {
Some(node) => node,
None => return None,
};
}
curr.value.as_mut().map(|(_, v)| v)
}
/// Removes the entry, returning the value for it, if found.
///
/// This removes the value from the internal node, but leaves the node
/// even if it's empty. To remove empty nodes, use [`prune`](Self::prune)
/// or [`shrink_to_fit`](Self::shrink_to_fit).
///
pub fn remove(&mut self, topic: &str) -> Option<T> {
let mut curr = &mut self.root;
for field in topic.split('/') {
curr = match curr.children.get_mut(field) {
Some(node) => node,
None => return None,
};
}
curr.value.take().map(|(_, v)| v)
}
/// Removes empty nodes in the collection.
pub fn prune(&mut self) {
self.root.prune()
}
/// Removes ampty nodes and shrinks the capacity of the collection
/// as much as possible.
pub fn shrink_to_fit(&mut self) {
self.root.shrink_to_fit()
}
/// Gets an iterator over all the items in the collection.
pub fn iter(&self) -> NodeIter<T> {
self.root.iter()
}
/// Gets a muable iterator over all the items in the collection.
pub fn iter_mut(&mut self) -> NodeIterMut<T> {
self.root.iter_mut()
}
/// Gets an iterator for all the matches to the specified topic
pub fn matches<'a, 'b>(&'a self, topic: &'b str) -> MatchIter<'a, 'b, T> {
MatchIter::new(&self.root, topic)
}
/// Determines if the topic matches any of the filters in the collection.
pub fn has_match(&self, topic: &str) -> bool {
self.matches(topic).next().is_some()
}
}
// We manually implement Default, otherwise the derived one
// would require T: Default.
impl<T> Default for TopicMatcher<T> {
/// Create an empty TopicMatcher collection.
fn default() -> Self {
TopicMatcher {
root: Node::default(),
}
}
}
impl<'a, T: 'a> IntoIterator for &'a TopicMatcher<T> {
type Item = (&'a str, &'a T);
type IntoIter = NodeIter<'a, T>;
fn into_iter(self) -> Self::IntoIter {
self.iter()
}
}
impl<'a, T: 'a> IntoIterator for &'a mut TopicMatcher<T> {
type Item = (&'a str, &'a mut T);
type IntoIter = NodeIterMut<'a, T>;
fn into_iter(self) -> Self::IntoIter {
self.iter_mut()
}
}
/////////////////////////////////////////////////////////////////////////////
/// Iterator for the topic matcher collection.
///
/// This is created from a specific topic string and will find the contents
/// of all the matching filters in the collection.
/// Lifetimes:
/// 'a - The matcher collection
/// 'b - The topic string
///
/// We keep a stack of nodes that still need to be searched. For each node,
/// there is also an iterator stack of fields for that node to search.
#[derive(Debug)]
pub struct MatchIter<'a, 'b, T> {
// The nodes still to be processed.
// The tuple is (current node, remaining topic fields, if first node)
remaining: Vec<(&'a Node<T>, Split<'b, char>, bool)>,
}
impl<'a, 'b, T> MatchIter<'a, 'b, T> {
fn new(node: &'a Node<T>, topic: &'b str) -> Self {
let fields = topic.split('/');
Self {
remaining: vec![(node, fields, true)],
}
}
}
impl<'a, 'b, T> Iterator for MatchIter<'a, 'b, T> {
type Item = (&'a str, &'a T);
/// Gets the next value that matches the iterator's topic.
fn next(&mut self) -> Option<Self::Item> {
let (node, mut fields, first) = match self.remaining.pop() {
Some(val) => val,
None => return None,
};
let field = match fields.next() {
Some(field) => field,
None => {
return node
.value
.as_ref()
.map(|(k, v)| (k.as_str(), v))
.or_else(|| self.next())
}
};
if let Some(child) = node.children.get(field) {
self.remaining.push((child, fields.clone(), false));
}
// A topic starting with '$' doesn't match wildcards
// https://docs.oasis-open.org/mqtt/mqtt/v5.0/os/mqtt-v5.0-os.html#_Toc3901246
if !first || !field.starts_with('$') {
if let Some(child) = node.children.get("+") {
self.remaining.push((child, fields, false))
}
if let Some(child) = node.children.get("#") {
// By protocol definition, a '#' must be a terminating leaf.
return child.value.as_ref().map(|(k, v)| (k.as_str(), v));
}
}
self.next()
}
}
/// Macro to create a [`TopicMatcher`] collection.
#[macro_export]
macro_rules! topic_matcher {
{ $($filter:expr => $val:expr),+ } => {
{
let mut tm = $crate::topic_matcher::TopicMatcher::new();
$(
tm.insert($filter, $val);
)+
tm
}
};
}
/////////////////////////////////////////////////////////////////////////////
// Unit Tests
/////////////////////////////////////////////////////////////////////////////
#[cfg(test)]
mod tests {
use super::*;
use std::collections::HashSet;
#[test]
fn test_basic_topic_matcher() {
let tm: TopicMatcher<i32> = topic_matcher! {
"some/test/#" => 99,
"some/test/topic" => 19,
"some/+/topic" => 42,
"some/prod/topic" => 155
};
assert_eq!(tm.get("some/test/topic"), Some(&19));
assert_eq!(tm.get("some/test/bubba"), None);
assert!(tm.has_match("some/random/topic"));
assert!(!tm.has_match("some/other/thing"));
// Test the iterator
let set = HashSet::from([19, 42, 99]);
let mut match_set = HashSet::new();
for (_k, v) in tm.matches("some/test/topic") {
match_set.insert(*v);
}
assert_eq!(set, match_set);
// Weird corner case
let tm = topic_matcher! {
"hello/#" => 99,
"hi/there" => 13,
"hello/world" => 42,
"hello/there/bubba" => 96,
"hello/+/bubba" => 27
};
assert_eq!(2, tm.matches("hello/world").count());
}
#[test]
fn test_topic_matcher() {
use crate::topic_matcher as tm;
// Should match
assert!(tm! {"foo/bar" => ()}.has_match("foo/bar"));
assert!(tm! {"foo/+" => ()}.has_match("foo/bar"));
assert!(tm! {"foo/+/baz" => ()}.has_match("foo/bar/baz"));
assert!(tm! {"foo/+/#"=> ()}.has_match("foo/bar/baz"));
assert!(tm! {"A/B/+/#"=> ()}.has_match("A/B/B/C"));
assert!(tm! {"#"=> ()}.has_match("foo/bar/baz"));
assert!(tm! {"#"=> ()}.has_match("/foo/bar"));
assert!(tm! {"/#"=> ()}.has_match("/foo/bar"));
assert!(tm! {"$SYS/bar"=> ()}.has_match("$SYS/bar"));
assert!(tm! {"foo/#"=> ()}.has_match("foo/$bar"));
assert!(tm! {"foo/+/baz"=> ()}.has_match("foo/$bar/baz"));
// Should not match
assert!(!tm! {"test/6/#"=> ()}.has_match("test/3"));
assert!(!tm! {"foo/bar"=> ()}.has_match("foo"));
assert!(!tm! {"foo/+"=> ()}.has_match("foo/bar/baz"));
assert!(!tm! {"foo/+/baz"=> ()}.has_match("foo/bar/bar"));
assert!(!tm! {"foo/+/#"=> ()}.has_match("fo2/bar/baz"));
assert!(!tm! {"/#"=> ()}.has_match("foo/bar"));
assert!(!tm! {"#"=> ()}.has_match("$SYS/bar"));
assert!(!tm! {"$BOB/bar"=> ()}.has_match("$SYS/bar"));
assert!(!tm! {"+/bar"=> ()}.has_match("$SYS/bar"));
}
#[test]
fn test_topic_matcher_callback() {
let mut matcher = TopicMatcher::new();
matcher.insert("some/+/topic", Box::new(|n: u32| n * 2));
for (_t, f) in matcher.matches("some/random/topic") {
let n = f(2);
assert_eq!(n, 4);
}
}
#[test]
fn assert_that_no_wildcards_matches() {
assert!(topic_matches("a/b/c", "a/b/c"));
assert!(topic_matches("foo/bar", "foo/bar"));
}
#[test]
fn assert_that_plus_wildcard_matches() {
assert!(topic_matches("a/+/c", "a/b/c"));
assert!(topic_matches("foo/+/baz", "foo/bar/baz"));
}
#[test]
fn assert_that_leading_plus_wildcard_matches() {
assert!(topic_matches("+/b/c", "a/b/c"));
}
#[test]
fn assert_that_trailing_plus_wildcard_matches() {
assert!(topic_matches("a/b/+", "a/b/c"));
assert!(topic_matches("foo/+", "foo/bar"));
}
#[test]
fn assert_that_hash_wildcard_matches_none_level() {
assert!(topic_matches("a/b/#", "a/b"));
}
#[test]
fn assert_that_hash_wildcard_matches_single_level() {
assert!(topic_matches("a/b/#", "a/b/c"));
}
#[test]
fn assert_that_hash_wildcard_matches_multiple_levels() {
assert!(topic_matches("a/b/#", "a/b/c/d"));
}
#[test]
fn assert_that_single_hash_matches_all() {
assert!(topic_matches("#", "foo/bar/baz"));
assert!(topic_matches("#", "/foo/bar"));
assert!(topic_matches("/#", "/foo/bar"));
}
#[test]
fn assert_that_plus_and_hash_wildcards_matches() {
assert!(topic_matches("foo/+/#", "foo/bar/baz"));
assert!(topic_matches("A/B/+/#", "A/B/B/C"));
}
#[test]
fn assert_that_sys_topic_matches() {
assert!(topic_matches("$SYS/bar", "$SYS/bar"));
}
#[test]
fn assert_that_non_first_levels_with_dollar_sign_matches_hash_wildcard() {
assert!(topic_matches("foo/#", "foo/$bar"));
}
#[test]
fn assert_that_non_first_levels_with_dollar_sign_matches_plus_wildcard() {
assert!(topic_matches("foo/+/baz", "foo/$bar/baz"));
}
#[test]
fn assert_that_different_levels_does_not_match() {
assert!(!topic_matches("test/6/#", "test/3"));
assert!(!topic_matches("foo/+/baz", "foo/bar/bar"));
assert!(!topic_matches("foo/+/#", "fo2/bar/baz"));
assert!(!topic_matches("$BOB/bar", "$SYS/bar"));
}
#[test]
fn assert_that_longer_topics_does_not_match() {
assert!(!topic_matches("foo/bar", "foo"));
}
#[test]
fn assert_that_plus_wildcard_does_not_match_multiple_levels() {
assert!(!topic_matches("foo/+", "foo/bar/baz"));
}
#[test]
fn assert_that_leading_slash_with_hash_wildcard_does_not_match_normal_topic() {
assert!(!topic_matches("/#", "foo/bar"));
}
#[test]
fn assert_that_hash_wildcard_does_not_match_an_internal_topic() {
assert!(!topic_matches("#", "$SYS/bar"));
}
#[test]
fn assert_that_plus_wildcard_does_not_match_an_internal_topic() {
assert!(!topic_matches("+/bar", "$SYS/bar"));
}
}