1
use std::{
2
    borrow::Borrow,
3
    collections::HashSet,
4
    fmt::Display,
5
    hash::Hash,
6
    ops::Deref,
7
    sync::{
8
        atomic::{self, AtomicBool},
9
        Arc, Mutex,
10
    },
11
};
12

            
13
static ACTIVE_SYMBOLS: Mutex<Option<Symbols>> = Mutex::new(None);
14

            
15
13153
fn with_active_symbols<T>(logic: impl FnOnce(&mut Symbols) -> T) -> T {
16
13153
    let mut symbols = ACTIVE_SYMBOLS.lock().expect("poisoned");
17
13153
    if symbols.is_none() {
18
157
        *symbols = Some(Symbols {
19
157
            active: HashSet::new(),
20
157
            slots: Vec::new(),
21
157
            free_slots: Vec::new(),
22
157
        });
23
12996
    }
24

            
25
13153
    logic(symbols.as_mut().expect("always initialized"))
26
13153
}
27

            
28
struct Symbols {
29
    active: HashSet<SharedData>,
30
    slots: Vec<Option<Symbol>>,
31
    free_slots: Vec<usize>,
32
}
33

            
34
/// A String-like type that ensures only one instance of each Symbol exists per
35
/// value, enabling quicker lookups by not requiring string comparisons.
36
///
37
/// After all instances of a given Symbol are dropped, the underlying storage is
38
/// released.
39
///
40
/// This type's [`Hash`] implementation is different than `String`'s hash
41
/// implementation. This type avoids implementing `Borrow<str>` to prevent using
42
/// strings to look up values in `HashMap`s/`HashSet`s where this type is used
43
/// as the key.
44
6945
#[derive(Debug, Clone)]
45
pub struct Symbol(SharedData);
46

            
47
impl Symbol {
48
    /// Returns this symbol's underlying representation.
49
    #[must_use]
50
2160
    pub fn as_str(&self) -> &str {
51
2160
        &self.0 .0.value
52
2160
    }
53
}
54

            
55
impl Hash for Symbol {
56
1032
    fn hash<H: std::hash::Hasher>(&self, state: &mut H) {
57
1032
        self.0 .0.index.hash(state);
58
1032
    }
59
}
60

            
61
impl Eq for Symbol {}
62

            
63
impl PartialEq for Symbol {
64
1911
    fn eq(&self, other: &Self) -> bool {
65
1911
        self.0 .0.index == other.0 .0.index
66
1911
    }
67
}
68

            
69
impl From<&Symbol> for Symbol {
70
    fn from(value: &Symbol) -> Self {
71
        value.clone()
72
    }
73
}
74

            
75
15404
#[derive(Debug, Clone)]
76
struct SharedData(Arc<Data>);
77

            
78
#[derive(Debug)]
79
struct Data {
80
    index: usize,
81
    value: String,
82
    freeing: AtomicBool,
83
}
84

            
85
impl Hash for SharedData {
86
9987
    fn hash<H: std::hash::Hasher>(&self, state: &mut H) {
87
9987
        self.0.value.hash(state);
88
9987
    }
89
}
90

            
91
impl Eq for SharedData {}
92

            
93
impl PartialEq for SharedData {
94
5009
    fn eq(&self, other: &Self) -> bool {
95
5009
        self.0.index == other.0.index
96
5009
    }
97
}
98

            
99
impl Display for Symbol {
100
100
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
101
100
        f.write_str(self)
102
100
    }
103
}
104

            
105
impl Borrow<str> for SharedData {
106
4096
    fn borrow(&self) -> &str {
107
4096
        &self.0.value
108
4096
    }
109
}
110

            
111
impl<'a> From<&'a str> for Symbol {
112
8459
    fn from(sym: &'a str) -> Self {
113
8459
        with_active_symbols(|symbols| {
114
8459
            if let Some(symbol) = symbols.active.get(sym).cloned() {
115
3779
                Symbol(symbol)
116
            } else {
117
4680
                let value = sym.to_string();
118

            
119
4680
                let index = if let Some(free_slot) = symbols.free_slots.pop() {
120
3858
                    free_slot
121
                } else {
122
822
                    let slot_id = symbols.slots.len();
123
822
                    symbols.slots.push(None);
124
822
                    slot_id
125
                };
126

            
127
4680
                let symbol = Symbol(SharedData(Arc::new(Data {
128
4680
                    index,
129
4680
                    value,
130
4680
                    freeing: AtomicBool::new(false),
131
4680
                })));
132
4680
                symbols.active.insert(symbol.0.clone());
133
4680
                symbols.slots[index] = Some(symbol.clone());
134
4680
                symbol
135
            }
136
8459
        })
137
8459
    }
138
}
139

            
140
impl Deref for Symbol {
141
    type Target = str;
142

            
143
11905
    fn deref(&self) -> &Self::Target {
144
11905
        &self.0 .0.value
145
11905
    }
146
}
147

            
148
impl PartialEq<str> for Symbol {
149
10686
    fn eq(&self, other: &str) -> bool {
150
10686
        &**self == other
151
10686
    }
152
}
153

            
154
impl<'a> PartialEq<&'a str> for Symbol {
155
552
    fn eq(&self, other: &&'a str) -> bool {
156
552
        self == *other
157
552
    }
158
}
159

            
160
impl Drop for SharedData {
161
39353
    fn drop(&mut self) {
162
39353
        // The main Symbols structure holds two strong references to the same
163
39353
        // Arc we hold. Thus, if we reach 3 strong count (our ref included), we
164
39353
        // need to remove the symbol so it can be freeed.
165
39353
        //
166
39353
        // We can use any form of atomics here because if the strong count is 3,
167
39353
        // we can be guaranteed the only thread able to free our data is this
168
39353
        // thread.
169
39353
        if Arc::strong_count(&self.0) == 3
170
9372
            && self
171
9372
                .0
172
9372
                .freeing
173
9372
                .compare_exchange(
174
9372
                    false,
175
9372
                    true,
176
9372
                    atomic::Ordering::Relaxed,
177
9372
                    atomic::Ordering::Relaxed,
178
9372
                )
179
9372
                .is_ok()
180
4692
        {
181
4692
            with_active_symbols(|symbols| {
182
4692
                // Check that the strong count hasn't changed. If it has, we
183
4692
                // need to allow the symbol to stay alive.
184
4692
                if Arc::strong_count(&self.0) > 3 {
185
12
                    self.0.freeing.store(false, atomic::Ordering::Relaxed);
186
4680
                } else {
187
4680
                    symbols.active.remove(self);
188
4680
                    symbols.slots[self.0.index] = None;
189
4680
                    symbols.free_slots.push(self.0.index);
190
4680
                }
191
4692
            });
192
34673
        }
193
39365
    }
194
}
195

            
196
1
#[test]
197
1
fn basics() {
198
1
    let first_symbol = Symbol::from("basics-test-symbol");
199
1
    let slot = first_symbol.0 .0.index;
200
1
    let first_again = Symbol::from("basics-test-symbol");
201
1
    assert_eq!(slot, first_again.0 .0.index);
202
1
    assert_eq!(first_symbol, first_again);
203
1
    drop(first_again);
204
1
    // Dropping the second copy shouldn't free the underlying symbol
205
1
    with_active_symbols(|symbols| {
206
1
        assert!(symbols.active.contains("basics-test-symbol"));
207
1
        assert!(!symbols.slots.is_empty());
208
1
        assert!(symbols.slots[slot].is_some());
209
5
        assert!(!symbols.free_slots.iter().any(|free| *free == slot));
210
1
    });
211
1
    drop(first_symbol);
212
1
    with_active_symbols(|symbols| {
213
1
        assert!(!symbols.active.contains("basics-test-symbol"));
214
1
        match &symbols.slots[slot] {
215
            Some(new_symbol) => {
216
                // This test isn't run in isolation, so other symbols may get
217
                // registered between the drop and this block. Very unlikely,
218
                // but possible.
219
                assert_ne!(new_symbol, "basics-test-symbol");
220
            }
221
            None => {
222
6
                assert!(symbols.free_slots.iter().any(|free| *free == slot));
223
            }
224
        }
225
1
    });
226
1
}