1
use std::{
2
    borrow::Cow,
3
    fmt::{Debug, Display, Write},
4
    sync::Arc,
5
};
6

            
7
use serde::{Deserialize, Serialize};
8

            
9
/// A schema name. Cloning is inexpensive.
10
96888497
#[derive(Hash, PartialEq, Eq, Deserialize, Serialize, Debug, Clone, Ord, PartialOrd)]
11
#[serde(try_from = "String")]
12
#[serde(into = "String")]
13
pub struct Name {
14
    name: Arc<Cow<'static, str>>,
15
    needs_escaping: bool,
16
}
17

            
18
/// A name was unable to e parsed.
19
#[derive(thiserror::Error, Debug, Serialize, Deserialize, Clone)]
20
#[error("invalid name: {0}")]
21
pub struct InvalidNameError(pub String);
22

            
23
impl Name {
24
    /// Creates a new name.
25
10157339
    pub fn new<T: Into<Self>>(contents: T) -> Self {
26
10157339
        contents.into()
27
10157339
    }
28

            
29
    /// Parses a name that was previously encoded via [`Self::encoded()`].
30
    ///
31
    /// # Errors
32
    ///
33
    /// Returns [`InvalidNameError`] if the name contains invalid escape
34
    /// sequences.
35
331
    pub fn parse_encoded(encoded: &str) -> Result<Self, InvalidNameError> {
36
331
        let mut bytes = encoded.bytes();
37
331
        let mut decoded = Vec::with_capacity(encoded.len());
38
3560
        while let Some(byte) = bytes.next() {
39
3233
            if byte == b'_' {
40
126
                if let (Some(high), Some(low)) = (bytes.next(), bytes.next()) {
41
123
                    if let Some(byte) = hex_chars_to_byte(high, low) {
42
122
                        decoded.push(byte);
43
122
                        continue;
44
1
                    }
45
3
                }
46
4
                return Err(InvalidNameError(encoded.to_string()));
47
3107
            }
48
3107

            
49
3107
            decoded.push(byte);
50
        }
51

            
52
327
        String::from_utf8(decoded)
53
327
            .map(Self::from)
54
327
            .map_err(|_| InvalidNameError(encoded.to_string()))
55
331
    }
56

            
57
    /// Returns an encoded version of this name that contains only alphanumeric
58
    /// ASCII, underscore, and hyphen.
59
    #[must_use]
60
1
    pub fn encoded(&self) -> String {
61
1
        format!("{:#}", self)
62
1
    }
63
}
64

            
65
impl From<Cow<'static, str>> for Name {
66
64609686
    fn from(value: Cow<'static, str>) -> Self {
67
64609686
        let needs_escaping = !value
68
64609686
            .bytes()
69
551889710
            .all(|b| b.is_ascii_alphanumeric() || b == b'-');
70
64609686
        Self {
71
64609686
            name: Arc::new(value),
72
64609686
            needs_escaping,
73
64609686
        }
74
64609686
    }
75
}
76

            
77
impl From<&'static str> for Name {
78
35660718
    fn from(value: &'static str) -> Self {
79
35660718
        Self::from(Cow::Borrowed(value))
80
35660718
    }
81
}
82

            
83
impl From<String> for Name {
84
3473189
    fn from(value: String) -> Self {
85
3473189
        Self::from(Cow::Owned(value))
86
3473189
    }
87
}
88

            
89
#[allow(clippy::from_over_into)] // the auto into impl doesn't work with serde(into)
90
impl Into<String> for Name {
91
6969253
    fn into(self) -> String {
92
6969253
        self.name.to_string()
93
6969253
    }
94
}
95

            
96
impl Display for Name {
97
13663161
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
98
13663161
        if f.alternate() && self.needs_escaping {
99
32243295
            for byte in self.name.bytes() {
100
32243295
                if byte.is_ascii_alphanumeric() || byte == b'-' {
101
28446494
                    f.write_char(byte as char)?;
102
                } else {
103
                    // Encode the byte as _FF
104
3795881
                    f.write_char('_')?;
105
3795881
                    f.write_char(nibble_to_hex_char(byte >> 4))?;
106
3795881
                    f.write_char(nibble_to_hex_char(byte & 0xF))?;
107
                }
108
            }
109
3795603
            Ok(())
110
        } else {
111
9868616
            Display::fmt(&self.name, f)
112
        }
113
13664219
    }
114
}
115

            
116
7591279
/// Converts a value in `0..=15` into its lowercase hexadecimal digit.
const fn nibble_to_hex_char(nibble: u8) -> char {
    let ascii = if nibble <= 9 {
        b'0' + nibble
    } else {
        // 10 maps to 'a', 11 to 'b', and so on.
        b'a' + nibble - 10
    };
    ascii as char
}
123

            
124
const fn hex_chars_to_byte(high_nibble: u8, low_nibble: u8) -> Option<u8> {
125
    match (
126
123
        hex_char_to_nibble(high_nibble),
127
123
        hex_char_to_nibble(low_nibble),
128
    ) {
129
122
        (Some(high_nibble), Some(low_nibble)) => Some(high_nibble << 4 | low_nibble),
130
1
        _ => None,
131
    }
132
123
}
133

            
134
246
/// Converts an ASCII hexadecimal digit (`0-9` or lowercase `a-f`) into its
/// numeric value. Any other byte, including uppercase `A-F`, yields `None`.
const fn hex_char_to_nibble(nibble: u8) -> Option<u8> {
    match nibble {
        b'0'..=b'9' => Some(nibble - b'0'),
        b'a'..=b'f' => Some(nibble - b'a' + 10),
        _ => None,
    }
}
142

            
143
impl AsRef<str> for Name {
144
269445
    fn as_ref(&self) -> &str {
145
269445
        self.name.as_ref()
146
269445
    }
147
}
148

            
149
/// The owner of a schema item. This should represent the company, group, or
150
/// individual that created the item in question. This value is used for
151
/// namespacing. Changing this after values are in use is not supported without
152
/// manual migrations at this time.
153
40705573
#[derive(Hash, PartialEq, Eq, Deserialize, Serialize, Debug, Clone, Ord, PartialOrd)]
154
#[serde(transparent)]
155
pub struct Authority(Name);
156

            
157
impl From<Cow<'static, str>> for Authority {
158
25506116
    fn from(value: Cow<'static, str>) -> Self {
159
25506116
        Self::from(Name::from(value))
160
25506116
    }
161
}
162

            
163
impl From<&'static str> for Authority {
164
25506599
    fn from(value: &'static str) -> Self {
165
25506599
        Self::from(Cow::Borrowed(value))
166
25506599
    }
167
}
168

            
169
impl From<String> for Authority {
170
    fn from(value: String) -> Self {
171
        Self::from(Cow::Owned(value))
172
    }
173
}
174

            
175
impl From<Name> for Authority {
176
25509407
    fn from(value: Name) -> Self {
177
25509407
        Self(value)
178
25509407
    }
179
}
180

            
181
impl Display for Authority {
182
5380187
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
183
5380187
        Display::fmt(&self.0, f)
184
5380187
    }
185
}
186

            
187
/// The name of a [`Schema`](super::Schema).
188
1152111
#[derive(Hash, PartialEq, Eq, Deserialize, Serialize, Debug, Clone, Ord, PartialOrd)]
189
pub struct SchemaName {
190
    /// The authority of this schema.
191
    pub authority: Authority,
192

            
193
    /// The name of this schema.
194
    pub name: Name,
195
}
196

            
197
impl SchemaName {
198
    /// Creates a new schema name.
199
1246187
    pub fn new<A: Into<Authority>, N: Into<Name>>(authority: A, name: N) -> Self {
200
1246187
        let authority = authority.into();
201
1246187
        let name = name.into();
202
1246187
        Self { authority, name }
203
1246187
    }
204

            
205
    /// Parses a schema name that was previously encoded via
206
    /// [`Self::encoded()`].
207
    ///
208
    /// # Errors
209
    ///
210
    /// Returns [`InvalidNameError`] if the name contains invalid escape
211
    /// sequences or contains more than two periods.
212
162
    pub fn parse_encoded(schema_name: &str) -> Result<Self, InvalidNameError> {
213
162
        let mut parts = schema_name.split('.');
214
162
        if let (Some(authority), Some(name), None) = (parts.next(), parts.next(), parts.next()) {
215
162
            let authority = Name::parse_encoded(authority)?;
216
162
            let name = Name::parse_encoded(name)?;
217

            
218
162
            Ok(Self::new(authority, name))
219
        } else {
220
            Err(InvalidNameError(schema_name.to_string()))
221
        }
222
162
    }
223

            
224
    /// Encodes this schema name such that the authority and name can be
225
    /// safely parsed using [`Self::parse_encoded`].
226
    #[must_use]
227
967
    pub fn encoded(&self) -> String {
228
967
        format!("{:#}", self)
229
967
    }
230
}
231

            
232
impl Display for SchemaName {
233
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
234
968
        Display::fmt(&self.authority, f)?;
235
968
        f.write_char('.')?;
236
968
        Display::fmt(&self.name, f)
237
968
    }
238
}
239

            
240
/// The name of a [`Collection`](super::Collection).
241
39509458
#[derive(Hash, PartialEq, Eq, Deserialize, Serialize, Debug, Clone)]
242
pub struct CollectionName {
243
    /// The authority of this collection.
244
    pub authority: Authority,
245

            
246
    /// The name of this collection.
247
    pub name: Name,
248
}
249

            
250
impl CollectionName {
251
    /// Creates a new collection name.
252
24261265
    pub fn new<A: Into<Authority>, N: Into<Name>>(authority: A, name: N) -> Self {
253
24261265
        let authority = authority.into();
254
24261265
        let name = name.into();
255
24261265
        Self { authority, name }
256
24261265
    }
257

            
258
    /// Parses a colleciton name that was previously encoded via
259
    /// [`Self::encoded()`].
260
    ///
261
    /// # Errors
262
    ///
263
    /// Returns [`InvalidNameError`] if the name contains invalid escape
264
    /// sequences or contains more than two periods.
265
1
    pub fn parse_encoded(collection_name: &str) -> Result<Self, InvalidNameError> {
266
1
        let mut parts = collection_name.split('.');
267
1
        if let (Some(authority), Some(name), None) = (parts.next(), parts.next(), parts.next()) {
268
1
            let authority = Name::parse_encoded(authority)?;
269
1
            let name = Name::parse_encoded(name)?;
270

            
271
1
            Ok(Self::new(authority, name))
272
        } else {
273
            Err(InvalidNameError(collection_name.to_string()))
274
        }
275
1
    }
276

            
277
    /// Encodes this collection name such that the authority and name can be
278
    /// safely parsed using [`Self::parse_encoded`].
279
    #[must_use]
280
530
    pub fn encoded(&self) -> String {
281
530
        format!("{:#}", self)
282
530
    }
283
}
284

            
285
impl Display for CollectionName {
286
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
287
5379380
        Display::fmt(&self.authority, f)?;
288
5379380
        f.write_char('.')?;
289
5379196
        Display::fmt(&self.name, f)
290
5379196
    }
291
}
292

            
293
/// The name of a [`View`](super::View).
294
15490484
#[derive(Hash, PartialEq, Eq, Deserialize, Serialize, Debug, Clone)]
295
pub struct ViewName {
296
    /// The name of the collection that contains this view.
297
    pub collection: CollectionName,
298
    /// The name of this view.
299
    pub name: Name,
300
}
301

            
302
impl ViewName {
303
    /// Creates a new view name.
304
    pub fn new<
305
        C: TryInto<CollectionName, Error = InvalidNameError>,
306
        N: TryInto<Name, Error = InvalidNameError>,
307
    >(
308
        collection: C,
309
        name: N,
310
    ) -> Result<Self, InvalidNameError> {
311
        let collection = collection.try_into()?;
312
        let name = name.try_into()?;
313
        Ok(Self { collection, name })
314
    }
315
}
316

            
317
impl Display for ViewName {
318
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
319
2904601
        Display::fmt(&self.collection, f)?;
320
2904601
        f.write_char('.')?;
321
2904555
        Display::fmt(&self.name, f)
322
2904555
    }
323
}
324

            
325
1
#[test]
fn name_escaping_tests() {
    const VALID_CHARS: &str = "abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789-";
    const INVALID_CHARS: &str = "._hello\u{1F680}";
    const ESCAPED_INVALID: &str = "_2e_5fhello_f0_9f_9a_80";

    // A name made only of safe characters displays unchanged.
    let plain = Name::new(VALID_CHARS);
    assert_eq!(plain.to_string(), VALID_CHARS);

    // Unsafe characters are kept by `to_string()` and escaped by `encoded()`.
    let unsafe_name = Name::new(INVALID_CHARS);
    assert_eq!(unsafe_name.to_string(), INVALID_CHARS);
    assert_eq!(unsafe_name.encoded(), ESCAPED_INVALID);

    // Parsing the escaped form yields the original name.
    assert_eq!(Name::parse_encoded(ESCAPED_INVALID).unwrap(), unsafe_name);

    // Truncated or non-hex escape sequences are rejected.
    for malformed in ["_", "_0", "_z", "_0z"] {
        Name::parse_encoded(malformed).unwrap_err();
    }
}
342

            
343
1
#[test]
fn joined_names_tests() {
    const INVALID_CHARS: &str = "._hello\u{1F680}.._world\u{1F680}";
    const ESCAPED_INVALID: &str = "_2e_5fhello_f0_9f_9a_80._2e_5fworld_f0_9f_9a_80";

    let collection = CollectionName::parse_encoded(ESCAPED_INVALID).unwrap();
    let schema_name = SchemaName::parse_encoded(ESCAPED_INVALID).unwrap();

    // Both joined name types must display the raw text and re-encode to the
    // exact input.
    let observed = [
        (collection.to_string(), collection.encoded()),
        (schema_name.to_string(), schema_name.encoded()),
    ];
    for (displayed, encoded) in observed {
        assert_eq!(displayed, INVALID_CHARS);
        assert_eq!(encoded, ESCAPED_INVALID);
    }
}