1use super::{AsULE, RawBytesULE, VarULE};
6use crate::ule::EqULE;
7use crate::{map::ZeroMapKV, VarZeroSlice, VarZeroVec, ZeroVecError};
8use alloc::boxed::Box;
9use core::cmp::Ordering;
10use core::fmt;
11use core::ops::Deref;
12
13#[repr(transparent)]
46#[derive(PartialEq, Eq, PartialOrd, Ord)]
47#[allow(clippy::exhaustive_structs)] pub struct UnvalidatedStr([u8]);
49
50impl fmt::Debug for UnvalidatedStr {
51 fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
52 match self.try_as_str() {
54 Ok(s) => fmt::Debug::fmt(s, f),
55 Err(_) => fmt::Debug::fmt(&self.0, f),
56 }
57 }
58}
59
60impl UnvalidatedStr {
61 #[inline]
63 pub const fn from_bytes(other: &[u8]) -> &Self {
64 unsafe { core::mem::transmute(other) }
66 }
67
68 #[inline]
70 pub const fn from_str(s: &str) -> &Self {
71 Self::from_bytes(s.as_bytes())
72 }
73
74 #[inline]
76 pub fn from_boxed_bytes(other: Box<[u8]>) -> Box<Self> {
77 unsafe { core::mem::transmute(other) }
79 }
80
81 #[inline]
83 pub fn from_boxed_str(other: Box<str>) -> Box<Self> {
84 Self::from_boxed_bytes(other.into_boxed_bytes())
85 }
86
87 #[inline]
89 pub const fn as_bytes(&self) -> &[u8] {
90 &self.0
91 }
92
93 #[inline]
107 pub fn try_as_str(&self) -> Result<&str, core::str::Utf8Error> {
108 core::str::from_utf8(&self.0)
109 }
110}
111
112impl<'a> From<&'a str> for &'a UnvalidatedStr {
113 #[inline]
114 fn from(other: &'a str) -> Self {
115 UnvalidatedStr::from_str(other)
116 }
117}
118
119impl From<Box<str>> for Box<UnvalidatedStr> {
120 #[inline]
121 fn from(other: Box<str>) -> Self {
122 UnvalidatedStr::from_boxed_str(other)
123 }
124}
125
126impl Deref for UnvalidatedStr {
127 type Target = [u8];
128 fn deref(&self) -> &Self::Target {
129 &self.0
130 }
131}
132
133impl<'a> ZeroMapKV<'a> for UnvalidatedStr {
134 type Container = VarZeroVec<'a, UnvalidatedStr>;
135 type Slice = VarZeroSlice<UnvalidatedStr>;
136 type GetType = UnvalidatedStr;
137 type OwnedType = Box<UnvalidatedStr>;
138}
139
140unsafe impl VarULE for UnvalidatedStr {
149 #[inline]
150 fn validate_byte_slice(_: &[u8]) -> Result<(), ZeroVecError> {
151 Ok(())
152 }
153 #[inline]
154 unsafe fn from_byte_slice_unchecked(bytes: &[u8]) -> &Self {
155 UnvalidatedStr::from_bytes(bytes)
156 }
157}
158
159#[cfg(feature = "serde")]
161impl serde::Serialize for UnvalidatedStr {
162 fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
163 where
164 S: serde::Serializer,
165 {
166 use serde::ser::Error;
167 let s = self
168 .try_as_str()
169 .map_err(|_| S::Error::custom("invalid UTF-8 in UnvalidatedStr"))?;
170 if serializer.is_human_readable() {
171 serializer.serialize_str(s)
172 } else {
173 serializer.serialize_bytes(s.as_bytes())
174 }
175 }
176}
177
178#[cfg(feature = "serde")]
180impl<'de> serde::Deserialize<'de> for Box<UnvalidatedStr> {
181 fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
182 where
183 D: serde::Deserializer<'de>,
184 {
185 if deserializer.is_human_readable() {
186 let boxed_str = Box::<str>::deserialize(deserializer)?;
187 Ok(UnvalidatedStr::from_boxed_str(boxed_str))
188 } else {
189 let boxed_bytes = Box::<[u8]>::deserialize(deserializer)?;
190 Ok(UnvalidatedStr::from_boxed_bytes(boxed_bytes))
191 }
192 }
193}
194
195#[cfg(feature = "serde")]
197impl<'de, 'a> serde::Deserialize<'de> for &'a UnvalidatedStr
198where
199 'de: 'a,
200{
201 fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
202 where
203 D: serde::Deserializer<'de>,
204 {
205 if deserializer.is_human_readable() {
206 let s = <&str>::deserialize(deserializer)?;
207 Ok(UnvalidatedStr::from_str(s))
208 } else {
209 let bytes = <&[u8]>::deserialize(deserializer)?;
210 Ok(UnvalidatedStr::from_bytes(bytes))
211 }
212 }
213}
214
215#[repr(transparent)]
241#[derive(PartialEq, Eq, Clone, Copy, Hash)]
242pub struct UnvalidatedChar([u8; 3]);
243
244impl UnvalidatedChar {
245 #[inline]
256 pub const fn from_char(c: char) -> Self {
257 let [u0, u1, u2, _u3] = (c as u32).to_le_bytes();
258 Self([u0, u1, u2])
259 }
260
261 #[inline]
262 #[doc(hidden)]
263 pub const fn from_u24(c: u32) -> Self {
264 let [u0, u1, u2, _u3] = c.to_le_bytes();
265 Self([u0, u1, u2])
266 }
267
268 #[inline]
282 pub fn try_to_char(self) -> Result<char, core::char::CharTryFromError> {
283 let [u0, u1, u2] = self.0;
284 char::try_from(u32::from_le_bytes([u0, u1, u2, 0]))
285 }
286
287 #[inline]
299 pub fn to_char_lossy(self) -> char {
300 self.try_to_char().unwrap_or(char::REPLACEMENT_CHARACTER)
301 }
302
303 #[inline]
319 pub unsafe fn to_char_unchecked(self) -> char {
320 let [u0, u1, u2] = self.0;
321 char::from_u32_unchecked(u32::from_le_bytes([u0, u1, u2, 0]))
322 }
323}
324
325impl RawBytesULE<3> {
326 #[inline]
329 pub const fn from_unvalidated_char(uc: UnvalidatedChar) -> Self {
330 RawBytesULE(uc.0)
331 }
332}
333
334impl AsULE for UnvalidatedChar {
335 type ULE = RawBytesULE<3>;
336
337 #[inline]
338 fn to_unaligned(self) -> Self::ULE {
339 RawBytesULE(self.0)
340 }
341
342 #[inline]
343 fn from_unaligned(unaligned: Self::ULE) -> Self {
344 Self(unaligned.0)
345 }
346}
347
348unsafe impl EqULE for UnvalidatedChar {}
351
352impl fmt::Debug for UnvalidatedChar {
353 fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
354 match self.try_to_char() {
356 Ok(c) => fmt::Debug::fmt(&c, f),
357 Err(_) => fmt::Debug::fmt(&self.0, f),
358 }
359 }
360}
361
362impl PartialOrd for UnvalidatedChar {
363 fn partial_cmp(&self, other: &Self) -> Option<Ordering> {
364 Some(self.cmp(other))
365 }
366}
367
368impl Ord for UnvalidatedChar {
369 fn cmp(&self, other: &Self) -> Ordering {
371 let [a0, a1, a2] = self.0;
372 let a = u32::from_le_bytes([a0, a1, a2, 0]);
373 let [b0, b1, b2] = other.0;
374 let b = u32::from_le_bytes([b0, b1, b2, 0]);
375 a.cmp(&b)
376 }
377}
378
379impl From<char> for UnvalidatedChar {
380 #[inline]
381 fn from(value: char) -> Self {
382 Self::from_char(value)
383 }
384}
385
386impl TryFrom<UnvalidatedChar> for char {
387 type Error = core::char::CharTryFromError;
388
389 #[inline]
390 fn try_from(value: UnvalidatedChar) -> Result<char, Self::Error> {
391 value.try_to_char()
392 }
393}
394
395#[cfg(feature = "serde")]
397impl serde::Serialize for UnvalidatedChar {
398 fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
399 where
400 S: serde::Serializer,
401 {
402 use serde::ser::Error;
403 let c = self
404 .try_to_char()
405 .map_err(|_| S::Error::custom("invalid Unicode scalar value in UnvalidatedChar"))?;
406 if serializer.is_human_readable() {
407 serializer.serialize_char(c)
408 } else {
409 self.0.serialize(serializer)
410 }
411 }
412}
413
414#[cfg(feature = "serde")]
416impl<'de> serde::Deserialize<'de> for UnvalidatedChar {
417 fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
418 where
419 D: serde::Deserializer<'de>,
420 {
421 if deserializer.is_human_readable() {
422 let c = <char>::deserialize(deserializer)?;
423 Ok(UnvalidatedChar::from_char(c))
424 } else {
425 let bytes = <[u8; 3]>::deserialize(deserializer)?;
426 Ok(UnvalidatedChar(bytes))
427 }
428 }
429}
430
431#[cfg(feature = "databake")]
432impl databake::Bake for UnvalidatedChar {
433 fn bake(&self, env: &databake::CrateEnv) -> databake::TokenStream {
434 match self.try_to_char() {
435 Ok(ch) => {
436 env.insert("zerovec");
437 let ch = ch.bake(env);
438 databake::quote! {
439 zerovec::ule::UnvalidatedChar::from_char(#ch)
440 }
441 }
442 Err(_) => {
443 env.insert("zerovec");
444 let u24 = u32::from_le_bytes([self.0[0], self.0[1], self.0[2], 0]);
445 databake::quote! {
446 zerovec::ule::UnvalidatedChar::from_u24(#u24)
447 }
448 }
449 }
450 }
451}
452
453#[cfg(test)]
454mod test {
455 use super::*;
456 use crate::ZeroVec;
457
458 #[test]
459 fn test_serde_fail() {
460 let uc = UnvalidatedChar([0xFF, 0xFF, 0xFF]);
461 serde_json::to_string(&uc).expect_err("serialize invalid char bytes");
462 bincode::serialize(&uc).expect_err("serialize invalid char bytes");
463 }
464
465 #[test]
466 fn test_serde_json() {
467 let c = '🙃';
468 let uc = UnvalidatedChar::from_char(c);
469 let json_ser = serde_json::to_string(&uc).unwrap();
470
471 assert_eq!(json_ser, r#""🙃""#);
472
473 let json_de: UnvalidatedChar = serde_json::from_str(&json_ser).unwrap();
474
475 assert_eq!(uc, json_de);
476 }
477
478 #[test]
479 fn test_serde_bincode() {
480 let c = '🙃';
481 let uc = UnvalidatedChar::from_char(c);
482 let bytes_ser = bincode::serialize(&uc).unwrap();
483
484 assert_eq!(bytes_ser, [0x43, 0xF6, 0x01]);
485
486 let bytes_de: UnvalidatedChar = bincode::deserialize(&bytes_ser).unwrap();
487
488 assert_eq!(uc, bytes_de);
489 }
490
491 #[test]
492 fn test_representation() {
493 let chars = ['w', 'ω', '文', '𑄃', '🙃'];
494
495 let uvchars: Vec<_> = chars
497 .iter()
498 .copied()
499 .map(UnvalidatedChar::from_char)
500 .collect();
501 let zvec: ZeroVec<_> = uvchars.clone().into_iter().collect();
503
504 let ule_bytes = zvec.as_bytes();
505 let uvbytes;
506 unsafe {
507 let ptr = &uvchars[..] as *const _ as *const u8;
508 uvbytes = core::slice::from_raw_parts(ptr, ule_bytes.len());
509 }
510
511 assert_eq!(uvbytes, ule_bytes);
514
515 assert_eq!(
516 &[119, 0, 0, 201, 3, 0, 135, 101, 0, 3, 17, 1, 67, 246, 1],
517 ule_bytes
518 );
519 }
520
521 #[test]
522 fn test_char_bake() {
523 databake::test_bake!(UnvalidatedChar, const: crate::ule::UnvalidatedChar::from_char('b'), zerovec);
524 databake::test_bake!(UnvalidatedChar, const: crate::ule::UnvalidatedChar::from_u24(55296u32), zerovec);
526 }
527}