|
1 |
| -use std::{borrow::Cow, collections::HashMap, str}; |
| 1 | +use std::{borrow::Cow, collections::HashMap}; |
2 | 2 |
|
3 | 3 | use crate::{unescape, value::Value, Number, Result};
|
4 | 4 |
|
@@ -152,11 +152,6 @@ pub fn null_u8(bytes: &[u8]) -> Result<(&[u8], &[u8])> {
|
152 | 152 | Ok(split_at_u8(bytes, 4))
|
153 | 153 | }
|
154 | 154 |
|
155 |
| -#[inline(always)] |
156 |
| -pub fn split_at(s: &str, mid: usize) -> (&str, &str) { |
157 |
| - unsafe { (s.get_unchecked(..mid), s.get_unchecked(mid..s.len())) } |
158 |
| -} |
159 |
| - |
160 | 155 | #[inline(always)]
|
161 | 156 | pub fn split_at_u8(s: &[u8], mid: usize) -> (&[u8], &[u8]) {
|
162 | 157 | unsafe { (s.get_unchecked(..mid), s.get_unchecked(mid..s.len())) }
|
@@ -201,60 +196,21 @@ pub fn string_u8(bytes: &[u8]) -> Result<(&[u8], &[u8], bool)> {
|
201 | 196 | Ok((a, b, esc))
|
202 | 197 | }
|
203 | 198 |
|
204 |
| -pub fn string(input: &str) -> Result<(&str, &str)> { |
205 |
| - let mut i = 1; |
206 |
| - let bytes = input.as_bytes(); |
207 |
| - const CHUNK: usize = 4; |
208 |
| - |
209 |
| - 'outer: while i + CHUNK < bytes.len() { |
210 |
| - for _ in 0..CHUNK { |
211 |
| - let &b = unsafe { bytes.get_unchecked(i) }; |
212 |
| - i += 1; |
213 |
| - match b { |
214 |
| - b'"' => { |
215 |
| - return Ok(split_at(input, i)); |
216 |
| - } |
217 |
| - b'\\' => { |
218 |
| - i += 1; |
219 |
| - continue 'outer; |
220 |
| - } |
221 |
| - _ => {} |
222 |
| - } |
223 |
| - } |
224 |
| - } |
225 |
| - |
226 |
| - while i < bytes.len() { |
227 |
| - let b = unsafe { *bytes.get_unchecked(i) }; |
228 |
| - |
229 |
| - match b { |
230 |
| - b'"' => { |
231 |
| - i += 1; |
232 |
| - break; |
233 |
| - } |
234 |
| - b'\\' => { |
235 |
| - i += 1; |
236 |
| - } |
237 |
| - _ => {} |
238 |
| - } |
239 |
| - |
240 |
| - i += 1; |
241 |
| - } |
242 |
| - |
243 |
| - return Ok(split_at(input, i)); |
244 |
| -} |
245 |
| - |
246 | 199 | #[cfg(test)]
|
247 |
| -mod test_string { |
248 |
| - use super::string; |
| 200 | +mod test_string_u8 { |
| 201 | + use super::string_u8; |
249 | 202 |
|
250 | 203 | #[test]
|
251 | 204 | fn test_string() {
|
252 | 205 | assert_eq!(
|
253 |
| - string(r#""hello": "tom""#), |
254 |
| - Ok((r#""hello""#, r#": "tom""#)) |
| 206 | + string_u8(r#""hello": "tom""#.as_bytes()), |
| 207 | + Ok((r#""hello""#.as_bytes(), r#": "tom""#.as_bytes(), false)) |
255 | 208 | );
|
256 | 209 |
|
257 |
| - assert_eq!(string(r#""hello"#), Ok((r#""hello"#, r#""#))); |
| 210 | + assert_eq!( |
| 211 | + string_u8(r#""hello"#.as_bytes()), |
| 212 | + Ok((r#""hello"#.as_bytes(), r#""#.as_bytes(), false)) |
| 213 | + ); |
258 | 214 | }
|
259 | 215 | }
|
260 | 216 |
|
@@ -322,83 +278,17 @@ pub fn compound_u8(bytes: &[u8]) -> Result<(&[u8], &[u8])> {
|
322 | 278 | return Ok(split_at_u8(bytes, i));
|
323 | 279 | }
|
324 | 280 |
|
325 |
| -// object or array |
326 |
| -pub fn compound(input: &str) -> Result<(&str, &str)> { |
327 |
| - let bytes = input.as_bytes(); |
328 |
| - let mut i = 1; |
329 |
| - let mut depth = 1; |
330 |
| - |
331 |
| - const CHUNK_SIZE: usize = 32; |
332 |
| - |
333 |
| - 'outer: while i + CHUNK_SIZE < bytes.len() { |
334 |
| - for _ in 0..CHUNK_SIZE { |
335 |
| - let &b = unsafe { bytes.get_unchecked(i) }; |
336 |
| - |
337 |
| - match b { |
338 |
| - b'\\' => { |
339 |
| - i += 2; |
340 |
| - continue 'outer; |
341 |
| - } |
342 |
| - b'"' => { |
343 |
| - let input = unsafe { input.get_unchecked(i..) }; |
344 |
| - let (s, _) = string(input).unwrap(); |
345 |
| - |
346 |
| - i += s.len(); |
347 |
| - continue 'outer; |
348 |
| - } |
349 |
| - b'[' | b'{' => depth += 1, |
350 |
| - b']' | b'}' => { |
351 |
| - depth -= 1; |
352 |
| - if depth == 0 { |
353 |
| - i += 1; |
354 |
| - return Ok(split_at(input, i)); |
355 |
| - } |
356 |
| - } |
357 |
| - _ => (), |
358 |
| - } |
359 |
| - i += 1; |
360 |
| - } |
361 |
| - } |
362 |
| - |
363 |
| - while i < bytes.len() { |
364 |
| - let &b = unsafe { bytes.get_unchecked(i) }; |
365 |
| - match b { |
366 |
| - b'\\' => { |
367 |
| - i += 1; |
368 |
| - } |
369 |
| - b'"' => { |
370 |
| - let input = unsafe { input.get_unchecked(i..) }; |
371 |
| - let (s, _) = string(input).unwrap(); |
372 |
| - i += s.len(); |
373 |
| - continue; |
374 |
| - } |
375 |
| - b'[' | b'{' => depth += 1, |
376 |
| - b']' | b'}' => { |
377 |
| - depth -= 1; |
378 |
| - if depth == 0 { |
379 |
| - i += 1; |
380 |
| - break; |
381 |
| - } |
382 |
| - } |
383 |
| - _ => (), |
384 |
| - } |
385 |
| - i += 1; |
386 |
| - } |
387 |
| - |
388 |
| - return Ok(split_at(input, i)); |
389 |
| -} |
390 |
| - |
391 | 281 | #[cfg(test)]
|
392 |
| -mod test_compound { |
393 |
| - use super::{compound, Result}; |
| 282 | +mod test_compound_u8 { |
| 283 | + use super::{compound_u8, Result}; |
394 | 284 |
|
395 | 285 | #[test]
|
396 | 286 | fn test_compound() -> Result<()> {
|
397 | 287 | const JSON: &str = r#"{"1":"2", "name": "jack"}xxxx"#;
|
398 |
| - let r = compound(JSON)?; |
| 288 | + let r = compound_u8(JSON.as_bytes())?; |
399 | 289 |
|
400 |
| - assert_eq!(r.0, r#"{"1":"2", "name": "jack"}"#); |
401 |
| - assert_eq!(r.1, "xxxx"); |
| 290 | + assert_eq!(r.0, r#"{"1":"2", "name": "jack"}"#.as_bytes()); |
| 291 | + assert_eq!(r.1, "xxxx".as_bytes()); |
402 | 292 |
|
403 | 293 | Ok(())
|
404 | 294 | }
|
|
0 commit comments