1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
|
//! Line ending detection and conversion.
use std::fmt::Debug;
/// Supported line endings. Like in the Rust standard library, two line
/// endings are supported: `\r\n` and `\n`
#[derive(Clone, Copy, Debug, PartialEq, Eq)]
pub enum LineEnding {
/// _Carriage return and line feed_ – a line ending sequence
/// historically used in Windows. Corresponds to the sequence
/// of ASCII control characters `0x0D 0x0A` or `\r\n`
CRLF,
/// _Line feed_ – a line ending historically used in Unix.
/// Corresponds to the ASCII control character `0x0A` or `\n`
LF,
}
impl LineEnding {
/// Turns this [`LineEnding`] value into its ASCII representation.
#[inline]
pub const fn as_str(&self) -> &'static str {
match self {
Self::CRLF => "\r\n",
Self::LF => "\n",
}
}
}
/// An iterator over the lines of a string, as tuples of string slice
/// and [`LineEnding`] value; it only emits non-empty lines (i.e. having
/// some content before the terminating `\r\n` or `\n`).
///
/// This struct is used internally by the library.
#[derive(Debug, Clone, Copy)]
pub(crate) struct NonEmptyLines<'a>(pub &'a str);
impl<'a> Iterator for NonEmptyLines<'a> {
type Item = (&'a str, Option<LineEnding>);
fn next(&mut self) -> Option<Self::Item> {
while let Some(lf) = self.0.find('\n') {
if lf == 0 || (lf == 1 && self.0.as_bytes()[lf - 1] == b'\r') {
self.0 = &self.0[(lf + 1)..];
continue;
}
let trimmed = match self.0.as_bytes()[lf - 1] {
b'\r' => (&self.0[..(lf - 1)], Some(LineEnding::CRLF)),
_ => (&self.0[..lf], Some(LineEnding::LF)),
};
self.0 = &self.0[(lf + 1)..];
return Some(trimmed);
}
if self.0.is_empty() {
None
} else {
let line = std::mem::take(&mut self.0);
Some((line, None))
}
}
}
#[cfg(test)]
mod tests {
use super::*;
#[test]
fn non_empty_lines_full_case() {
assert_eq!(
NonEmptyLines("LF\nCRLF\r\n\r\n\nunterminated")
.collect::<Vec<(&str, Option<LineEnding>)>>(),
vec![
("LF", Some(LineEnding::LF)),
("CRLF", Some(LineEnding::CRLF)),
("unterminated", None),
]
);
}
#[test]
fn non_empty_lines_new_lines_only() {
assert_eq!(NonEmptyLines("\r\n\n\n\r\n").next(), None);
}
#[test]
fn non_empty_lines_no_input() {
assert_eq!(NonEmptyLines("").next(), None);
}
}
|