1 use crate::{Literal, StringLit, test_util::{assert_parse_ok_eq, assert_roundtrip}};
2
3 // ===== Utility functions =======================================================================
4
/// Asserts that a string literal parses successfully and exposes the expected data.
///
/// * `check!(lit, has_escapes, num_hashes)`: the parser input is the source text of `lit`
///   (obtained through `stringify!`) and the expected suffix is empty.
/// * `check!(lit, input, has_escapes, num_hashes, suffix)`: `input` is handed to the parser,
///   `lit` is the value it must evaluate to, and `suffix` is the expected suffix text.
///
/// In both forms `has_escapes` decides whether the expected `value` field is `Some(..)` or
/// `None`, and `num_hashes` is copied verbatim into the expected `StringLit`.
macro_rules! check {
    // Short form: forward to the long form with the literal's own source text and no suffix.
    ($lit:literal, $has_escapes:expr, $num_hashes:expr) => {
        check!($lit, stringify!($lit), $has_escapes, $num_hashes, "")
    };
    ($lit:literal, $input:expr, $has_escapes:expr, $num_hashes:expr, $suffix:literal) => {
        let src = $input;
        // The expected `value` is only filled in when the caller says escapes are present.
        let unescaped = if $has_escapes { Some($lit.to_string()) } else { None };
        let want = StringLit {
            raw: src,
            value: unescaped,
            num_hashes: $num_hashes,
            // The suffix occupies the tail of the input, so it starts `suffix.len()` bytes
            // before the end.
            start_suffix: src.len() - $suffix.len(),
        };

        // Both entry points have to produce the same result.
        assert_parse_ok_eq(src, StringLit::parse(src), want.clone(), "StringLit::parse");
        assert_parse_ok_eq(
            src,
            Literal::parse(src),
            Literal::String(want.clone()),
            "Literal::parse",
        );

        // Accessors on a freshly parsed literal; `into_value` consumes it and therefore goes last.
        let parsed = StringLit::parse(src).unwrap();
        assert_eq!(parsed.value(), $lit);
        assert_eq!(parsed.suffix(), $suffix);
        assert_eq!(parsed.into_value(), $lit);

        // NOTE(review): presumably checks that the literal converts back to `src` — confirm
        // against `test_util::assert_roundtrip`.
        assert_roundtrip(want.into_owned(), src);
    };
}
28
29
30 // ===== Actual tests ============================================================================
31
/// Literals without any escape sequence, written in a variety of scripts.
#[test]
fn simple() {
    // Every case shares the same expectation: no escapes, not a raw string.
    macro_rules! plain {
        ($( $lit:literal ),+ $(,)?) => {
            $( check!($lit, false, None); )+
        };
    }

    plain![
        "",
        "a",
        "peter",
        "Sei gegrüßt, Bärthelt!",
        "أنا لا أتحدث العربية",
        "お前はもう死んでいる",
        "Пушки - интересные музыкальные инструменты",
        "lit af",
    ];
}
43
/// Whitespace characters placed *unescaped* inside a literal (both `"…"` and `r"…"`) are
/// plain content: the expected `value` field is `None` and the literal evaluates to the
/// embedded text unchanged.
#[test]
fn special_whitespace() {
    // Each entry is spliced verbatim between the quotes. The last one combines a 4-byte
    // character (U+1F98A) with a newline so that every entry exercises a different input.
    let strings = ["\n", "\t", "foo\tbar", "\u{1F98A}\n"];

    for &s in &strings {
        let cooked = format!(r#""{}""#, s);
        let raw = format!(r#"r"{}""#, s);

        // A normal string reports no hashes at all, a raw string without `#` reports zero.
        for (input, num_hashes) in vec![(cooked, None), (raw, Some(0))] {
            let expected = StringLit {
                raw: &*input,
                value: None,
                num_hashes,
                // No suffix, so the suffix starts at the very end of the input.
                start_suffix: input.len(),
            };

            assert_parse_ok_eq(
                &input,
                StringLit::parse(&*input),
                expected.clone(),
                "StringLit::parse",
            );
            assert_parse_ok_eq(
                &input,
                Literal::parse(&*input),
                Literal::String(expected),
                "Literal::parse",
            );

            // `into_value` consumes the literal, hence the second parse.
            assert_eq!(StringLit::parse(&*input).unwrap().value(), s);
            assert_eq!(StringLit::parse(&*input).unwrap().into_value(), s);
        }
    }
}
67
/// Literals containing quote, backslash, ASCII (`\n`, `\t`, `\r`, `\0`) and `\x` escapes.
#[test]
fn simple_escapes() {
    // Every case contains at least one escape and is a normal (non-raw) string.
    macro_rules! escaped {
        ($( $lit:literal ),+ $(,)?) => {
            $( check!($lit, true, None); )+
        };
    }

    // A lone `\n` at different positions.
    escaped!["a\nb", "\nb", "a\n", "\n"];

    // Escapes mixed with multi-byte text, including escaped backslashes and quotes.
    escaped![
        "\x60犬 \t 猫\r馬\n うさぎ \0ネズミ",
        "నా \\పిల్లి లావుగా ఉంది",
        "నా \\పిల్లి లావుగా \"ఉంది",
        "\\నా\\ పిల్లి లావుగా\" ఉంది\"",
        "\"నా \\ పిల్లి లావుగా \" ఉంది\\",
    ];

    // `\x` escapes, plus look-alikes where the backslash or quote is itself escaped.
    escaped![
        "\x00",
        " \x01",
        "\x0c ",
        " \x0D ",
        "\\x13",
        "\"x30",
    ];
}
88
/// Literals containing `\u{…}` escapes: varying digit counts, upper/lower-case hex digits,
/// neighbouring escapes and `_` separators inside the braces.
#[test]
fn unicode_escapes() {
    // Every case contains at least one escape and is a normal (non-raw) string.
    macro_rules! escaped {
        ($( $lit:literal ),+ $(,)?) => {
            $( check!($lit, true, None); )+
        };
    }

    // Plain hex digits.
    escaped![
        "\u{0}",
        " \u{00}",
        "\u{b} ",
        " \u{B} ",
        "\u{7e}",
        "నక్క\u{E4}",
        "\u{e4} నక్క",
        " \u{fc}నక్క ",
        "\u{Fc}",
        "\u{fC}\nлиса",
        "лиса\u{FC}",
        "лиса\u{b10}నక్క",
        "\"నక్క\u{B10}",
        "лиса\\\u{0b10}",
        "лиса\\\"\u{0b10}",
        "నక్క\\\\u{0b10}",
        "\u{2764}Füchsin",
        "Füchse \u{1f602}",
        "cd\u{1F602}ab",
    ];

    // Underscores between (and after) the hex digits.
    escaped![
        "\u{0}",
        "лиса\u{0__}",
        "\\\u{3_b}",
        "\u{1_F_6_0_2}Füchsin",
        "నక్క\\\u{1_F6_02_____}నక్క",
    ];
}
117
/// A backslash directly before a line break ("string continue") in normal strings, and the
/// absence of that feature in raw strings.
#[test]
fn string_continue() {
    // Continuation followed by text, by the closing quote, and by an empty line.
    check!("నక్క\
bar", true, None);
    check!("foo\
", true, None);

    check!("foo\

banana", true, None);

    // Weird whitespace characters: (parser input, expected value). Per these expectations
    // `\n`, `\r`, `\t` and space are swallowed after the continuation, while U+0085 and
    // U+00A0 are kept.
    let weird = [
        ("\"foo\\\n\r\t\n \n\tbar\"", "foobar"),
        ("\"foo\\\n\u{85}bar\"", "foo\u{85}bar"),
        ("\"foo\\\n\u{a0}bar\"", "foo\u{a0}bar"),
    ];
    for &(input, value) in &weird {
        let lit = StringLit::parse(input).expect("failed to parse");
        assert_eq!(lit.value(), value);
    }

    // Raw strings do not handle "string continues"
    check!(r"foo\
bar", false, Some(0));
}
141
/// A `\r\n` pair inside a literal is expected to come out as a single `\n` in the value, for
/// normal strings as well as raw strings with zero, one or two hashes.
#[test]
fn crlf_newlines() {
    // (parser input, expected value)
    let cases = [
        // Normal strings.
        ("\"foo\r\nbar\"", "foo\nbar"),
        ("\"\r\nbar\"", "\nbar"),
        ("\"лиса\r\n\"", "лиса\n"),
        // Raw strings.
        ("r\"foo\r\nbar\"", "foo\nbar"),
        ("r#\"\r\nbar\"#", "\nbar"),
        ("r##\"лиса\r\n\"##", "лиса\n"),
    ];

    for &(input, value) in &cases {
        let lit = StringLit::parse(input).expect("failed to parse");
        assert_eq!(lit.value(), value);
    }
}
162
/// Raw string literals with different numbers of `#`, embedded quotes and hashes, and
/// backslash sequences that must be left untouched.
#[test]
fn raw_string() {
    // `hashes => literal`: every case is escape-free and expects `Some(hashes)`.
    macro_rules! raw_cases {
        ($( $hashes:literal => $lit:literal ),+ $(,)?) => {
            $( check!($lit, false, Some($hashes)); )+
        };
    }

    // No hashes at all.
    raw_cases! {
        0 => r"",
        0 => r"a",
        0 => r"peter",
        0 => r"Sei gegrüßt, Bärthelt!",
        0 => r"أنا لا أتحدث العربية",
        0 => r"お前はもう死んでいる",
        0 => r"Пушки - интересные музыкальные инструменты",
        0 => r"lit af",
    }

    // Increasing numbers of hashes.
    raw_cases! {
        1 => r#""#,
        1 => r#"a"#,
        2 => r##"peter"##,
        3 => r###"Sei gegrüßt, Bärthelt!"###,
        8 => r########"lit af"########,
    }

    // Quotes and hashes inside the content.
    raw_cases! {
        1 => r#"foo " bar"#,
        2 => r##"foo " bar"##,
        1 => r#"foo """" '"'" bar"#,
        1 => r#""foo""#,
        3 => r###""foo'"###,
        1 => r#""x'#_#s'"#,
        0 => r"#",
        0 => r"foo#",
        0 => r"##bar",
        3 => r###""##foo"##bar'"###,
    }

    // Backslash sequences are not escapes in raw strings.
    raw_cases! {
        0 => r"さび\n\t\r\0\\x60\u{123}フェリス",
        1 => r#"さび\n\t\r\0\\x60\u{123}フェリス"#,
    }
}
194
/// Literals followed by a suffix. Arguments per case: expected value, parser input,
/// whether the input contains escapes, expected hash count, expected suffix.
#[test]
fn suffixes() {
    check!(
        "hello",
        r###""hello"suffix"###,
        false,
        None,
        "suffix"
    );

    // Raw string with a suffix that starts with an underscore.
    check!(
        r"お前はもう死んでいる",
        r###"r"お前はもう死んでいる"_banana"###,
        false,
        Some(0),
        "_banana"
    );

    check!(
        "fox",
        r#""fox"peter"#,
        false,
        None,
        "peter"
    );

    // Empty string directly followed by a suffix.
    check!(
        "",
        r#"""peter"#,
        false,
        None,
        "peter"
    );

    // Escapes in the content, non-ASCII characters in the suffix.
    check!(
        "నక్క\\\\u{0b10}",
        r###""నక్క\\\\u{0b10}"jü_rgen"###,
        true,
        None,
        "jü_rgen"
    );
}
203
/// Inputs that must be rejected, together with the expected error kind and the expected
/// position (`None`, a single byte offset, or a byte range).
#[test]
fn parse_err() {
    // An opening quote that is never closed.
    assert_err!(StringLit, r#"""#, UnterminatedString, None);
    assert_err!(StringLit, r#""犬"#, UnterminatedString, None);
    assert_err!(StringLit, r#""Jürgen"#, UnterminatedString, None);
    assert_err!(StringLit, r#""foo bar baz"#, UnterminatedString, None);

    // Trailing text after the closing delimiter that cannot be part of the literal.
    assert_err!(StringLit, r#""fox"peter""#, InvalidSuffix, 5);
    assert_err!(StringLit, r###"r#"foo "# bar"#"###, UnexpectedChar, 9);

    // A carriage return that is not followed by a line feed, in normal and raw strings.
    assert_err!(StringLit, "\"\r\"", IsolatedCr, 1);
    assert_err!(StringLit, "\"fo\rx\"", IsolatedCr, 3);
    assert_err!(StringLit, "r\"\r\"", IsolatedCr, 2);
    assert_err!(StringLit, "r\"fo\rx\"", IsolatedCr, 4);

    // Raw strings whose closing delimiter never shows up with enough hashes.
    assert_err!(StringLit, r##"r####""##, UnterminatedRawString, None);
    assert_err!(StringLit, r#####"r##"foo"#bar"#####, UnterminatedRawString, None);

    // An `r` plus hashes that is never followed by an opening quote.
    assert_err!(StringLit, r##"r####"##, InvalidLiteral, None);
    assert_err!(StringLit, r##"r####x"##, InvalidLiteral, None);
}
224
/// `\x` escapes with a value above `0x7F` must be rejected with `NonAsciiXEscape`, and the
/// reported span must cover exactly the four bytes of the offending escape.
///
/// Spans are byte offsets into the input: the opening quote is byte 0 and the Telugu word
/// used below occupies 12 bytes.
#[test]
fn invald_ascii_escapes() {
    assert_err!(StringLit, r#""\x80""#, NonAsciiXEscape, 1..5);
    // A 4-byte character (U+1F98A) precedes the escape, which therefore starts at byte 5.
    // It is spelled as `\u{…}` in a normal string so that its width is visible here; the
    // parser still receives the raw character followed by a literal `\x81`.
    assert_err!(StringLit, "\"\u{1F98A}\\x81\"", NonAsciiXEscape, 5..9);
    assert_err!(StringLit, r#"" \x8a""#, NonAsciiXEscape, 2..6);
    assert_err!(StringLit, r#""\x8Ff""#, NonAsciiXEscape, 1..5);
    assert_err!(StringLit, r#""\xa0 ""#, NonAsciiXEscape, 1..5);
    assert_err!(StringLit, r#""నక్క\xB0""#, NonAsciiXEscape, 13..17);
    assert_err!(StringLit, r#""\xc3నక్క""#, NonAsciiXEscape, 1..5);
    assert_err!(StringLit, r#""\xDf""#, NonAsciiXEscape, 1..5);
    assert_err!(StringLit, r#""నక్క\xffనక్క""#, NonAsciiXEscape, 13..17);
    assert_err!(StringLit, r#""\xfF ""#, NonAsciiXEscape, 1..5);
    assert_err!(StringLit, r#"" \xFf""#, NonAsciiXEscape, 2..6);
    // Two spaces follow the 12-byte word: 1 (quote) + 12 + 2 = 15.
    assert_err!(StringLit, r#""నక్క  \xFF""#, NonAsciiXEscape, 15..19);
}
240
/// Malformed backslash escapes: unknown escape letters, escapes cut off by the end of the
/// string content, and `\x` escapes containing non-hex digits.
///
/// Spans are byte offsets into the input, with the opening quote at byte 0.
#[test]
fn invalid_escapes() {
    assert_err!(StringLit, r#""\a""#, UnknownEscape, 1..3);
    assert_err!(StringLit, r#""foo\y""#, UnknownEscape, 4..6);

    // The escape is cut short; the span runs up to (not including) the closing quote.
    assert_err!(StringLit, r#""\"#, UnterminatedEscape, 1);
    assert_err!(StringLit, r#""\x""#, UnterminatedEscape, 1..3);
    // A 4-byte character (U+1F98A) precedes the escape, which therefore starts at byte 5.
    // It is spelled as `\u{…}` in a normal string so that its width is visible here; the
    // parser still receives the raw character followed by a literal `\x1`.
    assert_err!(StringLit, "\"\u{1F98A}\\x1\"", UnterminatedEscape, 5..8);

    assert_err!(StringLit, r#"" \xaj""#, InvalidXEscape, 2..6);
    assert_err!(StringLit, r#""నక్క\xjb""#, InvalidXEscape, 13..17);
}
251
/// Malformed `\u{…}` escapes and the error kind/position expected for each of them.
///
/// Spans are byte offsets into the input: the opening quote is byte 0 and the Telugu word
/// used below occupies 12 bytes. Where a case is prefixed with a 4-byte character (U+1F98A),
/// it is spelled as `\u{…}` in a normal string so that its width is visible here; the parser
/// still receives the raw character followed by a literal backslash sequence.
#[test]
fn invalid_unicode_escapes() {
    // `\u` that is not followed by `{`: the span covers just `\u`.
    assert_err!(StringLit, r#""\u""#, UnicodeEscapeWithoutBrace, 1..3);
    assert_err!(StringLit, "\"\u{1F98A}\\u \"", UnicodeEscapeWithoutBrace, 5..7);
    assert_err!(StringLit, r#""\u3""#, UnicodeEscapeWithoutBrace, 1..3);

    // Missing `}`: the span runs from the backslash up to (not including) the closing quote.
    assert_err!(StringLit, r#""\u{""#, UnterminatedUnicodeEscape, 1..4);
    assert_err!(StringLit, r#""\u{12""#, UnterminatedUnicodeEscape, 1..6);
    assert_err!(StringLit, "\"\u{1F98A}\\u{a0b\"", UnterminatedUnicodeEscape, 5..11);
    // Two trailing spaces, so the content ends at byte 10.
    assert_err!(StringLit, r#""\u{a0_b  ""#, UnterminatedUnicodeEscape, 1..10);

    // The first character inside the braces is an underscore.
    assert_err!(StringLit, r#""\u{_}నక్క""#, InvalidStartOfUnicodeEscape, 4);
    assert_err!(StringLit, r#""\u{_5f}""#, InvalidStartOfUnicodeEscape, 4);

    // A non-hex character inside the braces: the position points at that character.
    assert_err!(StringLit, r#""fox\u{x}""#, NonHexDigitInUnicodeEscape, 7);
    assert_err!(StringLit, r#""\u{0x}""#, NonHexDigitInUnicodeEscape, 5);
    assert_err!(StringLit, r#""నక్క\u{3bx}""#, NonHexDigitInUnicodeEscape, 18);
    assert_err!(StringLit, r#""\u{3b_x}лиса""#, NonHexDigitInUnicodeEscape, 7);
    assert_err!(StringLit, r#""\u{4x_}""#, NonHexDigitInUnicodeEscape, 5);

    // More than six hex digits: the position points at the seventh digit.
    assert_err!(StringLit, r#""\u{1234567}""#, TooManyDigitInUnicodeEscape, 10);
    assert_err!(StringLit, r#""నక్క\u{1234567}""#, TooManyDigitInUnicodeEscape, 22);
    assert_err!(StringLit, r#""నక్క\u{1_23_4_56_7}""#, TooManyDigitInUnicodeEscape, 26);
    assert_err!(StringLit, r#""\u{abcdef123}лиса""#, TooManyDigitInUnicodeEscape, 10);

    // Well-formed escape whose value is not a valid `char`.
    assert_err!(StringLit, r#""\u{110000}fox""#, InvalidUnicodeEscapeChar, 1..10);
}
279