1 use crate::{Literal, StringLit, test_util::{assert_parse_ok_eq, assert_roundtrip}};
2 
// ===== Utility functions =======================================================================
4 
/// Asserts that the literal `$lit` is parsed into the expected `StringLit`.
///
/// The source text of `$lit` (obtained via `stringify!`) is used as parser input, while
/// `$lit` itself, as evaluated by the Rust compiler, serves as the expected string value.
///
/// - `$lit`: the string literal under test.
/// - `$has_escapes`: if `true`, the expected `value` field is `Some($lit.to_string())`,
///   otherwise `None`.
/// - `$num_hashes`: the expected `num_hashes` field. In this file it is `None` for normal
///   strings and `Some(n)` for raw strings delimited by `n` hashes.
macro_rules! check {
    ($lit:literal, $has_escapes:expr, $num_hashes:expr) => {
        // The literal exactly as it is written in this file, including quotes and escapes.
        let input = stringify!($lit);
        let expected = StringLit {
            raw: input,
            value: if $has_escapes { Some($lit.to_string()) } else { None },
            num_hashes: $num_hashes,
        };

        // Both entry points have to agree on the parsed representation.
        assert_parse_ok_eq(input, StringLit::parse(input), expected.clone(), "StringLit::parse");
        assert_parse_ok_eq(
            input, Literal::parse(input), Literal::String(expected.clone()), "Literal::parse");

        // The borrowing and the consuming accessor must both yield the value rustc computed.
        assert_eq!(StringLit::parse(input).unwrap().value(), $lit);
        assert_eq!(StringLit::parse(input).unwrap().into_value(), $lit);

        // NOTE(review): presumably verifies that the owned literal converts back to `input`;
        // see `test_util::assert_roundtrip` for the exact contract.
        assert_roundtrip(expected.into_owned(), input);
    };
}
22 
23 
// ===== Actual tests ============================================================================
25 
/// Normal string literals without any escapes: empty, ASCII, and text in several scripts,
/// including characters that need four bytes in UTF-8.
#[test]
fn simple() {
    check!("", false, None);
    check!("a", false, None);
    check!("peter", false, None);
    check!("Sei gegrüßt, Bärthelt!", false, None);
    check!("أنا لا أتحدث العربية", false, None);
    check!("お前はもう死んでいる", false, None);
    check!("Пушки - интересные музыкальные инструменты", false, None);
    check!("lit 👌 😂 af", false, None);
}
37 
/// Literals that contain *actual* newline and tab characters (not escape sequences).
///
/// Each string is embedded verbatim into a normal (`"…"`) and a raw (`r"…"`) literal. As no
/// escape is involved, the expected `value` field is `None` in both cases, and the parsed
/// value must equal the embedded string.
#[test]
fn special_whitespace() {
    let strings = ["\n", "\t", "foo\tbar", "🦊\n"];

    for &s in &strings {
        // `format!` inserts the real whitespace characters between the quotes.
        let input = format!(r#""{}""#, s);
        let input_raw = format!(r#"r"{}""#, s);
        for (input, num_hashes) in vec![(input, None), (input_raw, Some(0))] {
            let expected = StringLit {
                raw: &*input,
                value: None,
                num_hashes,
            };
            assert_parse_ok_eq(
                &input, StringLit::parse(&*input), expected.clone(), "StringLit::parse");
            assert_parse_ok_eq(
                &input, Literal::parse(&*input), Literal::String(expected), "Literal::parse");
            assert_eq!(StringLit::parse(&*input).unwrap().value(), s);
            assert_eq!(StringLit::parse(&*input).unwrap().into_value(), s);
        }
    }
}
60 
/// Normal string literals using the simple escapes (`\n`, `\t`, `\r`, `\0`, `\\`, `\"`) and
/// `\xNN` escapes, mixed with multi-byte text at various positions.
#[test]
fn simple_escapes() {
    check!("a\nb", true, None);
    check!("\nb", true, None);
    check!("a\n", true, None);
    check!("\n", true, None);

    check!("\x60犬 \t 猫\r馬\n うさぎ \0ネズミ", true, None);
    check!("నా \\పిల్లి లావుగా ఉంది", true, None);
    check!("నా \\పిల్లి లావుగా 🐈\"ఉంది", true, None);
    check!("\\నా\\ పిల్లి లావుగా\" ఉంది\"", true, None);
    check!("\"నా \\🐈 పిల్లి లావుగా \" ఉంది\\", true, None);

    check!("\x00", true, None);
    check!(" \x01", true, None);
    check!("\x0c 🦊", true, None);
    check!(" 🦊\x0D ", true, None);
    // An escaped backslash or quote followed by text that merely looks like an `\x` escape.
    check!("\\x13", true, None);
    check!("\"x30", true, None);
}
81 
/// Normal string literals using `\u{…}` escapes: different digit counts, upper and lower case
/// hex digits, neighbouring multi-byte text and other escapes, and underscores between and
/// after the digits.
#[test]
fn unicode_escapes() {
    check!("\u{0}", true, None);
    check!(" \u{00}", true, None);
    check!("\u{b} ", true, None);
    check!(" \u{B} ", true, None);
    check!("\u{7e}", true, None);
    check!("నక్క\u{E4}", true, None);
    check!("\u{e4} నక్క", true, None);
    check!(" \u{fc}నక్క ", true, None);
    check!("\u{Fc}", true, None);
    check!("\u{fC}🦊\nлиса", true, None);
    check!("лиса\u{FC}", true, None);
    check!("лиса\u{b10}నక్క🦊", true, None);
    check!("\"నక్క\u{B10}", true, None);
    check!("лиса\\\u{0b10}", true, None);
    check!("ли🦊са\\\"\u{0b10}", true, None);
    // Two escaped backslashes: the following `u{0b10}` is plain text, not an escape.
    check!("నక్క\\\\u{0b10}", true, None);
    check!("\u{2764}Füchsin", true, None);
    check!("Füchse \u{1f602}", true, None);
    check!("cd\u{1F602}ab", true, None);

    // Underscores inside the braces (after the first digit).
    check!("\u{0}🦊", true, None);
    check!("лиса\u{0__}", true, None);
    check!("\\🦊\u{3_b}", true, None);
    check!("🦊\u{1_F_6_0_2}Füchsin", true, None);
    check!("నక్క\\\u{1_F6_02_____}నక్క", true, None);
}
110 
/// "String continue" escapes: a backslash directly followed by a line break inside a normal
/// string literal.
///
/// The multi-line literals below are position sensitive: everything between the trailing
/// backslash and the next line's first character is part of the literal's source text.
#[test]
fn string_continue() {
    check!("నక్క\
        bar", true, None);
    check!("foo\
🦊", true, None);

    check!("foo\

        banana", true, None);

    // Weird whitespace characters: `\n`, `\r`, `\t` and spaces after the backslash are all
    // skipped, whereas U+0085 and U+00A0 stay part of the value.
    let lit = StringLit::parse("\"foo\\\n\r\t\n \n\tbar\"").expect("failed to parse");
    assert_eq!(lit.value(), "foobar");
    let lit = StringLit::parse("\"foo\\\n\u{85}bar\"").expect("failed to parse");
    assert_eq!(lit.value(), "foo\u{85}bar");
    let lit = StringLit::parse("\"foo\\\n\u{a0}bar\"").expect("failed to parse");
    assert_eq!(lit.value(), "foo\u{a0}bar");

    // Raw strings do not handle "string continues"
    check!(r"foo\
        bar", false, Some(0));
}
134 
/// A `\r\n` sequence inside a literal is expected to show up as a single `\n` in the value,
/// for normal strings as well as for raw strings with zero, one, or two hashes.
#[test]
fn crlf_newlines() {
    // Normal strings.
    let lit = StringLit::parse("\"foo\r\nbar\"").expect("failed to parse");
    assert_eq!(lit.value(), "foo\nbar");

    let lit = StringLit::parse("\"\r\nbar\"").expect("failed to parse");
    assert_eq!(lit.value(), "\nbar");

    let lit = StringLit::parse("\"лиса\r\n\"").expect("failed to parse");
    assert_eq!(lit.value(), "лиса\n");

    // Raw strings.
    let lit = StringLit::parse("r\"foo\r\nbar\"").expect("failed to parse");
    assert_eq!(lit.value(), "foo\nbar");

    let lit = StringLit::parse("r#\"\r\nbar\"#").expect("failed to parse");
    assert_eq!(lit.value(), "\nbar");

    let lit = StringLit::parse("r##\"лиса\r\n\"##").expect("failed to parse");
    assert_eq!(lit.value(), "лиса\n");
}
155 
/// Raw string literals with different numbers of hashes. The expected `value` field is always
/// `None`, and `num_hashes` is `Some(n)` for a literal delimited by `n` hashes.
#[test]
fn raw_string() {
    check!(r"", false, Some(0));
    check!(r"a", false, Some(0));
    check!(r"peter", false, Some(0));
    check!(r"Sei gegrüßt, Bärthelt!", false, Some(0));
    check!(r"أنا لا أتحدث العربية", false, Some(0));
    check!(r"お前はもう死んでいる", false, Some(0));
    check!(r"Пушки - интересные музыкальные инструменты", false, Some(0));
    check!(r"lit 👌 😂 af", false, Some(0));

    check!(r#""#, false, Some(1));
    check!(r#"a"#, false, Some(1));
    check!(r##"peter"##, false, Some(2));
    check!(r###"Sei gegrüßt, Bärthelt!"###, false, Some(3));
    check!(r########"lit 👌 😂 af"########, false, Some(8));

    // Quotes and hashes inside the literal that do not form the closing delimiter.
    check!(r#"foo " bar"#, false, Some(1));
    check!(r##"foo " bar"##, false, Some(2));
    check!(r#"foo """" '"'" bar"#, false, Some(1));
    check!(r#""foo""#, false, Some(1));
    check!(r###""foo'"###, false, Some(3));
    check!(r#""x'#_#s'"#, false, Some(1));
    check!(r"#", false, Some(0));
    check!(r"foo#", false, Some(0));
    check!(r"##bar", false, Some(0));
    check!(r###""##foo"##bar'"###, false, Some(3));

    // Backslash sequences are plain text in raw strings.
    check!(r"さび\n\t\r\0\\x60\u{123}フェリス", false, Some(0));
    check!(r#"さび\n\t\r\0\\x60\u{123}フェリス"#, false, Some(1));
}
187 
/// Inputs that must be rejected, together with the expected error kind and, where given, the
/// expected position (a byte index or byte range into the input).
#[test]
fn parse_err() {
    // Missing closing quote.
    assert_err!(StringLit, r#"""#, UnterminatedString, None);
    assert_err!(StringLit, r#""犬"#, UnterminatedString, None);
    assert_err!(StringLit, r#""Jürgen"#, UnterminatedString, None);
    assert_err!(StringLit, r#""foo bar baz"#, UnterminatedString, None);

    // Trailing input after the closing delimiter. `🦊` occupies four bytes in UTF-8, which
    // the span `5..9` relies on.
    assert_err!(StringLit, r#""fox"peter"#, UnexpectedChar, 5..10);
    assert_err!(StringLit, r#""fox"peter""#, UnexpectedChar, 5..11);
    assert_err!(StringLit, r#""fox"🦊"#, UnexpectedChar, 5..9);
    assert_err!(StringLit, r###"r#"foo "# bar"#"###, UnexpectedChar, 9..15);

    // A carriage return that is not followed by a line feed.
    assert_err!(StringLit, "\"\r\"", IsolatedCr, 1);
    assert_err!(StringLit, "\"fo\rx\"", IsolatedCr, 3);
    assert_err!(StringLit, "r\"\r\"", IsolatedCr, 2);
    assert_err!(StringLit, "r\"fo\rx\"", IsolatedCr, 4);

    // Broken raw string delimiters.
    assert_err!(StringLit, r##"r####""##, UnterminatedRawString, None);
    assert_err!(StringLit, r#####"r##"foo"#bar"#####, UnterminatedRawString, None);
    assert_err!(StringLit, r##"r####"##, InvalidLiteral, None);
    assert_err!(StringLit, r##"r####x"##, InvalidLiteral, None);
}
210 
/// `\xNN` escapes with a value above `0x7F` must be rejected in string literals. The expected
/// span is the byte range of the four-byte escape sequence.
///
/// Offsets are in bytes: each Telugu character takes three bytes and `🦊` takes four.
#[test]
fn invald_ascii_escapes() {
    assert_err!(StringLit, r#""\x80""#, NonAsciiXEscape, 1..5);
    assert_err!(StringLit, r#""🦊\x81""#, NonAsciiXEscape, 5..9);
    assert_err!(StringLit, r#"" \x8a""#, NonAsciiXEscape, 2..6);
    assert_err!(StringLit, r#""\x8Ff""#, NonAsciiXEscape, 1..5);
    assert_err!(StringLit, r#""\xa0 ""#, NonAsciiXEscape, 1..5);
    assert_err!(StringLit, r#""నక్క\xB0""#, NonAsciiXEscape, 13..17);
    assert_err!(StringLit, r#""\xc3నక్క""#, NonAsciiXEscape, 1..5);
    assert_err!(StringLit, r#""\xDf🦊""#, NonAsciiXEscape, 1..5);
    assert_err!(StringLit, r#""నక్క\xffనక్క""#, NonAsciiXEscape, 13..17);
    assert_err!(StringLit, r#""\xfF ""#, NonAsciiXEscape, 1..5);
    assert_err!(StringLit, r#"" \xFf""#, NonAsciiXEscape, 2..6);
    assert_err!(StringLit, r#""నక్క  \xFF""#, NonAsciiXEscape, 15..19);
}
226 
/// Unknown, unterminated and malformed backslash escapes, with the expected error kind and
/// byte span.
///
/// Offsets are in bytes: each Telugu character takes three bytes and `🦊` takes four.
#[test]
fn invald_escapes() {
    assert_err!(StringLit, r#""\a""#, UnknownEscape, 1..3);
    assert_err!(StringLit, r#""foo\y""#, UnknownEscape, 4..6);
    // The input ends right after the backslash.
    assert_err!(StringLit, r#""\"#, UnterminatedString, None);
    assert_err!(StringLit, r#""\x""#, UnterminatedEscape, 1..3);
    assert_err!(StringLit, r#""🦊\x1""#, UnterminatedEscape, 5..8);
    assert_err!(StringLit, r#"" \xaj""#, InvalidXEscape, 2..6);
    assert_err!(StringLit, r#""నక్క\xjb""#, InvalidXEscape, 13..17);
}
237 
/// Malformed `\u{…}` escapes, with the expected error kind and position (a byte index or byte
/// range into the input).
///
/// Offsets are in bytes: each Telugu character takes three bytes and `🦊` takes four.
#[test]
fn invalid_unicode_escapes() {
    // `\u` that is not followed by an opening brace.
    assert_err!(StringLit, r#""\u""#, UnicodeEscapeWithoutBrace, 1..3);
    assert_err!(StringLit, r#""🦊\u ""#, UnicodeEscapeWithoutBrace, 5..7);
    assert_err!(StringLit, r#""\u3""#, UnicodeEscapeWithoutBrace, 1..3);

    // Missing closing brace.
    assert_err!(StringLit, r#""\u{""#, UnterminatedUnicodeEscape, 1..4);
    assert_err!(StringLit, r#""\u{12""#, UnterminatedUnicodeEscape, 1..6);
    assert_err!(StringLit, r#""🦊\u{a0b""#, UnterminatedUnicodeEscape, 5..11);
    assert_err!(StringLit, r#""\u{a0_b  ""#, UnterminatedUnicodeEscape, 1..10);

    // An underscore directly after the opening brace.
    assert_err!(StringLit, r#""\u{_}నక్క""#, InvalidStartOfUnicodeEscape, 4);
    assert_err!(StringLit, r#""\u{_5f}""#, InvalidStartOfUnicodeEscape, 4);

    // A character inside the braces that is not a hex digit; the index points at it.
    assert_err!(StringLit, r#""fox\u{x}""#, NonHexDigitInUnicodeEscape, 7);
    assert_err!(StringLit, r#""\u{0x}🦊""#, NonHexDigitInUnicodeEscape, 5);
    assert_err!(StringLit, r#""నక్క\u{3bx}""#, NonHexDigitInUnicodeEscape, 18);
    assert_err!(StringLit, r#""\u{3b_x}лиса""#, NonHexDigitInUnicodeEscape, 7);
    assert_err!(StringLit, r#""\u{4x_}""#, NonHexDigitInUnicodeEscape, 5);

    // More than six hex digits; the index points at the seventh digit.
    assert_err!(StringLit, r#""\u{1234567}""#, TooManyDigitInUnicodeEscape, 10);
    assert_err!(StringLit, r#""నక్క\u{1234567}🦊""#, TooManyDigitInUnicodeEscape, 22);
    assert_err!(StringLit, r#""నక్క\u{1_23_4_56_7}""#, TooManyDigitInUnicodeEscape, 26);
    assert_err!(StringLit, r#""\u{abcdef123}лиса""#, TooManyDigitInUnicodeEscape, 10);

    // Well-formed escape, but the value is not a valid `char` (above U+10FFFF).
    assert_err!(StringLit, r#""\u{110000}fox""#, InvalidUnicodeEscapeChar, 1..10);
}
265