Skip to content

Commit 34b32b0

Browse files
committed
Use Mode less.
`Mode` is passed to numerous places where we just need an `is_byte` bool. Passing the bool instead avoids the need for some assertions. Also rename `is_bytes()` to `is_byte()`, to better match `Mode::Byte`, `Mode::ByteStr`, and `Mode::RawByteStr`.
1 parent 84ca2c3 commit 34b32b0

File tree

2 files changed

+29
-31
lines changed

2 files changed

+29
-31
lines changed

compiler/rustc_lexer/src/unescape.rs

Lines changed: 22 additions & 24 deletions
Original file line numberDiff line numberDiff line change
@@ -85,14 +85,16 @@ where
8585
match mode {
8686
Mode::Char | Mode::Byte => {
8787
let mut chars = src.chars();
88-
let result = unescape_char_or_byte(&mut chars, mode);
88+
let result = unescape_char_or_byte(&mut chars, mode == Mode::Byte);
8989
// The Chars iterator moved forward.
9090
callback(0..(src.len() - chars.as_str().len()), result);
9191
}
92-
Mode::Str | Mode::ByteStr => unescape_str_or_byte_str(src, mode, callback),
92+
Mode::Str | Mode::ByteStr => unescape_str_or_byte_str(src, mode == Mode::ByteStr, callback),
9393
// NOTE: Raw strings do not perform any explicit character escaping, here we
9494
// only translate CRLF to LF and produce errors on bare CR.
95-
Mode::RawStr | Mode::RawByteStr => unescape_raw_str_or_raw_byte_str(src, mode, callback),
95+
Mode::RawStr | Mode::RawByteStr => {
96+
unescape_raw_str_or_raw_byte_str(src, mode == Mode::RawByteStr, callback)
97+
}
9698
}
9799
}
98100

@@ -103,7 +105,7 @@ pub fn unescape_byte_literal<F>(src: &str, mode: Mode, callback: &mut F)
103105
where
104106
F: FnMut(Range<usize>, Result<u8, EscapeError>),
105107
{
106-
debug_assert!(mode.is_bytes());
108+
debug_assert!(mode.is_byte());
107109
unescape_literal(src, mode, &mut |range, result| {
108110
callback(range, result.map(byte_from_char));
109111
})
@@ -113,15 +115,14 @@ where
113115
/// unescaped char or an error
114116
pub fn unescape_char(src: &str) -> Result<char, (usize, EscapeError)> {
115117
let mut chars = src.chars();
116-
unescape_char_or_byte(&mut chars, Mode::Char)
117-
.map_err(|err| (src.len() - chars.as_str().len(), err))
118+
unescape_char_or_byte(&mut chars, false).map_err(|err| (src.len() - chars.as_str().len(), err))
118119
}
119120

120121
/// Takes the contents of a byte literal (without quotes), and returns an
121122
/// unescaped byte or an error.
122123
pub fn unescape_byte(src: &str) -> Result<u8, (usize, EscapeError)> {
123124
let mut chars = src.chars();
124-
unescape_char_or_byte(&mut chars, Mode::Byte)
125+
unescape_char_or_byte(&mut chars, true)
125126
.map(byte_from_char)
126127
.map_err(|err| (src.len() - chars.as_str().len(), err))
127128
}
@@ -145,15 +146,15 @@ impl Mode {
145146
}
146147
}
147148

148-
pub fn is_bytes(self) -> bool {
149+
pub fn is_byte(self) -> bool {
149150
match self {
150151
Mode::Byte | Mode::ByteStr | Mode::RawByteStr => true,
151152
Mode::Char | Mode::Str | Mode::RawStr => false,
152153
}
153154
}
154155
}
155156

156-
fn scan_escape(chars: &mut Chars<'_>, mode: Mode) -> Result<char, EscapeError> {
157+
fn scan_escape(chars: &mut Chars<'_>, is_byte: bool) -> Result<char, EscapeError> {
157158
// Previous character was '\\', unescape what follows.
158159
let res = match chars.next().ok_or(EscapeError::LoneSlash)? {
159160
'"' => '"',
@@ -176,7 +177,7 @@ fn scan_escape(chars: &mut Chars<'_>, mode: Mode) -> Result<char, EscapeError> {
176177
let value = hi * 16 + lo;
177178

178179
// For a non-byte literal verify that it is within ASCII range.
179-
if !mode.is_bytes() && !is_ascii(value) {
180+
if !is_byte && !is_ascii(value) {
180181
return Err(EscapeError::OutOfRangeHexEscape);
181182
}
182183
let value = value as u8;
@@ -212,7 +213,7 @@ fn scan_escape(chars: &mut Chars<'_>, mode: Mode) -> Result<char, EscapeError> {
212213

213214
// Incorrect syntax has higher priority for error reporting
214215
// than unallowed value for a literal.
215-
if mode.is_bytes() {
216+
if is_byte {
216217
return Err(EscapeError::UnicodeEscapeInByte);
217218
}
218219

@@ -244,23 +245,22 @@ fn scan_escape(chars: &mut Chars<'_>, mode: Mode) -> Result<char, EscapeError> {
244245
}
245246

246247
#[inline]
247-
fn ascii_check(c: char, mode: Mode) -> Result<char, EscapeError> {
248-
if mode.is_bytes() && !c.is_ascii() {
248+
fn ascii_check(c: char, is_byte: bool) -> Result<char, EscapeError> {
249+
if is_byte && !c.is_ascii() {
249250
// Byte literal can't be a non-ascii character.
250251
Err(EscapeError::NonAsciiCharInByte)
251252
} else {
252253
Ok(c)
253254
}
254255
}
255256

256-
fn unescape_char_or_byte(chars: &mut Chars<'_>, mode: Mode) -> Result<char, EscapeError> {
257-
debug_assert!(mode == Mode::Char || mode == Mode::Byte);
257+
fn unescape_char_or_byte(chars: &mut Chars<'_>, is_byte: bool) -> Result<char, EscapeError> {
258258
let c = chars.next().ok_or(EscapeError::ZeroChars)?;
259259
let res = match c {
260-
'\\' => scan_escape(chars, mode),
260+
'\\' => scan_escape(chars, is_byte),
261261
'\n' | '\t' | '\'' => Err(EscapeError::EscapeOnlyChar),
262262
'\r' => Err(EscapeError::BareCarriageReturn),
263-
_ => ascii_check(c, mode),
263+
_ => ascii_check(c, is_byte),
264264
}?;
265265
if chars.next().is_some() {
266266
return Err(EscapeError::MoreThanOneChar);
@@ -270,11 +270,10 @@ fn unescape_char_or_byte(chars: &mut Chars<'_>, mode: Mode) -> Result<char, Esca
270270

271271
/// Takes the contents of a string literal (without quotes) and produces a
272272
/// sequence of escaped characters or errors.
273-
fn unescape_str_or_byte_str<F>(src: &str, mode: Mode, callback: &mut F)
273+
fn unescape_str_or_byte_str<F>(src: &str, is_byte: bool, callback: &mut F)
274274
where
275275
F: FnMut(Range<usize>, Result<char, EscapeError>),
276276
{
277-
debug_assert!(mode == Mode::Str || mode == Mode::ByteStr);
278277
let mut chars = src.chars();
279278

280279
// The `start` and `end` computation here is complicated because
@@ -293,14 +292,14 @@ where
293292
skip_ascii_whitespace(&mut chars, start, callback);
294293
continue;
295294
}
296-
_ => scan_escape(&mut chars, mode),
295+
_ => scan_escape(&mut chars, is_byte),
297296
}
298297
}
299298
'\n' => Ok('\n'),
300299
'\t' => Ok('\t'),
301300
'"' => Err(EscapeError::EscapeOnlyChar),
302301
'\r' => Err(EscapeError::BareCarriageReturn),
303-
_ => ascii_check(c, mode),
302+
_ => ascii_check(c, is_byte),
304303
};
305304
let end = src.len() - chars.as_str().len();
306305
callback(start..end, result);
@@ -337,11 +336,10 @@ where
337336
/// sequence of characters or errors.
338337
/// NOTE: Raw strings do not perform any explicit character escaping, here we
339338
/// only translate CRLF to LF and produce errors on bare CR.
340-
fn unescape_raw_str_or_raw_byte_str<F>(src: &str, mode: Mode, callback: &mut F)
339+
fn unescape_raw_str_or_raw_byte_str<F>(src: &str, is_byte: bool, callback: &mut F)
341340
where
342341
F: FnMut(Range<usize>, Result<char, EscapeError>),
343342
{
344-
debug_assert!(mode == Mode::RawStr || mode == Mode::RawByteStr);
345343
let mut chars = src.chars();
346344

347345
// The `start` and `end` computation here matches the one in
@@ -351,7 +349,7 @@ where
351349
let start = src.len() - chars.as_str().len() - c.len_utf8();
352350
let result = match c {
353351
'\r' => Err(EscapeError::BareCarriageReturnInRawString),
354-
c if mode.is_bytes() && !c.is_ascii() => Err(EscapeError::NonAsciiCharInByteString),
352+
c if is_byte && !c.is_ascii() => Err(EscapeError::NonAsciiCharInByteString),
355353
c => Ok(c),
356354
};
357355
let end = src.len() - chars.as_str().len();

compiler/rustc_parse/src/lexer/unescape_error_reporting.rs

Lines changed: 7 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -108,7 +108,7 @@ pub(crate) fn emit_unescape_error(
108108
}
109109

110110
if !has_help {
111-
let (prefix, msg) = if mode.is_bytes() {
111+
let (prefix, msg) = if mode.is_byte() {
112112
("b", "if you meant to write a byte string literal, use double quotes")
113113
} else {
114114
("", "if you meant to write a `str` literal, use double quotes")
@@ -142,7 +142,7 @@ pub(crate) fn emit_unescape_error(
142142
EscapeError::EscapeOnlyChar => {
143143
let (c, char_span) = last_char();
144144

145-
let msg = if mode.is_bytes() {
145+
let msg = if mode.is_byte() {
146146
"byte constant must be escaped"
147147
} else {
148148
"character constant must be escaped"
@@ -182,11 +182,11 @@ pub(crate) fn emit_unescape_error(
182182
let (c, span) = last_char();
183183

184184
let label =
185-
if mode.is_bytes() { "unknown byte escape" } else { "unknown character escape" };
185+
if mode.is_byte() { "unknown byte escape" } else { "unknown character escape" };
186186
let ec = escaped_char(c);
187187
let mut diag = handler.struct_span_err(span, &format!("{}: `{}`", label, ec));
188188
diag.span_label(span, label);
189-
if c == '{' || c == '}' && !mode.is_bytes() {
189+
if c == '{' || c == '}' && !mode.is_byte() {
190190
diag.help(
191191
"if used in a formatting string, curly braces are escaped with `{{` and `}}`",
192192
);
@@ -196,7 +196,7 @@ pub(crate) fn emit_unescape_error(
196196
version control settings",
197197
);
198198
} else {
199-
if !mode.is_bytes() {
199+
if !mode.is_byte() {
200200
diag.span_suggestion(
201201
span_with_quotes,
202202
"if you meant to write a literal backslash (perhaps escaping in a regular expression), consider a raw string literal",
@@ -231,7 +231,7 @@ pub(crate) fn emit_unescape_error(
231231
.emit();
232232
}
233233
EscapeError::NonAsciiCharInByte => {
234-
assert!(mode.is_bytes());
234+
assert!(mode.is_byte());
235235
let (c, span) = last_char();
236236
let mut err = handler.struct_span_err(span, "non-ASCII character in byte constant");
237237
let postfix = if unicode_width::UnicodeWidthChar::width(c).unwrap_or(1) == 0 {
@@ -271,7 +271,7 @@ pub(crate) fn emit_unescape_error(
271271
err.emit();
272272
}
273273
EscapeError::NonAsciiCharInByteString => {
274-
assert!(mode.is_bytes());
274+
assert!(mode.is_byte());
275275
let (c, span) = last_char();
276276
let postfix = if unicode_width::UnicodeWidthChar::width(c).unwrap_or(1) == 0 {
277277
format!(" but is {:?}", c)

0 commit comments

Comments
 (0)