Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 0 additions & 1 deletion Lib/test/test_json/test_decode.py
Original file line number Diff line number Diff line change
Expand Up @@ -18,7 +18,6 @@ def test_float(self):
self.assertIsInstance(rval, float)
self.assertEqual(rval, 1.0)

@unittest.skip("TODO: RUSTPYTHON; called `Result::unwrap()` on an `Err` value: ParseFloatError { kind: Invalid }")
def test_nonascii_digits_rejected(self):
# JSON specifies only ascii digits, see gh-125687
for num in ["1\uff10", "0.\uff10", "0e\uff10"]:
Expand Down
5 changes: 1 addition & 4 deletions Lib/test/test_json/test_fail.py
Original file line number Diff line number Diff line change
Expand Up @@ -239,7 +239,4 @@ def test_linecol(self):
(line, col, idx))

class TestPyFail(TestFail, PyTest): pass
class TestCFail(TestFail, CTest):
@unittest.expectedFailure # TODO: RUSTPYTHON
def test_failures(self):
return super().test_failures()
class TestCFail(TestFail, CTest): pass
57 changes: 39 additions & 18 deletions crates/stdlib/src/json.rs
Original file line number Diff line number Diff line change
Expand Up @@ -189,30 +189,51 @@ mod _json {

fn parse_number(&self, bytes: &[u8], vm: &VirtualMachine) -> Option<(PyResult, usize)> {
flame_guard!("JsonScanner::parse_number");
let mut has_neg = false;
let mut has_decimal = false;
let mut has_exponent = false;
let mut has_e_sign = false;
// RFC 8259 defines JSON numbers in ASCII syntax, including digits,
// '-', '.', 'e'/'E', and an optional exponent sign, so byte iteration
// is equivalent to char iteration here.
let mut i = 0;
// JSON numbers are ASCII per RFC 8259 (digits, '-', '+', '.', 'e', 'E'),
// so byte iteration is equivalent to char iteration here.
for &b in bytes {
match b {
b'-' if i == 0 => has_neg = true,
b'0'..=b'9' => {}
b'.' if !has_decimal => has_decimal = true,
b'e' | b'E' if !has_exponent => has_exponent = true,
b'+' | b'-' if !has_e_sign => has_e_sign = true,
_ => break,
}
if bytes.get(i) == Some(&b'-') {
i += 1;
}
if i == 0 || (i == 1 && has_neg) {
return None;
match bytes.get(i) {
Some(b'0') => i += 1,
Some(b'1'..=b'9') => {
i += 1;
while matches!(bytes.get(i), Some(b'0'..=b'9')) {
i += 1;
}
}
_ => return None,
}

let mut is_float = false;
if bytes.get(i) == Some(&b'.') && matches!(bytes.get(i + 1), Some(b'0'..=b'9')) {
is_float = true;
i += 2;
while matches!(bytes.get(i), Some(b'0'..=b'9')) {
i += 1;
}
}

if matches!(bytes.get(i), Some(b'e' | b'E')) {
let mut exponent_end = i + 1;
if matches!(bytes.get(exponent_end), Some(b'+' | b'-')) {
exponent_end += 1;
}
if matches!(bytes.get(exponent_end), Some(b'0'..=b'9')) {
is_float = true;
exponent_end += 1;
while matches!(bytes.get(exponent_end), Some(b'0'..=b'9')) {
exponent_end += 1;
}
i = exponent_end;
}
}

// SAFETY: the loop above accepts only ASCII bytes, so bytes[..i] is valid UTF-8.
let buf = unsafe { core::str::from_utf8_unchecked(&bytes[..i]) };
let ret = if has_decimal || has_exponent {
let ret = if is_float {
// float
if let Some(ref parse_float) = self.parse_float {
parse_float.call((buf,), vm)
Expand Down
Loading