Skip to content

Commit

Permalink
Flowing errors in tokenizer atom-constructor functions through to parser
Browse files Browse the repository at this point in the history
  • Loading branch information
luketpeterson committed Mar 21, 2024
1 parent 819f49a commit fc7c18c
Show file tree
Hide file tree
Showing 4 changed files with 38 additions and 23 deletions.
20 changes: 10 additions & 10 deletions lib/src/metta/runner/arithmetics.rs
Original file line number Diff line number Diff line change
Expand Up @@ -56,14 +56,14 @@ impl Into<f64> for Number {
}

impl Number {
pub fn from_int_str(num: &str) -> Self {
let n = num.parse::<i64>().expect("Could not parse integer");
Self::Integer(n)
pub fn from_int_str(num: &str) -> Result<Self, String> {
let n = num.parse::<i64>().map_err(|e| format!("Could not parse integer: '{num}', {e}"))?;
Ok(Self::Integer(n))
}

pub fn from_float_str(num: &str) -> Self {
let n = num.parse::<f64>().expect("Could not parse float");
Self::Float(n)
pub fn from_float_str(num: &str) -> Result<Self, String> {
let n = num.parse::<f64>().map_err(|e| format!("Could not parse float: '{num}', {e}"))?;
Ok(Self::Float(n))
}

pub fn promote(a: Number, b: Number) -> (Number, Number) {
Expand Down Expand Up @@ -406,10 +406,10 @@ mod tests {

#[test]
fn number() {
assert_eq!(Number::from_int_str("12345"), Number::Integer(12345i64));
assert_eq!(Number::from_float_str("123.45"), Number::Float(123.45f64));
assert_eq!(Number::from_float_str("12345e-02"), Number::Float(123.45f64));
assert_eq!(Number::from_float_str("1.2345e+2"), Number::Float(123.45f64));
assert_eq!(Number::from_int_str("12345").unwrap(), Number::Integer(12345i64));
assert_eq!(Number::from_float_str("123.45").unwrap(), Number::Float(123.45f64));
assert_eq!(Number::from_float_str("12345e-02").unwrap(), Number::Float(123.45f64));
assert_eq!(Number::from_float_str("1.2345e+2").unwrap(), Number::Float(123.45f64));
assert_eq!(format!("{}", Number::Integer(12345i64)), "12345");
assert_eq!(format!("{}", Number::Float(123.45f64)), "123.45");
}
Expand Down
12 changes: 6 additions & 6 deletions lib/src/metta/runner/stdlib.rs
Original file line number Diff line number Diff line change
Expand Up @@ -1415,12 +1415,12 @@ mod non_minimal_only_stdlib {
let mut rust_tokens = Tokenizer::new();
let tref = &mut rust_tokens;

tref.register_token(regex(r"[\-\+]?\d+"),
|token| { Atom::gnd(Number::from_int_str(token)) });
tref.register_token(regex(r"[\-\+]?\d+\.\d+"),
|token| { Atom::gnd(Number::from_float_str(token)) });
tref.register_token(regex(r"[\-\+]?\d+(\.\d+)?[eE][\-\+]?\d+"),
|token| { Atom::gnd(Number::from_float_str(token)) });
tref.register_fallible_token(regex(r"[\-\+]?\d+"),
|token| { Ok(Atom::gnd(Number::from_int_str(token)?)) });
tref.register_fallible_token(regex(r"[\-\+]?\d+\.\d+"),
|token| { Ok(Atom::gnd(Number::from_float_str(token)?)) });
tref.register_fallible_token(regex(r"[\-\+]?\d+(\.\d+)?[eE][\-\+]?\d+"),
|token| { Ok(Atom::gnd(Number::from_float_str(token)?)) });
tref.register_token(regex(r"True|False"),
|token| { Atom::gnd(Bool::from_str(token)) });
let sum_op = Atom::gnd(SumOp{});
Expand Down
12 changes: 6 additions & 6 deletions lib/src/metta/runner/stdlib_minimal.rs
Original file line number Diff line number Diff line change
Expand Up @@ -428,12 +428,12 @@ pub fn register_rust_stdlib_tokens(target: &mut Tokenizer) {
let mut rust_tokens = Tokenizer::new();
let tref = &mut rust_tokens;

tref.register_token(regex(r"[\-\+]?\d+"),
|token| { Atom::gnd(Number::from_int_str(token)) });
tref.register_token(regex(r"[\-\+]?\d+\.\d+"),
|token| { Atom::gnd(Number::from_float_str(token)) });
tref.register_token(regex(r"[\-\+]?\d+(\.\d+)?[eE][\-\+]?\d+"),
|token| { Atom::gnd(Number::from_float_str(token)) });
tref.register_fallible_token(regex(r"[\-\+]?\d+"),
|token| { Ok(Atom::gnd(Number::from_int_str(token)?)) });
tref.register_fallible_token(regex(r"[\-\+]?\d+\.\d+"),
|token| { Ok(Atom::gnd(Number::from_float_str(token)?)) });
tref.register_fallible_token(regex(r"[\-\+]?\d+(\.\d+)?[eE][\-\+]?\d+"),
|token| { Ok(Atom::gnd(Number::from_float_str(token)?)) });
tref.register_token(regex(r"True|False"),
|token| { Atom::gnd(Bool::from_str(token)) });
let sum_op = Atom::gnd(SumOp{});
Expand Down
17 changes: 16 additions & 1 deletion lib/src/metta/text.rs
Original file line number Diff line number Diff line change
Expand Up @@ -194,7 +194,8 @@ impl SyntaxNode {
let token_text = self.parsed_text.as_ref().unwrap();
let constr = tokenizer.find_token(token_text);
if let Some(constr) = constr {
let new_atom = constr(token_text).unwrap(); //TODO, If the Tokenizer's atom constructor throws an error, then gracefully alert the user
let new_atom = constr(token_text)
.map_err(|e| format!("byte range = ({:?}) | {e}", self.src_range))?;
Ok(Some(new_atom))
} else {
let new_atom = Atom::sym(token_text);
Expand Down Expand Up @@ -663,6 +664,20 @@ mod tests {
assert_eq!(Err(String::from("Unexpected right bracket")), parser.parse(&Tokenizer::new()));
}

#[test]
fn test_error_from_tokenizer() {
//NOTE: This test relies on an intentional bug in the regex, so that it will accept an invalid
// float. However it could be hit in legitimate cases, such as an integer that overflows the
// type's capacity before we implement bigint, or any type where the representation's actual
// contours can't be captured by a regex.
let mut tokenizer = Tokenizer::new();
tokenizer.register_fallible_token(Regex::new(r"[\-\+]?\d+.\d+").unwrap(),
|token| Ok(Atom::gnd(metta::runner::arithmetics::Number::from_float_str(token)?))
);
let mut parser = SExprParser::new("12345678901234567:8901234567890");
assert!(parser.parse(&tokenizer).is_err());
}

#[test]
fn test_comment_base() {
let program = ";(a 4)
Expand Down

0 comments on commit fc7c18c

Please sign in to comment.