use regex::Regex; use crate::parser::Sexpr::*; #[derive(Debug, Clone)] pub enum Sexpr { Int(i64), Float(f64), Str(String), Boolean(bool), Symbol(String), Cons(Box, Vec), Nil, } pub type ParseResult = Result; pub struct Parser { unparsed: Vec, position: usize, } impl Parser { pub fn new(src: Vec) -> Parser { Parser { unparsed: src, position: 0, } } fn peek(&mut self) -> Option { self.unparsed.get(self.position).cloned() } fn next(&mut self) -> Option { self.position += 1; self.unparsed.get(self.position - 1).cloned() } pub fn parse(&mut self) -> ParseResult { match self.peek() { Some(s) => match s.as_str() { ")" => Err(format!("Unexpected ')' at position {}", self.position)), "'" => { self.next(); Ok(Cons(Box::new(Str("quote".to_string())), vec![self.parse()?])) }, "(" => self.parse_sequence(")"), _ => self.parse_atom(), } None => return Err("Unexpected EOF".to_string()), } } fn parse_sequence(&mut self, end: &str) -> ParseResult { self.next(); let car = self.parse()?; let mut cdr = Vec::new(); loop { let token = match self.peek() { Some(token) => token, None => return Err(format!("Unexpected end of input, expected '{}'", end)), }; if token == end { break; } cdr.push(self.parse()?) } self.next(); Ok(Sexpr::Cons(Box::new(car), cdr)) } fn parse_atom(&mut self) -> ParseResult { let token = self.next().unwrap(); match token.as_str() { "null" => Ok(Nil), "true" => Ok(Boolean(true)), "false" => Ok(Boolean(false)), _ => { if Regex::new(r#"[+-]?([0-9]*[.])?[0-9]+"#).unwrap().is_match(&token) { Ok(Int(token.parse().unwrap())) } else if Regex::new(r#"[+-]?([0-9]*[.])?[0-9]+"#).unwrap().is_match(&token) { Ok(Float(token.parse().unwrap())) } else if Regex::new(r#""(?:\\.|[^\\"])*""#).unwrap().is_match(&token) { Ok(Str(token[1..token.len() - 1].to_string())) } else { Ok(Symbol(token)) } } } } } pub fn tokenize(str: &str) -> Vec { str.replace("(", " ( ") .replace(")", " ) ") .split_whitespace() .map(|s| s.to_string()) .collect() }