From a4db9df058c5ab20a461526a0d00a477b98d77ca Mon Sep 17 00:00:00 2001
From: Kasper <kasperkh.kh@gmail.com>
Date: Sat, 21 Dec 2019 16:49:37 +0100
Subject: [PATCH] Added units

---
 src/lexer.rs  | 20 ++++++++++++++++++--
 src/main.rs   | 19 +++++++++++++++++--
 src/parser.rs | 38 ++++++++++++++++++++++++++++----------
 3 files changed, 63 insertions(+), 14 deletions(-)
diff --git a/src/lexer.rs b/src/lexer.rs
index e71fc29..bff1677 100644
--- a/src/lexer.rs
+++ b/src/lexer.rs
@@ -5,7 +5,7 @@ use crate::Operator::{Percent, Caret, Divide, Factorial, LeftParen, Minus, Modul
 use crate::TextOperator::{Of, To};
 use crate::Constant::{E, Pi};
 use crate::FunctionIdentifier::{Acos, Acosh, Asin, Asinh, Atan, Atanh, Cbrt, Ceil, Cos, Cosh, Exp, Fabs, Floor, Ln, Log, Round, Sin, Sinh, Sqrt, Tan, Tanh};
-use crate::Unit::{Normal};
+use crate::Unit::*;
 
 pub fn lex(input: &str) -> Result<TokenVector, String> {
 
@@ -92,6 +92,22 @@ pub fn lex(input: &str) -> Result<TokenVector, String> {
           "asinh" => tokens.push(Token::FunctionIdentifier(Asinh)),
           "acosh" => tokens.push(Token::FunctionIdentifier(Acosh)),
           "atanh" => tokens.push(Token::FunctionIdentifier(Atanh)),
+
+          "ns" | "nanosecond" | "nanoseconds" => tokens.push(Token::Unit(Nanosecond)),
+          "μs" | "us" | "microsecond" | "microseconds" => tokens.push(Token::Unit(Microsecond)),
+          "ms" | "millisecond" | "milliseconds" => tokens.push(Token::Unit(Millisecond)),
+          "s" | "sec" | "second" | "seconds" => tokens.push(Token::Unit(Second)),
+          "min" | "minute" | "minutes" => tokens.push(Token::Unit(Minute)),
+          "h" | "hour" | "hours" => tokens.push(Token::Unit(Hour)),
+          "day" | "days" => tokens.push(Token::Unit(Day)),
+          "week" | "weeks" => tokens.push(Token::Unit(Week)),
+          "mo" | "month" | "months" => tokens.push(Token::Unit(Month)),
+          "q" | "quarter" | "quarters" => tokens.push(Token::Unit(Quarter)), // quarters get their own variant, not Month
+          "yr" | "year" | "years" => tokens.push(Token::Unit(Year)),
+          "decade" | "decades" => tokens.push(Token::Unit(Decade)),
+          "century" | "centuries" => tokens.push(Token::Unit(Century)),
+          "millennium" | "millennia" | "millenium" | "milleniums" => tokens.push(Token::Unit(Milleniums)), // misspellings kept as aliases
+          
           _ => {
             return Err(format!("Invalid string: {}", string));
           }
@@ -116,7 +132,7 @@ pub fn lex(input: &str) -> Result<TokenVector, String> {
         match d128::from_str(number_string) {
           Ok(number) => {
             if d128::get_status().is_empty() {
-              tokens.push(Token::Number((number, Normal)));
+              tokens.push(Token::Number(number));
             } else {
               return Err(format!("Error parsing d128 number: {}", number_string));
             }
diff --git a/src/main.rs b/src/main.rs
index 42b986b..fad85c3 100644
--- a/src/main.rs
+++ b/src/main.rs
@@ -57,17 +57,32 @@ pub enum FunctionIdentifier {
 
 #[derive(Clone, Copy, Debug)]
 pub enum Unit {
-  Normal,
+  Nanosecond, // time units; variants are listed from shortest to longest
+  Microsecond,
+  Millisecond,
+  Second,
+  Minute,
+  Hour,
+  Day,
+  Week,
+  Month,
+  Quarter,
+  Year,
+  Decade,
+  Century,
+  Milleniums, // NOTE(review): plural and misspelled, unlike the other variants; consider renaming to `Millennium`
 }
 
 #[derive(Clone, Debug)]
 pub enum Token {
   Operator(Operator),
-  Number((d128, Unit)),
+  Number(d128), // bare numeric value; a unit, if any, is a separate `Unit` token
   FunctionIdentifier(FunctionIdentifier),
   Constant(Constant),
   Paren, // parser only
   TextOperator(TextOperator),
+  Negative, // parser only: unary minus node wrapping the operand that follows it
+  Unit(Unit), // unit word such as "ms" or "hours", emitted by the lexer
 }
 
 pub type TokenVector = Vec<Token>;
diff --git a/src/parser.rs b/src/parser.rs
index e36f2bf..d175801 100644
--- a/src/parser.rs
+++ b/src/parser.rs
@@ -6,14 +6,14 @@ use crate::TextOperator::{To, Of};
 #[derive(Debug)]
 pub struct AstNode {
     children: Vec<AstNode>,
-    entry: Token,
+    token: Token, // the token this node was constructed from (see `AstNode::new`)
 }
 
 impl AstNode {
   pub fn new(token: Token) -> AstNode {
     AstNode {
       children: Vec::new(),
-      entry: token,
+      token, // field-init shorthand; the node starts with no children
     }
   }
 }
@@ -118,12 +118,11 @@ fn parse_level_4(tokens: &TokenVector, pos: usize) -> Result<(AstNode, usize), S
 
 // level 5 precedence: !, percent
 fn parse_level_5(tokens: &TokenVector, pos: usize) -> Result<(AstNode, usize), String> {
-  let (mut node, mut pos) = parse_level_6(tokens, pos)?;
+  let (mut node, mut pos) = parse_level_6(tokens, pos, None)?;
   loop {
     let token = tokens.get(pos);
     match token {
       Some(&Token::Operator(Factorial)) | Some(&Token::Operator(Percent)) => {
-        
         // Here we are handling unary operators, aka stuff written as
         // "Number Operator" (3!) instead of "Number Operator Number" (3+3).
         // Therefore, if we find a match, we don't parse what comes after it.
@@ -132,8 +131,14 @@ fn parse_level_5(tokens: &TokenVector, pos: usize) -> Result<(AstNode, usize), S
         node = new_node;
         pos += 1;
       },
+      Some(&Token::Unit(_unit)) => {
+        // We won't allow units to repeat, like "1min min", so we end the loop if it's found.
+        let mut new_node = AstNode::new(token.unwrap().clone());
+        new_node.children.push(node);
+        return Ok((new_node, pos + 1));
+      },
       _ => {
-        // let's say we parse 1+2. parse_level_6 then returns 1, and token
+        // let's say we parse 1+2. parse_level_6 then returns 1, and token
         // is set to plus. Plus has lower precedence than level 4, so we
         // don't do anything, and pass the number down to a lower precedence.
         return Ok((node, pos));
@@ -143,13 +148,28 @@ fn parse_level_5(tokens: &TokenVector, pos: usize) -> Result<(AstNode, usize), S
 }
 
 // level 6 precedence: numbers, parens
-fn parse_level_6(tokens: &TokenVector, pos: usize) -> Result<(AstNode, usize), String> {
+fn parse_level_6(tokens: &TokenVector, pos: usize, last_token: Option<Token>) -> Result<(AstNode, usize), String> {
   let token: &Token = tokens.get(pos).expect(&format!("Unexpected end of input at {}", pos));
   match token {
-    &Token::Number((_number, _unit)) => {
+    Token::Operator(Minus) => {
+      if let None = last_token {
+        let (right_node, next_pos) = parse_level_6(tokens, pos + 1, Some(Token::Operator(Minus)))?;
+        let mut new_node = AstNode::new(Token::Negative);
+        new_node.children.push(right_node);
+        Ok((new_node, next_pos))
+      } else {
+        // 3-1 might end up here?
+        return Err(format!("Unexpected unary operator {0:?} at {1}", token, pos));
+      }
+    },
+    &Token::Number(_number) => {
       let node = AstNode::new(token.clone());
       Ok((node, pos + 1))
     },
+    &Token::Unit(_unit) => {
+      let node = AstNode::new(token.clone());
+      Ok((node, pos + 1))
+    }
     Token::Constant(_constant) => {
       let node = AstNode::new(token.clone());
       Ok((node, pos + 1))
@@ -157,7 +177,7 @@ fn parse_level_6(tokens: &TokenVector, pos: usize) -> Result<(AstNode, usize), S
     Token::FunctionIdentifier(_function_identifier) => {
       let left_paren_pos = pos + 1;
       let left_paren_token = tokens.get(left_paren_pos);
-      // check if ( comes after function identifier, like log(
+      // check if '(' comes after function identifier, like 'log('
       match left_paren_token {
         Some(&Token::Operator(LeftParen)) => {
           // parse everything inside as you would with normal parentheses,
@@ -176,8 +196,6 @@ fn parse_level_6(tokens: &TokenVector, pos: usize) -> Result<(AstNode, usize), S
           return Err(format!("Expected ( after {} at {:?} but found {:?}", left_paren_pos, token, left_paren_token));
         }
       }
-
-      // Ok((node, pos + 1))
     },
     Token::Operator(LeftParen) => {
       parse_level_1(tokens, pos + 1).and_then(|(node, next_pos)| {