mirror of
				https://github.com/rm-dr/daisy
				synced 2025-10-26 12:04:27 -07:00 
			
		
		
		
	
		
			
				
	
	
		
			199 lines
		
	
	
		
			4.5 KiB
		
	
	
	
		
			Rust
		
	
	
	
	
	
			
		
		
	
	
			199 lines
		
	
	
		
			4.5 KiB
		
	
	
	
		
			Rust
		
	
	
	
	
	
| use std::collections::VecDeque;
 | ||
| use crate::context::Context;
 | ||
| 
 | ||
| use super::super::{
 | ||
| 	Token,
 | ||
| 	LineLocation,
 | ||
| 	Operator
 | ||
| };
 | ||
| 
 | ||
| // Called whenever a token is finished.
 | ||
| #[inline(always)]
 | ||
| fn push_token(
 | ||
| 	context: &Context,
 | ||
| 	g: &mut VecDeque<Token>,
 | ||
| 	t: Option<Token>,
 | ||
| 	stop_i: usize
 | ||
| ) {
 | ||
| 
 | ||
| 	if t.is_none() { return }
 | ||
| 	let mut t = t.unwrap();
 | ||
| 
 | ||
| 	match t {
 | ||
| 		Token::TupleDelim(ref mut l)
 | ||
| 		| Token::GroupStart(ref mut l)
 | ||
| 		| Token::GroupEnd(ref mut l)
 | ||
| 		| Token::Operator(ref mut l, _)
 | ||
| 		| Token::Quantity(ref mut l, _)
 | ||
| 		| Token::Word(ref mut l, _)
 | ||
| 		=> {
 | ||
| 			*l = LineLocation{
 | ||
| 				pos: l.pos,
 | ||
| 				len: stop_i - l.pos,
 | ||
| 			};
 | ||
| 		},
 | ||
| 
 | ||
| 		Token::Group(_,_)
 | ||
| 		| Token::Tuple(_,_)
 | ||
| 		| Token::Container(_)
 | ||
| 		=> unreachable!()
 | ||
| 	};
 | ||
| 
 | ||
| 
 | ||
| 	// `2e` isn't exponential notation, it's 2*e.
 | ||
| 	// If a number ends in `e`, disconnect the `e` and make it a word.
 | ||
| 	if let Token::Quantity(l, s) = &t {
 | ||
| 		let last = &s[s.len()-1..];
 | ||
| 		if last == "e" {
 | ||
| 			g.push_back(Token::Quantity(
 | ||
| 				LineLocation { pos: l.pos, len: l.len-1 },
 | ||
| 				String::from(&s[0..s.len()-1])
 | ||
| 			));
 | ||
| 			g.push_back(Token::Word(
 | ||
| 				LineLocation { pos: l.pos + l.len - 1, len: 1 },
 | ||
| 				String::from("e")
 | ||
| 			));
 | ||
| 
 | ||
| 			return;
 | ||
| 		}
 | ||
| 	}
 | ||
| 
 | ||
| 	// Some operators are written as words.
 | ||
| 	if let Token::Word(l, s) = &t {
 | ||
| 		if Operator::from_string(context, s).is_some() {
 | ||
| 			t = Token::Operator(*l, s.clone());
 | ||
| 		}
 | ||
| 	}
 | ||
| 
 | ||
| 	g.push_back(t);
 | ||
| }
 | ||
| 
 | ||
| /// Turns a string into Tokens. First stage of parsing.
 | ||
| pub fn tokenize(context: &Context, input: &String) -> VecDeque<Token> {
 | ||
| 	let mut t: Option<Token> = None; // The current token we're reading
 | ||
| 	let mut g: VecDeque<Token> = VecDeque::with_capacity(32);
 | ||
| 
 | ||
| 
 | ||
| 	for (i, c) in input.chars().enumerate() {
 | ||
| 		match c {
 | ||
| 			// Numbers
 | ||
| 			'.' | '0'..='9' => {
 | ||
| 				match &mut t {
 | ||
| 					// If we're already building a number,
 | ||
| 					// append.
 | ||
| 					Some(Token::Quantity(_, val)) => {
 | ||
| 						val.push(if c == ',' {'.'} else {c});
 | ||
| 					},
 | ||
| 
 | ||
| 					// If we're not building a number, finalize
 | ||
| 					// previous token and start one.
 | ||
| 					_ => {
 | ||
| 						push_token(context, &mut g, t, i);
 | ||
| 						t = Some(Token::Quantity(LineLocation{pos: i, len: 0}, String::from(c)));
 | ||
| 					}
 | ||
| 				};
 | ||
| 			},
 | ||
| 
 | ||
| 			// 'e' needs special treatment.
 | ||
| 			// Can be both a word or a number.
 | ||
| 			'e' => {
 | ||
| 				match &mut t {
 | ||
| 					Some(Token::Word(_, val)) => { val.push(c); },
 | ||
| 					Some(Token::Quantity(_, val)) => { val.push(c); },
 | ||
| 
 | ||
| 					_ => {
 | ||
| 						push_token(context, &mut g, t, i);
 | ||
| 						t = Some(Token::Word(LineLocation{pos: i, len: 0}, String::from(c)));
 | ||
| 					}
 | ||
| 				};
 | ||
| 			}
 | ||
| 
 | ||
| 			// The minus sign also needs special treatment.
 | ||
| 			// It can be the `neg` operator, the `minus` operator,
 | ||
| 			// or it can specify a negative exponent.
 | ||
| 			'-' | '+' => {
 | ||
| 				match &mut t {
 | ||
| 					Some(Token::Quantity(_, val)) => {
 | ||
| 						if &val[val.len()-1..] == "e" {
 | ||
| 							// If the current number ends in an `e`,
 | ||
| 							// this negative specifies a negative exponent
 | ||
| 							// like 2e-2 = 0.02.
 | ||
| 							val.push(c);
 | ||
| 						} else {
 | ||
| 							// Otherwise, end the number.
 | ||
| 							// We probably have a subtraction.
 | ||
| 							push_token(context, &mut g, t, i);
 | ||
| 							t = Some(Token::Operator(
 | ||
| 								LineLocation{pos: i, len: 1},
 | ||
| 								String::from(c)
 | ||
| 							));
 | ||
| 						}
 | ||
| 					},
 | ||
| 
 | ||
| 					// This may be a negative or a subtraction.
 | ||
| 					// Multi-character operators with - and + are NOT supported!
 | ||
| 					// (for example, we can't use -> for unit conversion)
 | ||
| 					_ => {
 | ||
| 						push_token(context, &mut g, t, i);
 | ||
| 						t = Some(Token::Operator(
 | ||
| 							LineLocation{pos: i, len: 1},
 | ||
| 							String::from(c)
 | ||
| 						));
 | ||
| 					}
 | ||
| 				};
 | ||
| 			},
 | ||
| 
 | ||
| 			',' => {
 | ||
| 				push_token(context, &mut g, t, i);
 | ||
| 				t = Some(Token::TupleDelim(LineLocation{pos: i, len: 1}));
 | ||
| 			},
 | ||
| 
 | ||
| 			// Operator
 | ||
| 			'^'|'!'|'%'|'\\'|
 | ||
| 			'*'|'×'|'/'|'÷'|
 | ||
| 			'>'|'<'|'?'|'@'|
 | ||
| 			'&'|'|'|'~'
 | ||
| 			=> {
 | ||
| 				match &mut t {
 | ||
| 					Some(Token::Operator(_, val)) => { val.push(c); },
 | ||
| 					_ => {
 | ||
| 						push_token(context, &mut g, t, i);
 | ||
| 						t = Some(Token::Operator(LineLocation{pos: i, len: 0}, String::from(c)));
 | ||
| 					}
 | ||
| 				};
 | ||
| 			},
 | ||
| 
 | ||
| 			// Group
 | ||
| 			'(' => {
 | ||
| 				push_token(context, &mut g, t, i);
 | ||
| 				t = Some(Token::GroupStart(LineLocation{pos: i, len: 0}));
 | ||
| 			},
 | ||
| 			')' => {
 | ||
| 				push_token(context, &mut g, t, i);
 | ||
| 				t = Some(Token::GroupEnd(LineLocation{pos: i, len: 0}));
 | ||
| 			},
 | ||
| 
 | ||
| 			// Space. Basic seperator.
 | ||
| 			' ' => {
 | ||
| 				push_token(context, &mut g, t, i);
 | ||
| 				t = None;
 | ||
| 			}
 | ||
| 
 | ||
| 			// Word
 | ||
| 			_ => {
 | ||
| 				match &mut t {
 | ||
| 					Some(Token::Word(_, val)) => { val.push(c); },
 | ||
| 
 | ||
| 					_ => {
 | ||
| 						push_token(context, &mut g, t, i);
 | ||
| 						t = Some(Token::Word(LineLocation{pos: i, len: 0}, String::from(c)));
 | ||
| 					}
 | ||
| 				};
 | ||
| 			}
 | ||
| 		};
 | ||
| 	}
 | ||
| 
 | ||
| 	push_token(context, &mut g, t, input.chars().count());
 | ||
| 
 | ||
| 	return g;
 | ||
| } |