moved all crates into seperate folder + related path fixes

2025-10-01 07:41:12 +00:00 · 2022-07-01 17:37:43 +02:00 · 2022-07-01 17:37:43 +02:00 · eee85fa45d
commit eee85fa45d
parent 12ef03bb86
1063 changed files with 92 additions and 93 deletions
--- a/crates/compiler/parse/src/number_literal.rs
+++ b/crates/compiler/parse/src/number_literal.rs
@ -0,0 +1,161 @@
+use crate::ast::Base;
+use crate::parser::{ENumber, ParseResult, Parser, Progress};
+use crate::state::State;
+
+pub enum NumLiteral<'a> {
+    Float(&'a str),
+    Num(&'a str),
+    NonBase10Int {
+        string: &'a str,
+        base: Base,
+        is_negative: bool,
+    },
+}
+
+pub fn positive_number_literal<'a>() -> impl Parser<'a, NumLiteral<'a>, ENumber> {
+    move |_arena, state: State<'a>| {
+        match state.bytes().get(0) {
+            Some(first_byte) if (*first_byte as char).is_ascii_digit() => {
+                parse_number_base(false, state.bytes(), state)
+            }
+            _ => {
+                // this is not a number at all
+                Err((Progress::NoProgress, ENumber::End, state))
+            }
+        }
+    }
+}
+
+pub fn number_literal<'a>() -> impl Parser<'a, NumLiteral<'a>, ENumber> {
+    move |_arena, state: State<'a>| {
+        match state.bytes().get(0) {
+            Some(first_byte) if *first_byte == b'-' => {
+                // drop the minus
+                parse_number_base(true, &state.bytes()[1..], state)
+            }
+            Some(first_byte) if (*first_byte as char).is_ascii_digit() => {
+                parse_number_base(false, state.bytes(), state)
+            }
+            _ => {
+                // this is not a number at all
+                Err((Progress::NoProgress, ENumber::End, state))
+            }
+        }
+    }
+}
+
+fn parse_number_base<'a>(
+    is_negated: bool,
+    bytes: &'a [u8],
+    state: State<'a>,
+) -> ParseResult<'a, NumLiteral<'a>, ENumber> {
+    match bytes.get(0..2) {
+        Some(b"0b") => chomp_number_base(Base::Binary, is_negated, &bytes[2..], state),
+        Some(b"0o") => chomp_number_base(Base::Octal, is_negated, &bytes[2..], state),
+        Some(b"0x") => chomp_number_base(Base::Hex, is_negated, &bytes[2..], state),
+        _ => chomp_number_dec(is_negated, bytes, state),
+    }
+}
+
+fn chomp_number_base<'a>(
+    base: Base,
+    is_negative: bool,
+    bytes: &'a [u8],
+    state: State<'a>,
+) -> ParseResult<'a, NumLiteral<'a>, ENumber> {
+    let (_is_float, chomped) = chomp_number(bytes);
+
+    let string = unsafe { std::str::from_utf8_unchecked(&bytes[..chomped]) };
+
+    let new = state.advance(chomped + 2 + is_negative as usize);
+
+    Ok((
+        Progress::MadeProgress,
+        NumLiteral::NonBase10Int {
+            is_negative,
+            string,
+            base,
+        },
+        new,
+    ))
+}
+
+fn chomp_number_dec<'a>(
+    is_negative: bool,
+    bytes: &'a [u8],
+    state: State<'a>,
+) -> ParseResult<'a, NumLiteral<'a>, ENumber> {
+    let (is_float, chomped) = chomp_number(bytes);
+
+    if is_negative && chomped == 0 {
+        // we're probably actually looking at unary negation here
+        return Err((Progress::NoProgress, ENumber::End, state));
+    }
+
+    if !bytes.get(0).copied().unwrap_or_default().is_ascii_digit() {
+        // we're probably actually looking at unary negation here
+        return Err((Progress::NoProgress, ENumber::End, state));
+    }
+
+    let string =
+        unsafe { std::str::from_utf8_unchecked(&state.bytes()[0..chomped + is_negative as usize]) };
+
+    let new = state.advance(chomped + is_negative as usize);
+
+    Ok((
+        Progress::MadeProgress,
+        if is_float {
+            NumLiteral::Float(string)
+        } else {
+            NumLiteral::Num(string)
+        },
+        new,
+    ))
+}
+
+fn chomp_number(mut bytes: &[u8]) -> (bool, usize) {
+    let start_bytes_len = bytes.len();
+    let mut is_float = false;
+
+    while let Some(byte) = bytes.get(0) {
+        match byte {
+            b'.' => {
+                // skip, fix multiple `.`s in canonicalization
+                is_float = true;
+                bytes = &bytes[1..];
+            }
+            b'e' => {
+                // maybe scientific notation?
+                match bytes.get(1) {
+                    Some(b'-') => {
+                        is_float = true;
+                        bytes = &bytes[2..];
+                    }
+                    Some(c) if (*c as char).is_ascii_digit() => {
+                        is_float = true;
+                        bytes = &bytes[2..];
+                    }
+                    _ => {
+                        bytes = &bytes[1..];
+                    }
+                }
+            }
+            b'_' => {
+                // skip
+                bytes = &bytes[1..];
+            }
+            _ if byte.is_ascii_digit() || byte.is_ascii_alphabetic() => {
+                // valid digits (alphabetic in hex digits, and the `e` in `12e26` scientific notation
+                bytes = &bytes[1..];
+            }
+            _ => {
+                // not a valid digit; we're done
+                return (is_float, start_bytes_len - bytes.len());
+            }
+        }
+    }
+
+    // if the above loop exits, we must be dealing with an empty slice
+    // therefore we parsed all of the bytes in the input
+    (is_float, start_bytes_len)
+}