sync for backup
This commit is contained in:
parent
09f8df41a6
commit
5a835dc742
4 changed files with 162 additions and 21 deletions
|
@ -1 +1,3 @@
|
||||||
pub (crate) mod preparser;
|
pub(crate) mod preparser;
|
||||||
|
|
||||||
|
pub(crate) mod tokeniser;
|
||||||
|
|
|
@ -4,7 +4,7 @@ use std::str::Chars;
|
||||||
enum QuoteMethod {
|
enum QuoteMethod {
|
||||||
Single,
|
Single,
|
||||||
Double,
|
Double,
|
||||||
Backtick
|
Backtick,
|
||||||
}
|
}
|
||||||
|
|
||||||
// Normalised empty space in codeblocks, ensuring that all whitespace in codeblocks is one character wide
|
// Normalised empty space in codeblocks, ensuring that all whitespace in codeblocks is one character wide
|
||||||
|
@ -13,7 +13,7 @@ pub fn clear_spaces(raw: &str) -> String {
|
||||||
clear_in_code(&mut raw.chars())
|
clear_in_code(&mut raw.chars())
|
||||||
}
|
}
|
||||||
|
|
||||||
fn clear_in_code<'a, 'b>(raw: &mut Chars<'a>) -> String {
|
fn clear_in_code(raw: &mut Chars) -> String {
|
||||||
let mut cleared = String::new();
|
let mut cleared = String::new();
|
||||||
let mut last_char = 'a';
|
let mut last_char = 'a';
|
||||||
while let Some(c) = raw.next() {
|
while let Some(c) = raw.next() {
|
||||||
|
@ -44,45 +44,45 @@ fn clear_in_code<'a, 'b>(raw: &mut Chars<'a>) -> String {
|
||||||
}
|
}
|
||||||
'}' => {
|
'}' => {
|
||||||
cleared.push('}');
|
cleared.push('}');
|
||||||
return cleared
|
return cleared;
|
||||||
}
|
}
|
||||||
x => {
|
x => {
|
||||||
if last_char.is_whitespace() && x.is_whitespace() {
|
if last_char.is_whitespace() && x.is_whitespace() {
|
||||||
last_char = x.clone();
|
last_char = *x;
|
||||||
continue;
|
continue;
|
||||||
}
|
}
|
||||||
cleared.push(x.clone());
|
cleared.push(*x);
|
||||||
last_char = x.clone();
|
last_char = *x;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
};
|
}
|
||||||
|
|
||||||
cleared
|
cleared
|
||||||
}
|
}
|
||||||
|
|
||||||
fn clear_in_quotes<'a, 'b>(raw: &mut Chars<'a>, method: QuoteMethod) -> String {
|
fn clear_in_quotes(raw: &mut Chars, method: QuoteMethod) -> String {
|
||||||
let mut cleared = String::new();
|
let mut cleared = String::new();
|
||||||
let mut last_char = 'a';
|
let mut last_char = 'a';
|
||||||
while let Some(c) = raw.next() {
|
while let Some(c) = raw.next() {
|
||||||
match c {
|
match c {
|
||||||
'"' => {
|
'"' => {
|
||||||
cleared.push('"');
|
cleared.push('"');
|
||||||
if method == QuoteMethod::Double && last_char != '\\' {
|
if method == QuoteMethod::Double && last_char != '\\' {
|
||||||
return cleared
|
return cleared;
|
||||||
}
|
}
|
||||||
last_char = '"';
|
last_char = '"';
|
||||||
}
|
}
|
||||||
'\'' => {
|
'\'' => {
|
||||||
cleared.push('\'');
|
cleared.push('\'');
|
||||||
if method == QuoteMethod::Single && last_char != '\\' {
|
if method == QuoteMethod::Single && last_char != '\\' {
|
||||||
return cleared
|
return cleared;
|
||||||
}
|
}
|
||||||
last_char = '\'';
|
last_char = '\'';
|
||||||
}
|
}
|
||||||
'`' => {
|
'`' => {
|
||||||
cleared.push('`');
|
cleared.push('`');
|
||||||
if method == QuoteMethod::Backtick && last_char != '\\' {
|
if method == QuoteMethod::Backtick && last_char != '\\' {
|
||||||
return cleared
|
return cleared;
|
||||||
}
|
}
|
||||||
last_char = '`';
|
last_char = '`';
|
||||||
}
|
}
|
||||||
|
@ -98,8 +98,8 @@ fn clear_in_quotes<'a, 'b>(raw: &mut Chars<'a>, method: QuoteMethod) -> String {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
x => {
|
x => {
|
||||||
cleared.push(x.clone());
|
cleared.push(x);
|
||||||
last_char = x.clone();
|
last_char = x;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -130,19 +130,25 @@ fn test_clear_spaces3() {
|
||||||
#[test]
|
#[test]
|
||||||
fn test_clear_spaces4() {
|
fn test_clear_spaces4() {
|
||||||
let res = clear_spaces("'foo bar'");
|
let res = clear_spaces("'foo bar'");
|
||||||
assert_eq!(res, "'foo bar'".to_owned())
|
assert_eq!(res, "'foo bar'".to_owned())
|
||||||
}
|
}
|
||||||
|
|
||||||
// Test to make sure that code blocks inside single quotes are treated as quoted as well
|
// Test to make sure that code blocks inside single quotes are treated as quoted as well
|
||||||
#[test]
|
#[test]
|
||||||
fn test_clear_spaces5() {
|
fn test_clear_spaces5() {
|
||||||
let res = clear_spaces("pre quote'foo {shouldn\\'t compress space} inside'post quote");
|
let res = clear_spaces("pre quote'foo {shouldn\\'t compress space} inside'post quote");
|
||||||
assert_eq!(res, "pre quote'foo {shouldn\\'t compress space} inside'post quote".to_owned())
|
assert_eq!(
|
||||||
|
res,
|
||||||
|
"pre quote'foo {shouldn\\'t compress space} inside'post quote".to_owned()
|
||||||
|
)
|
||||||
}
|
}
|
||||||
|
|
||||||
// Test to make sure that code blocks inside double quotes are treated as non-quoted
|
// Test to make sure that code blocks inside double quotes are treated as non-quoted
|
||||||
#[test]
|
#[test]
|
||||||
fn test_clear_spaces6() {
|
fn test_clear_spaces6() {
|
||||||
let res = clear_spaces("pre quote`foo ${should compress space} inside`post quote");
|
let res = clear_spaces("pre quote`foo ${should compress space} inside`post quote");
|
||||||
assert_eq!(res, "pre quote`foo ${should compress space} inside`post quote".to_owned())
|
assert_eq!(
|
||||||
}
|
res,
|
||||||
|
"pre quote`foo ${should compress space} inside`post quote".to_owned()
|
||||||
|
)
|
||||||
|
}
|
||||||
|
|
|
@ -3,7 +3,7 @@ use crate::utils::str_safe_split;
|
||||||
// Takes space normalised source code and adds semicolons where needed
|
// Takes space normalised source code and adds semicolons where needed
|
||||||
// May not work properly if string isn't space normalised beforehand
|
// May not work properly if string isn't space normalised beforehand
|
||||||
pub fn insert_semicolons(raw: &str) -> String {
|
pub fn insert_semicolons(raw: &str) -> String {
|
||||||
let _splits = str_safe_split(raw, vec![' ','\t']);
|
let _splits = str_safe_split(raw, vec![' ','\t', '\n']);
|
||||||
|
|
||||||
"".to_owned()
|
"".to_owned()
|
||||||
}
|
}
|
133
src/parser/tokeniser.rs
Normal file
133
src/parser/tokeniser.rs
Normal file
|
@ -0,0 +1,133 @@
|
||||||
|
use num_bigint::BigInt;
|
||||||
|
|
||||||
|
const LINE_BREAKS: [char; 4] = ['\u{000A}', '\u{000D}', '\u{2028}', '\u{2029}'];
|
||||||
|
|
||||||
|
#[derive(Debug)]
|
||||||
|
enum OldTokens {
|
||||||
|
MinusOne,
|
||||||
|
Minus,
|
||||||
|
MinusEquals,
|
||||||
|
Comma,
|
||||||
|
Semicolon,
|
||||||
|
Colon,
|
||||||
|
Not,
|
||||||
|
NotEquals,
|
||||||
|
StrongNotEquals,
|
||||||
|
DoubleQuestion,
|
||||||
|
QuestionQuestionEquals,
|
||||||
|
QuestionDot,
|
||||||
|
Question,
|
||||||
|
Dot,
|
||||||
|
TrippleDot,
|
||||||
|
BracketOpen,
|
||||||
|
BracketClose,
|
||||||
|
SquareBracketOpen,
|
||||||
|
SquareBracketClose,
|
||||||
|
CurlyBracketOpen,
|
||||||
|
CurlyBracketClose,
|
||||||
|
Multiply,
|
||||||
|
PowerOf,
|
||||||
|
PowerOfEquals,
|
||||||
|
MultiplyEquals,
|
||||||
|
Divide,
|
||||||
|
DivideEquals,
|
||||||
|
BitAnd,
|
||||||
|
LogicAnd,
|
||||||
|
LogicAndEquals,
|
||||||
|
BitAndEquals,
|
||||||
|
Hashtag,
|
||||||
|
Modulo,
|
||||||
|
ModuloEquals,
|
||||||
|
BitXOr,
|
||||||
|
BitXOrEquals,
|
||||||
|
Add,
|
||||||
|
AddOne,
|
||||||
|
AddEquals,
|
||||||
|
LessThan,
|
||||||
|
LeftShift,
|
||||||
|
LeftShitEquals,
|
||||||
|
LessOrEqual,
|
||||||
|
EqualAssign,
|
||||||
|
EqualCompare,
|
||||||
|
EqualStrongCompare,
|
||||||
|
Arrow,
|
||||||
|
MoreThan,
|
||||||
|
MoreOrEqual,
|
||||||
|
RightShift,
|
||||||
|
RightShiftEquals,
|
||||||
|
UnsignedRightShift,
|
||||||
|
UnsignedRightShiftEquals,
|
||||||
|
BitOr,
|
||||||
|
BitOrEquals,
|
||||||
|
LogicOr,
|
||||||
|
LogicOrEquals,
|
||||||
|
Bitflip,
|
||||||
|
KeyAwait,
|
||||||
|
KeyBreak,
|
||||||
|
KeyCase,
|
||||||
|
KeyCatch,
|
||||||
|
KeyClass,
|
||||||
|
KeyComment,
|
||||||
|
KeyConst,
|
||||||
|
KeyContinue,
|
||||||
|
KeyDebugger,
|
||||||
|
KeyDefault,
|
||||||
|
KeyDelete,
|
||||||
|
KeyDo,
|
||||||
|
KyeElse,
|
||||||
|
KeyEnum,
|
||||||
|
KeyExport,
|
||||||
|
}
|
||||||
|
|
||||||
|
#[derive(Debug)]
|
||||||
|
pub enum Actions {
|
||||||
|
Assign,
|
||||||
|
Codeflow(Codeflow),
|
||||||
|
Raw(RawValue),
|
||||||
|
}
|
||||||
|
|
||||||
|
#[derive(Debug)]
|
||||||
|
pub enum RawValue {
|
||||||
|
Bool(bool),
|
||||||
|
Float(f64),
|
||||||
|
Int(BigInt),
|
||||||
|
}
|
||||||
|
|
||||||
|
#[derive(Debug)]
|
||||||
|
pub enum Codeflow {
|
||||||
|
Compare(Comparison),
|
||||||
|
TryCatch,
|
||||||
|
Loop,
|
||||||
|
}
|
||||||
|
|
||||||
|
#[derive(Debug)]
|
||||||
|
pub enum Comparison {
|
||||||
|
WeakEquals,
|
||||||
|
StrongEquals,
|
||||||
|
WeakNotEquals,
|
||||||
|
StrongNotEquals,
|
||||||
|
LessThan,
|
||||||
|
LessOrEqual,
|
||||||
|
MoreThan,
|
||||||
|
MoreOrEqual,
|
||||||
|
}
|
||||||
|
|
||||||
|
#[derive(Debug)]
|
||||||
|
pub enum Keywords {
|
||||||
|
Await,
|
||||||
|
Break,
|
||||||
|
Case,
|
||||||
|
Catch,
|
||||||
|
Class,
|
||||||
|
Const,
|
||||||
|
Continue,
|
||||||
|
Debugger,
|
||||||
|
Default,
|
||||||
|
Delete,
|
||||||
|
Do,
|
||||||
|
Else,
|
||||||
|
Enum,
|
||||||
|
Export,
|
||||||
|
Extends,
|
||||||
|
Finally,
|
||||||
|
}
|
Loading…
Reference in a new issue