grain-lang
diff --git a/‎compiler/package.json‎
Lines changed: 1 addition & 0 deletions b/‎compiler/package.json‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎compiler/src/formatting/format.re‎
Lines changed: 52 additions & 51 deletions b/‎compiler/src/formatting/format.re‎
Lines changed: 52 additions & 51 deletions
diff --git a/‎compiler/src/parsing/lexer.re‎
Lines changed: 66 additions & 26 deletions b/‎compiler/src/parsing/lexer.re‎
Lines changed: 66 additions & 26 deletions
@@ -29,6 +29,7 @@
     "parser:interpret": "esy b menhir src/parsing/parser.mly --unused-tokens --interpret",
     "parser:interpret-error": "esy b menhir src/parsing/parser.mly --unused-tokens --interpret-error",
     "parser:list-errors": "esy b menhir src/parsing/parser.mly --unused-tokens --list-errors > src/parsing/parser.messages.generated",
+    "parser:update-errors": "esy b menhir src/parsing/parser.mly --unused-tokens --update-errors src/parsing/parser.messages > src/parsing/parser.messages.generated && cp src/parsing/parser.messages.generated src/parsing/parser.messages",
     "parser:check-errors": "npm run parser:list-errors && esy b menhir src/parsing/parser.mly --unused-tokens --compare-errors src/parsing/parser.messages.generated --compare-errors src/parsing/parser.messages",
     "import-dependencies": "esy import-dependencies _export",
     "export-dependencies": "esy export-dependencies",
 
@@ -8,33 +8,40 @@ module Doc = Res_doc;
 
 let exception_primitives = [|"throw", "fail", "assert"|];
 
-let op_precedence = fn =>
-  switch (fn) {
-  | "*"
-  | "/"
-  | "%" => 120
-  | "+"
-  | "-"
-  | "++" => 110
-  | "<<"
-  | ">>"
-  | ">>>" => 100
-  | "<"
-  | "<="
-  | ">"
-  | ">=" => 90
-  | "=="
-  | "!="
-  | "is"
-  | "isnt" => 80
-  | "&" => 70
-  | "^" => 60
-  | "|" => 50
-  | "&&" => 40
-  | "||" => 30
-  | "_" => 10
-  | _ => 9999
+let op_precedence = fn => {
+  let op_precedence = fn =>
+    switch (fn) {
+    | '*'
+    | '/'
+    | '%' => 120
+    | '+'
+    | '-' => 110
+    | '<'
+    | '>' => 90
+    | '&' => 70
+    | '^' => 60
+    | '|' => 50
+    | '_' => 10
+    | _ => 9999
+    };
+  if (String.length(fn) > 1) {
+    switch (String.sub(fn, 0, 2)) {
+    | "++" => 110
+    | "<<"
+    | ">>" => 100
+    | "=="
+    | "!="
+    | "is" => 80
+    | "&&" => 40
+    | "||" => 30
+    | _ => op_precedence(fn.[0])
+    };
+  } else if (String.length(fn) > 0) {
+    op_precedence(fn.[0]);
+  } else {
+    9999;
   };
+};
 let list_cons = "[...]";
 
 exception IllegalParse(string);
@@ -184,37 +191,31 @@ let add_parens = (doc: Doc.t) =>
   ]);
 
 let infixop = (op: string) => {
-  switch (op) {
-  | "+"
-  | "-"
-  | "*"
-  | "/"
-  | "%"
-  | "is"
-  | "isnt"
-  | "=="
-  | "++"
-  | "!="
-  | "^"
-  | "<"
-  | "<<"
-  | ">"
-  | ">>"
-  | ">>>"
-  | "<="
-  | ">="
-  | "&"
-  | "&&"
-  | "|"
-  | "||" => true
+  switch (op.[0]) {
+  | '+'
+  | '-'
+  | '*'
+  | '/'
+  | '%'
+  | '='
+  | '^'
+  | '<'
+  | '>'
+  | '&'
+  | '|' => true
+  | _ when op == "is" => true
+  | _ when op == "isnt" => true
+  | _ when op == "!=" => true
   | _ => false
+  | exception _ => false
   };
 };
 
 let prefixop = (op: string) => {
-  switch (op) {
-  | "!" => true
+  switch (op.[0]) {
+  | '!' => true
   | _ => false
+  | exception _ => false
   };
 };
 
 
@@ -118,6 +118,33 @@ let lident = [%sedlex.regexp?
   (Sub(xid_start, lu) | '_', Star(xid_continue))
 ];
 
+// Any single character that may appear in an operator
+let operator_char = [%sedlex.regexp?
+  '$' | '&' | '*' | '/' | '+' | '-' | '=' | '>' | '<' | '^' | '|' | '!' | '?' |
+  '%' |
+  ':' |
+  '.'
+];
+// Zero or more operator characters (this also matches the empty string)
+let operator_chars = [%sedlex.regexp? Star(operator_char)];
+
+// We make sure that `>` operators contain at least one non-`>` char to not
+// confuse them for `>>>` chains at the end of types, e.g. `List<Option<Box<a>>>`
+let rcaret_operator_char = [%sedlex.regexp? Sub(operator_char, '>')];
+let rcaret_operator_chars = [%sedlex.regexp?
+  (operator_chars, rcaret_operator_char, operator_chars)
+];
+
+// Similarly, we do this for `<` even though it's a simpler case
+let lcaret_operator_char = [%sedlex.regexp? Sub(operator_char, '<')];
+let lcaret_operator_chars = [%sedlex.regexp?
+  (operator_chars, lcaret_operator_char, operator_chars)
+];
+
+// Infix operators are not allowed to start with `//` or `/*` as they
+// indicate comments
+let slash_operator_chars = [%sedlex.regexp?
+  (Sub(operator_char, '/' | '*'), operator_chars)
+];
+
 // Tabs and space separators (https://www.compart.com/en/unicode/category/Zs)
 let blank = [%sedlex.regexp? Plus(zs | '\t')];
 
@@ -203,6 +230,10 @@ let rec token = lexbuf => {
   | "export" => positioned(EXPORT)
   | "except" => positioned(EXCEPT)
   | "from" => positioned(FROM)
+  | "*" => positioned(STAR)
+  | "/" => positioned(SLASH)
+  | "|" => positioned(PIPE)
+  | "-" => positioned(DASH)
   | "->" => positioned(ARROW)
   | "=>" => positioned(THICKARROW)
   | "type" => positioned(TYPE)
@@ -223,9 +254,6 @@ let rec token = lexbuf => {
   | "::" => positioned(COLONCOLON)
   | ":=" => positioned(GETS)
   | ":" => positioned(COLON)
-  | "is" => positioned(IS)
-  | "isnt" => positioned(ISNT)
-  | "==" => positioned(EQEQ)
   | "=" => positioned(EQUAL)
   | "," => positioned(COMMA)
   | ";" => positioned(SEMI)
@@ -237,32 +265,44 @@ let rec token = lexbuf => {
   | "[" => positioned(LBRACK)
   | "[>" => positioned(LBRACKRCARET)
   | "]" => positioned(RBRACK)
-  | "^" => positioned(CARET)
   | "<" => positioned(LCARET)
-  | "<<" => positioned(LCARETLCARET)
   /* We do not lex >> or >>> as a single token as type vectors can contain
-     these, e.g. List<Option<a>> */
+     these, e.g. List<Option<a>>. An operator like `>>>>` is lexed as four
+     separate tokens and the parser sorts it out. */
   | ">" => positioned(RCARET)
-  | "^" => positioned(CARET)
-  | "++" => positioned(PLUSPLUS)
-  | "+" => positioned(PLUS)
-  | "-" => positioned(DASH)
-  | "*" => positioned(STAR)
-  | "/" => positioned(SLASH)
-  | "%" => positioned(PERCENT)
-  | "+=" => positioned(PLUSEQ)
-  | "-=" => positioned(DASHEQ)
-  | "*=" => positioned(STAREQ)
-  | "/=" => positioned(SLASHEQ)
-  | "%=" => positioned(PERCENTEQ)
-  | "<=" => positioned(LESSEQ)
-  | ">=" => positioned(GREATEREQ)
-  | "&" => positioned(AMP)
-  | "&&" => positioned(AMPAMP)
-  | "|" => positioned(PIPE)
-  | "||" => positioned(PIPEPIPE)
-  | "!" => positioned(NOT)
-  | "!=" => positioned(NOTEQ)
+  /* The order of these is somewhat important and is why they are
+     not sorted by precedence */
+  | "+="
+  | "-="
+  | "*="
+  | "/="
+  | "%=" =>
+    positioned(INFIX_ASSIGNMENT_10(Sedlexing.Utf8.sub_lexeme(lexbuf, 0, 1)))
+  | ("==" | "!=", operator_chars)
+  | "is"
+  | "isnt" => positioned(INFIX_80(Sedlexing.Utf8.lexeme(lexbuf)))
+  | ("<<", operator_chars)
+  | (">>", rcaret_operator_chars) =>
+    positioned(INFIX_100(Sedlexing.Utf8.lexeme(lexbuf)))
+  | ("<", lcaret_operator_chars)
+  | (">", rcaret_operator_chars) =>
+    positioned(INFIX_90(Sedlexing.Utf8.lexeme(lexbuf)))
+  | ("^", operator_chars) =>
+    positioned(INFIX_60(Sedlexing.Utf8.lexeme(lexbuf)))
+  | ("+" | "-", operator_chars) =>
+    positioned(INFIX_110(Sedlexing.Utf8.lexeme(lexbuf)))
+  | ("*" | "%", operator_chars)
+  | ("/", slash_operator_chars) =>
+    positioned(INFIX_120(Sedlexing.Utf8.lexeme(lexbuf)))
+  | ("&&", operator_chars) =>
+    positioned(INFIX_40(Sedlexing.Utf8.lexeme(lexbuf)))
+  | ("&", operator_chars) =>
+    positioned(INFIX_70(Sedlexing.Utf8.lexeme(lexbuf)))
+  | ("||" | "??", operator_chars) =>
+    positioned(INFIX_30(Sedlexing.Utf8.lexeme(lexbuf)))
+  | ("|", operator_chars) =>
+    positioned(INFIX_50(Sedlexing.Utf8.lexeme(lexbuf)))
+  | "!" => positioned(PREFIX_150(Sedlexing.Utf8.lexeme(lexbuf)))
   | "@" => positioned(AT)
   | '"' =>
     let (start_p, _) = Sedlexing.lexing_positions(lexbuf);