- let integer = (x) => {
- let wrapped_x = toSome(x);
- let plusMinus = orDo(match1Char('+'), match1Char('-')); // ([+]|[-])
- let d = matchRange('0', '9'); // \d
- var result = thenDo(thenDo(thenDo(wrapped_x, zeroOrOnceDo(plusMinus)), d), zeroOrMoreDo(d));
- if (result._tag == "Some") {
- result.value.matched_type = TokenType.INT;
- }
- return result;
- };
- let space = (x) => {
- let wrapped_x = toSome(x);
- let s_aux = orDo(match1Char(' '), match1Char('\t')); // (" " | "\t")
- var result = thenDo(thenDo(wrapped_x, s_aux), zeroOrMoreDo(s_aux));
- if (result._tag == "Some") {
- result.value.matched_type = TokenType.SP;
- }
- return result;
- };
- let newline = (x) => {
- let wrapped_x = toSome(x);
- // nl = \r?\n
- let result = thenDo(thenDo(wrapped_x, zeroOrOnceDo(match1Char('\r'))), match1Char('\n'));
- if (result._tag == "Some") {
- result.value.matched_type = TokenType.NL;
- }
- return result;
- };
+ // integer = [+-]?\d+  (plusMinus and d are declared outside this hunk; pattern per the float comment below)
+ let integer = bTerm((x) => thenDo(thenDo(thenDo(x, zeroOrOnceDo(plusMinus)), d), zeroOrMoreDo(d)), TokenType.INT);
+ // space = [ \t]+
+ let space = bTerm((x) => thenDo(thenDo(x, s_aux), zeroOrMoreDo(s_aux)), TokenType.INT);
+ // newline = \r?\n  (optional carriage return, then a line feed)
+ let newline = bTerm((x) => thenDo(thenDo(x, zeroOrOnceDo(match1Char('\r'))), match1Char('\n')), TokenType.NL);
+ // idHead = [_A-Za-z]  (first character of an identifier)
+ let idHead = orDo(orDo(matchRange('a', 'z'), matchRange('A', 'Z')), match1Char('_'));
+ let idRemained = orDo(idHead, matchRange('0', '9')); // [_A-Za-z0-9]  (any later identifier character)
+ // id = [_A-Za-z][_A-Za-z0-9]*
+ let id = bTerm((x) => thenDo(thenDo(x, idHead), zeroOrMoreDo(idRemained)), TokenType.ID);
+ // doublequote = ["]
+ let doublequote = match1Char("\"");
+ // escapeReverseSlash = [\\]["]  (a backslash immediately followed by a double quote)
+ // NOTE(review): this is the only escape recognised here. A backslash before any other
+ // character is consumed by the [^"] branch below, so a string ending in an escaped
+ // backslash (e.g. "a\\") looks like it would swallow its closing quote — confirm intended.
+ let escapeReverseSlash = (x) => thenDo(thenDo(toSome(x), match1Char("\\")), doublequote);
+ // stringInnerPattern = ([\\]["]|[^"])*  (the escaped quote is tried before the any-non-quote branch)
+ let stringInnerPattern = zeroOrMoreDo(orDo(escapeReverseSlash, notDo(match1Char("\""))));
+ // str = ["]([\\]["]|[^"])*["]
+ let str = bTerm((x) => thenDo(thenDo(thenDo(x, doublequote), stringInnerPattern), doublequote), TokenType.STR);
+ // float = [+-]?\d+[.]\d+
+ function floatPattern(x) {
+ return thenDo(thenDo(thenDo(thenDo(thenDo(thenDo(x, zeroOrOnceDo(plusMinus)), d), zeroOrMoreDo(d)), match1Char(".")), d), zeroOrMoreDo(d));
+ }
+ ;
+ let float = bTerm(floatPattern, TokenType.FLO);
+ // operators made of two characters
+ // floatAdd = +.
+ let floatAdd = bTerm((x) => thenDo(thenDo(x, match1Char("+")), match1Char(".")), TokenType.F_ADD);
+ // floatSub = -.
+ let floatSub = bTerm((x) => thenDo(thenDo(x, match1Char("-")), match1Char(".")), TokenType.F_SUB);
+ // floatMul = *.
+ let floatMul = bTerm((x) => thenDo(thenDo(x, match1Char("*")), match1Char(".")), TokenType.F_MUL);
+ // floatDiv = /.
+ let floatDiv = bTerm((x) => thenDo(thenDo(x, match1Char("/")), match1Char(".")), TokenType.F_DIV);
+ // eq = ==
+ let eq = bTerm((x) => thenDo(thenDo(x, match1Char("=")), match1Char("=")), TokenType.EQ);
+ // ge = >=
+ let ge = bTerm((x) => thenDo(thenDo(x, match1Char(">")), match1Char("=")), TokenType.GE);
+ // le = <=
+ let le = bTerm((x) => thenDo(thenDo(x, match1Char("<")), match1Char("=")), TokenType.LE);
+ // rightArrow = ->
+ let rightArrow = bTerm((x) => thenDo(thenDo(x, match1Char("-")), match1Char(">")), TokenType.R_ARROW);
+ /**
+ * unary operator : generating the pattern of basic unary operator
+ * @param char : uniry char for the operator
+ * @param token_type : the corresponding token_type
+ */
+ function unaryOp(char, token_type) {
+ return bTerm((x) => thenDo(x, match1Char(char)), token_type);
+ }
+ ;
+ // operators and punctuation made of a single character, each built with unaryOp(char, token_type)
+ let intAdd = unaryOp('+', TokenType.I_ADD);
+ let intSub = unaryOp('-', TokenType.I_SUB);
+ let intMul = unaryOp('*', TokenType.I_MUL);
+ let intDiv = unaryOp('/', TokenType.I_DIV);
+ let lParen = unaryOp('(', TokenType.L_PAREN);
+ let rParen = unaryOp(')', TokenType.R_PAREN);
+ let lBracket = unaryOp('[', TokenType.L_BRACK);
+ let rBracket = unaryOp(']', TokenType.R_BRACK);
+ let lBrace = unaryOp('{', TokenType.L_BRACE);
+ let rBrace = unaryOp('}', TokenType.R_BRACE);
+ let comma = unaryOp(',', TokenType.COMMA);
+ let dot = unaryOp('.', TokenType.DOT);
+ let colon = unaryOp(':', TokenType.COLON);
+ let semicolon = unaryOp(';', TokenType.SEMI_C);
+ let at = unaryOp('@', TokenType.AT);
+ let hash = unaryOp('#', TokenType.HASH);
+ // '=' alone is assignment (SET); the two-character "==" is matched separately as EQ
+ let set = unaryOp('=', TokenType.SET);
+ let greaterthan = unaryOp('>', TokenType.GT);
+ let lessthan = unaryOp('<', TokenType.LE);