tokeniser.js 1.1 KB

123456789101112131415161718192021222324252627282930
  1. var lop = require("lop");
  2. var RegexTokeniser = lop.RegexTokeniser;
  3. exports.tokenise = tokenise;
  4. var stringPrefix = "'((?:\\\\.|[^'])*)";
  5. function tokenise(string) {
  6. var identifierCharacter = "(?:[a-zA-Z\\-_]|\\\\.)";
  7. var tokeniser = new RegexTokeniser([
  8. {name: "identifier", regex: new RegExp("(" + identifierCharacter + "(?:" + identifierCharacter + "|[0-9])*)")},
  9. {name: "dot", regex: /\./},
  10. {name: "colon", regex: /:/},
  11. {name: "gt", regex: />/},
  12. {name: "whitespace", regex: /\s+/},
  13. {name: "arrow", regex: /=>/},
  14. {name: "equals", regex: /=/},
  15. {name: "startsWith", regex: /\^=/},
  16. {name: "open-paren", regex: /\(/},
  17. {name: "close-paren", regex: /\)/},
  18. {name: "open-square-bracket", regex: /\[/},
  19. {name: "close-square-bracket", regex: /\]/},
  20. {name: "string", regex: new RegExp(stringPrefix + "'")},
  21. {name: "unterminated-string", regex: new RegExp(stringPrefix)},
  22. {name: "integer", regex: /([0-9]+)/},
  23. {name: "choice", regex: /\|/},
  24. {name: "bang", regex: /(!)/}
  25. ]);
  26. return tokeniser.tokenise(string);
  27. }