-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathscanner.mll
More file actions
executable file
·84 lines (77 loc) · 2.45 KB
/
scanner.mll
File metadata and controls
executable file
·84 lines (77 loc) · 2.45 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
(* Ocamllex scanner for Texy, based off of the MicroC scanner *)
{ open Parser }
let digit = ['0' - '9']
let digits = digit+
rule token = parse
[' ' '\t' '\r' '\n'] { token lexbuf } (* Whitespace *)
| "/*" { comment lexbuf } (* Comments *)
| '(' { LPAREN }
| ')' { RPAREN }
| '{' { LBRACE }
| '}' { RBRACE }
| ';' { SEMI }
| ',' { COMMA }
| '+' { PLUS }
| '-' { MINUS }
| '*' { TIMES }
| '/' { DIVIDE }
| '=' { ASSIGN }
| '[' { LBRACKET }
| ']' { RBRACKET }
| '.' { DOT }
| '"' { wordlit (Buffer.create 80) lexbuf }
| "==" { EQ }
| "!=" { NEQ }
| '<' { LT }
| "<=" { LEQ }
| ">" { GT }
| ">=" { GEQ }
| "&&" { AND }
| "||" { OR }
| "!" { NOT }
| "#" { CONBIN }
| "%" { BINCON }
| "~" { BITFLIP }
| "#+" { SHIFTUP }
| "#-" { SHIFTDOWN }
| "^" { CONCAT }
| "@" { AT }
| "if" { IF }
| "else" { ELSE }
| "for" { FOR }
| "while" { WHILE }
| "return" { RETURN }
| "int" { INT }
| "bool" { BOOL }
| "char" { CHAR }
| "Word" { WORD }
| "File" { FILE }
| "float" { FLOAT }
| "void" { VOID }
| "struct" { STRUCT }
| "true" { BLIT(true) }
| "false" { BLIT(false) }
| digits as lxm { LITERAL(int_of_string lxm) }
| digits '.' digit* ( ['e' 'E'] ['+' '-']? digits )? as lxm { FLIT(lxm) }
| '''([' '-'!' '#'-'[' ']'-'~' ]|['0'-'9'])''' as lxm {CHARLIT( String.get lxm 1)}
| ['a'-'z' 'A'-'Z']['a'-'z' 'A'-'Z' '0'-'9' '_']* as lxm { ID(lxm) }
| eof { EOF }
| _ as char { raise (Failure("illegal character " ^ Char.escaped char)) }
(* https://realworldocaml.org/v1/en/html/parsing-with-ocamllex-and-menhir.html
*)
and wordlit wbuf =
parse
| '"' { WLIT (Buffer.contents wbuf) }
| '\\' '/' { Buffer.add_char wbuf '/'; wordlit wbuf lexbuf }
| '\\' '\\' { Buffer.add_char wbuf '\\'; wordlit wbuf lexbuf }
| '\\' 'b' { Buffer.add_char wbuf '\b'; wordlit wbuf lexbuf }
| '\\' 'n' { Buffer.add_char wbuf '\n'; wordlit wbuf lexbuf }
| '\\' 'f' { Buffer.add_char wbuf '\012'; wordlit wbuf lexbuf }
| '\\' 'r' { Buffer.add_char wbuf '\r'; wordlit wbuf lexbuf }
| '\\' 't' { Buffer.add_char wbuf '\t'; wordlit wbuf lexbuf }
| [^ '"' '\\']+ { Buffer.add_string wbuf (Lexing.lexeme lexbuf); wordlit wbuf lexbuf}
| _ { raise (Failure("Illegal word character " ^ Lexing.lexeme lexbuf)) }
| eof { raise (Failure("Unterminated word ")) }
and comment = parse
"*/" { token lexbuf }
| _ { comment lexbuf }