-
Notifications
You must be signed in to change notification settings - Fork 0
/
scanner.mll
88 lines (82 loc) · 2.38 KB
/
scanner.mll
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
(* Ocamllex scanner for MicroC *)
{ open Parser }
(* A single decimal digit. *)
let digit = ['0'-'9']
(* A non-empty run of decimal digits. *)
let digits = digit digit*
(* Main entry point: returns the next Parser token read from lexbuf.
   ocamllex keeps the longest matching lexeme and, on a tie, the rule listed
   first, so the keyword rules must stay above the identifier rule. *)
rule token = parse
  (* Layout and comments yield no token; scanning simply resumes. *)
    [' ' '\t' '\r' '\n']    { token lexbuf }
  | "/*"                    { comment lexbuf }
  | "//"                    { inline lexbuf }

  (* Punctuation.  A lone double quote is only produced when no later double
     quote closes it; otherwise the string literal rule further down wins as
     the longer match. *)
  | '"'                     { QUOTE }
  | '('                     { LPAREN }
  | ')'                     { RPAREN }
  | '{'                     { LBRACE }
  | '}'                     { RBRACE }
  | '['                     { LBRACK }
  | ']'                     { RBRACK }
  | ':'                     { COLON }
  | ';'                     { SEMI }
  | ','                     { COMMA }

  (* Arithmetic and matrix operators *)
  | '`'                     { TRANSPOSE }
  | '+'                     { PLUS }
  | "++"                    { INC }
  | "--"                    { DEC }
  | '-'                     { MINUS }
  | '*'                     { TIMES }
  | ".*"                    { TIMES_M }
  | "./"                    { DIVIDE_M }
  | "**"                    { DOT }
  (* Disabled rule: | '~' { INVERSE } *)
  | '/'                     { DIVIDE }
  | '%'                     { MOD }

  (* Assignment, comparison and boolean operators *)
  | '='                     { ASSIGN }
  | "=="                    { EQ }
  (* Disabled rule: | "===" { PEQ } *)
  | "!="                    { NEQ }
  | '<'                     { LT }
  | "<="                    { LEQ }
  | '>'                     { GT }
  | ">="                    { GEQ }
  | "&&"                    { AND }
  | "||"                    { OR }
  | '!'                     { NOT }

  (* Control-flow and declaration keywords *)
  | "class"                 { CLASS }
  | "func"                  { FUNC }
  | "if"                    { IF }
  | "else"                  { ELSE }
  | "for"                   { FOR }
  | "while"                 { WHILE }
  | "return"                { RETURN }

  (* Type names; the forms ending in [] are scanned as single tokens. *)
  | "int"                   { INT }
  | "int[]"                 { INTM }
  | "float[]"               { FLOATM }
  | "char[]"                { CHARM }
  | "string[]"              { STRINGM }
  | "bool[]"                { BOOLM }
  (* Disabled rule with explicit dimensions:
     | "int[" digits "]" ('[' digits ']')* as lxm { INTM(lxm) } *)
  | "char"                  { CHAR }
  | "bool"                  { BOOL }
  | "float"                 { FLOAT }
  | "void"                  { VOID }
  | "Fpoint"                { FPOINT }
  | "list"                  { LIST }
  | "string"                { STRING }

  (* Literals and identifiers *)
  | "true"                  { TRUE }
  | "false"                 { FALSE }
  | digits as num           { LITERAL (int_of_string num) }
  (* Float text is passed through unconverted. *)
  | digits '.' digit* (['e' 'E'] ['+' '-']? digits)? as flt
                            { FLIT flt }
  | ['a'-'z' 'A'-'Z'] ['a'-'z' 'A'-'Z' '0'-'9' '_']* as name
                            { ID name }
  (* String literal: the surrounding quotes are dropped from the payload. *)
  | '"' [^ '"']* '"' as quoted
                            { SLIT (String.sub quoted 1 (String.length quoted - 2)) }
  (* Character literal: the lexeme is kept whole, quotes included. *)
  | ''' ['a'-'z' 'A'-'Z' '0'-'9' '_'] ''' as quoted
                            { CHLIT quoted }
  | eof                     { EOF }
  (* Anything else is rejected. *)
  | _ as ch                 { raise (Failure ("illegal character " ^ Char.escaped ch)) }
(* Skips the body of a block comment.  Entered by the token rule after the
   opening delimiter has been consumed; hands control back to token once the
   closing delimiter is seen.  Comments do not nest.
   Raises Failure if the input ends before the comment is closed. *)
and comment = parse
    "*/"  { token lexbuf }
  (* Without this case the catch-all below cannot match at end of input and
     the generated lexer fails with an uninformative empty-token error. *)
  | eof   { raise (Failure "unterminated comment") }
  | _     { comment lexbuf }
(* Skips the rest of a single-line comment.  Entered by the token rule after
   the two leading slashes have been consumed; hands control back to token at
   the next line feed. *)
and inline = parse
    '\n'  { token lexbuf }
  (* A comment on the last line may have no trailing line feed; end the token
     stream normally instead of failing with an empty-token error. *)
  | eof   { EOF }
  | _     { inline lexbuf }