forked from ocaml/ocaml
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathparse.ml
173 lines (156 loc) · 7.05 KB
/
parse.ml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
(**************************************************************************)
(* *)
(* OCaml *)
(* *)
(* Xavier Leroy, projet Cristal, INRIA Rocquencourt *)
(* *)
(* Copyright 1996 Institut National de Recherche en Informatique et *)
(* en Automatique. *)
(* *)
(* All rights reserved. This file is distributed under the terms of *)
(* the GNU Lesser General Public License version 2.1, with the *)
(* special exception on linking described in the file LICENSE. *)
(* *)
(**************************************************************************)
(* Entry points in the parser *)
(* Skip tokens to the end of the phrase *)
(* Most recent token handed out by [token] below.  It starts out as
   [Parser.EOF]; [wrap] puts it back to [Parser.EOF] after a successful
   parse, and [maybe_skip_phrase] inspects it to decide whether any
   skipping is still needed. *)
let last_token = ref Parser.EOF

(* [token lexbuf] reads one token with [Lexer.token], remembers it in
   [last_token], and returns it.  Any exception raised by the lexer
   propagates before [last_token] is updated. *)
let token lexbuf =
  let tok = Lexer.token lexbuf in
  last_token := tok;
  tok
(* [skip_phrase lexbuf] discards tokens until a SEMISEMI or EOF token has
   been read.  The lexer errors listed below are ignored and skipping
   simply continues; any other exception propagates to the caller. *)
let rec skip_phrase lexbuf =
  let reached_phrase_end =
    match token lexbuf with
    | Parser.SEMISEMI | Parser.EOF -> true
    | _ -> false
    | exception
        Lexer.Error
          ( ( Lexer.Unterminated_comment _
            | Lexer.Unterminated_string
            | Lexer.Reserved_sequence _
            | Lexer.Unterminated_string_in_comment _
            | Lexer.Illegal_character _ ),
            _ ) ->
        (* Malformed input inside the phrase being thrown away: keep going. *)
        false
  in
  if not reached_phrase_end then skip_phrase lexbuf
(* [maybe_skip_phrase lexbuf] calls [skip_phrase] unless the last token
   recorded in [last_token] is already SEMISEMI or EOF, in which case
   nothing is consumed. *)
let maybe_skip_phrase lexbuf =
  let already_at_phrase_end =
    match !last_token with
    | Parser.SEMISEMI | Parser.EOF -> true
    | _ -> false
  in
  if not already_at_phrase_end then skip_phrase lexbuf
(* [wrap parsing_fun lexbuf] runs [parsing_fun lexbuf] between the usual
   set-up and tear-down steps and returns the resulting AST.

   Before parsing: [Docstrings.init] and [Lexer.init] are called.
   After a successful parse: [Parsing.clear_parser] and
   [Docstrings.warn_bad_docstrings] are called and [last_token] is reset
   to [Parser.EOF].

   Error handling:
   - an illegal-character lexer error, when the input name is
     "//toplevel//", skips the rest of the phrase and is re-raised;
   - a [Syntaxerr.Error], when the input name is "//toplevel//", skips
     the rest of the phrase if needed and is re-raised;
   - [Parsing.Parse_error] and [Syntaxerr.Escape_error] are turned into
     [Syntaxerr.Error (Syntaxerr.Other loc)], with [loc] taken from
     [Location.curr lexbuf] before any skipping happens.
   Every other exception, and the first two kinds outside
   "//toplevel//", propagate unchanged. *)
let wrap parsing_fun lexbuf =
  (* Evaluated lazily at each use, exactly where the original compared
     the input name. *)
  let reading_toplevel () = !Location.input_name = "//toplevel//" in
  try
    Docstrings.init ();
    Lexer.init ();
    let ast = parsing_fun lexbuf in
    Parsing.clear_parser ();
    Docstrings.warn_bad_docstrings ();
    last_token := Parser.EOF;
    ast
  with
  | Lexer.Error (Lexer.Illegal_character _, _) as exn
    when reading_toplevel () ->
      skip_phrase lexbuf;
      raise exn
  | Syntaxerr.Error _ as exn when reading_toplevel () ->
      maybe_skip_phrase lexbuf;
      raise exn
  | Parsing.Parse_error | Syntaxerr.Escape_error ->
      (* Capture the location first: skipping moves the lexbuf forward. *)
      let loc = Location.curr lexbuf in
      if reading_toplevel () then maybe_skip_phrase lexbuf;
      raise (Syntaxerr.Error (Syntaxerr.Other loc))
(* [loop lexbuf in_error checkpoint] drives the incremental Menhir parser
   from [checkpoint] until it accepts or rejects.

   - [lexbuf] is the lexing buffer tokens are read from;
   - [in_error] is [true] once the parser has reported an error;
   - [checkpoint] is the current state of the parser.

   Returns the semantic value on acceptance and raises [Parser.Error] on
   rejection. *)
let rec loop lexbuf in_error checkpoint =
  let module Interp = Parser.MenhirInterpreter in
  match checkpoint with
  | Interp.Accepted result -> result
  | Interp.Rejected -> raise Parser.Error
  | Interp.HandlingError _ ->
      (* From now on the parser is only fed EOF tokens, see below. *)
      loop lexbuf true (Interp.resume checkpoint)
  | Interp.Shifting _ | Interp.AboutToReduce _ ->
      loop lexbuf in_error (Interp.resume checkpoint)
  | Interp.InputNeeded _ ->
      let input =
        if in_error then begin
          (* The parser has already detected an error, so no more input
             must be consumed.  In the top-level, reading further would
             mean waiting for the user to type something only to report
             an error located earlier, instead of reporting it at once.

             With yacc this happened to work because, AFAICT (@let-def):
             - yacc eagerly performs "default reductions": when the next
               action is to reduce the same production whatever token
               comes next, it reduces immediately without reading that
               token;
             - error productions in the OCaml grammar are always placed
               so that a default reduction applies (the "error" symbol is
               the last producer and the lookahead token is not needed to
               choose between two error rules).
             That was fragile: it depended on an optimization (default
             reduction) which, as implemented in yacc, changes the
             semantics of the parser.

             Instead of relying on such implementation details, once an
             error has been detected in this loop the input is no longer
             looked at and the parser is fed EOF tokens.  The skip_phrase
             logic then resynchronizes the input stream on the next
             ';;'. *)
          let here = lexbuf.Lexing.lex_curr_p in
          (Parser.EOF, here, here)
        end else begin
          (* Read the token first: the positions below are those left in
             the lexbuf by this call. *)
          let tok = token lexbuf in
          (tok, lexbuf.Lexing.lex_start_p, lexbuf.Lexing.lex_curr_p)
        end
      in
      loop lexbuf in_error (Interp.offer checkpoint input)
(* [wrap_menhir entry lexbuf] builds the initial checkpoint by applying
   the incremental entry point [entry] to the current position of
   [lexbuf], then runs [loop] on it under the protection of [wrap].
   The checkpoint is created before [wrap] is entered. *)
let wrap_menhir entry lexbuf =
  let start_checkpoint = entry lexbuf.Lexing.lex_curr_p in
  let run buf = loop buf false start_checkpoint in
  wrap run lexbuf
(* Parser entry points.  Each one runs the corresponding incremental
   entry point of [Parser] through [wrap_menhir]. *)
let implementation lexbuf =
  wrap_menhir Parser.Incremental.implementation lexbuf

let interface lexbuf =
  wrap_menhir Parser.Incremental.interface lexbuf

let toplevel_phrase lexbuf =
  wrap_menhir Parser.Incremental.toplevel_phrase lexbuf

let use_file lexbuf =
  wrap_menhir Parser.Incremental.use_file lexbuf

let core_type lexbuf =
  wrap_menhir Parser.Incremental.parse_core_type lexbuf

let expression lexbuf =
  wrap_menhir Parser.Incremental.parse_expression lexbuf

let pattern lexbuf =
  wrap_menhir Parser.Incremental.parse_pattern lexbuf
(* Entry points for the various kinds of long identifiers.  Each one runs
   the named incremental entry point of [Parser] through [wrap_menhir]. *)
let longident lexbuf =
  wrap_menhir Parser.Incremental.parse_any_longident lexbuf

let val_ident lexbuf =
  wrap_menhir Parser.Incremental.parse_val_longident lexbuf

let constr_ident lexbuf =
  wrap_menhir Parser.Incremental.parse_constr_longident lexbuf

let extended_module_path lexbuf =
  wrap_menhir Parser.Incremental.parse_mod_ext_longident lexbuf

let simple_module_path lexbuf =
  wrap_menhir Parser.Incremental.parse_mod_longident lexbuf

let type_ident lexbuf =
  wrap_menhir Parser.Incremental.parse_mty_longident lexbuf
(* Error reporting for Syntaxerr *)
(* The code has been moved here so that one can reuse Pprintast.tyvar *)
(* [prepare_error err] builds, with [Location.errorf], the error report
   for the syntax error [err].  For [Unclosed] the report is located at
   the closing delimiter and carries a sub-message pointing at the
   opening one; every other case produces a single message at the
   location stored in the error. *)
let prepare_error = function
  | Syntaxerr.Unclosed (opening_loc, opening, closing_loc, closing) ->
      let unmatched_hint =
        Location.msg ~loc:opening_loc
          "This '%s' might be unmatched" opening
      in
      Location.errorf ~loc:closing_loc ~sub:[ unmatched_hint ]
        "Syntax error: '%s' expected" closing
  | Syntaxerr.Expecting (loc, nonterm) ->
      Location.errorf ~loc "Syntax error: %s expected." nonterm
  | Syntaxerr.Not_expecting (loc, nonterm) ->
      Location.errorf ~loc "Syntax error: %s not expected." nonterm
  | Syntaxerr.Applicative_path loc ->
      Location.errorf ~loc
        "Syntax error: applicative paths of the form F(X).t \
         are not supported when the option -no-app-func is set."
  | Syntaxerr.Variable_in_scope (loc, var) ->
      (* [var] is printed twice: once as a type variable through
         [Pprintast.tyvar], once as the plain name of the local type. *)
      Location.errorf ~loc
        "In this scoped type, variable %a \
         is reserved for the local type %s."
        Pprintast.tyvar var var
  | Syntaxerr.Other loc ->
      Location.errorf ~loc "Syntax error"
  | Syntaxerr.Ill_formed_ast (loc, s) ->
      Location.errorf ~loc "broken invariant in parsetree: %s" s
  | Syntaxerr.Invalid_package_type (loc, s) ->
      Location.errorf ~loc "invalid package type: %s" s
(* Register a printer with [Location] so that [Syntaxerr.Error]
   exceptions are reported through [prepare_error]; every other
   exception is declined with [None]. *)
let () =
  let syntax_error_report = function
    | Syntaxerr.Error err -> Some (prepare_error err)
    | _ -> None
  in
  Location.register_error_of_exn syntax_error_report