-
Notifications
You must be signed in to change notification settings - Fork 11
/
coq2html.mll
535 lines (461 loc) · 15.4 KB
/
coq2html.mll
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
(* *********************************************************************)
(* *)
(* The Coq2HTML documentation generator *)
(* *)
(* Xavier Leroy, Collège de France and INRIA Paris *)
(* *)
(* Copyright Institut National de Recherche en Informatique et en *)
(* Automatique. All rights reserved. This file is distributed *)
(* under the terms of the GNU General Public License as published by *)
(* the Free Software Foundation, either version 2 of the License, or *)
(* (at your option) any later version. *)
(* *)
(* *********************************************************************)
{
open Printf
(** Cross-referencing *)
let current_module = ref ""
(* Record cross-references found in .glob files *)
type xref =
| Def of string * string (* path, type *)
| Ref of string * string * string (* unit, path, type *)
(* (name of module, character position in file) -> cross-reference *)
let xref_table : (string * int, xref) Hashtbl.t = Hashtbl.create 273
(* Records all module names for which a .glob file is given *)
let xref_modules : (string, unit) Hashtbl.t = Hashtbl.create 29
let path sp id =
match sp, id with
| "<>", "<>" -> ""
| "<>", _ -> id
| _ , "<>" -> sp
| _ , _ -> sp ^ "." ^ id
let add_module m =
(*eprintf "add_module %s\n" m;*)
Hashtbl.add xref_modules m ()
let add_reference curmod pos dp sp id ty =
(*eprintf "add_reference %s %d %s %s %s %s\n" curmod pos dp sp id ty;*)
if not (Hashtbl.mem xref_table (curmod, pos))
then Hashtbl.add xref_table (curmod, pos) (Ref(dp, path sp id, ty))
let add_definition curmod pos sp id ty =
if not (Hashtbl.mem xref_table (curmod, pos))
then Hashtbl.add xref_table (curmod, pos) (Def(path sp id, ty))
(* Map module names to URLs *)
let coqlib_url = "https://coq.inria.fr/library/"
(* logical name with final '.' -> absolute or relative URL *)
let documentation_urls : (string * string) list ref = ref [("Coq.", coqlib_url)]
let add_documentation_url logicalname url =
documentation_urls := (logicalname ^ ".", url) :: !documentation_urls
let starts_with s x =
let ls = String.length s and lx = String.length x in
ls >= lx && String.sub s 0 lx = x
let ends_with s x =
let ls = String.length s and lx = String.length x in
ls >= lx && String.sub s (ls - lx) lx = x
let url_concat url suff =
(if ends_with url "/" then url else url ^ "/") ^ suff
let url_for_module m =
(*eprintf "url_for_module %s\n" m;*)
let rec url_for = function
| [] ->
if Hashtbl.mem xref_modules m then m ^ ".html" else raise Not_found
| (pref, url) :: rem ->
if starts_with m pref then url_concat url m ^ ".html" else url_for rem
in url_for !documentation_urls
(* Produce a HTML link if possible *)
type link = Link of string | Anchor of string | Nolink
let re_sane_path = Str.regexp "[A-Za-z0-9_.\x80-\xFF]+$"
let crossref m pos =
(*eprintf "crossref %s %d\n" m pos;*)
try match Hashtbl.find xref_table (m, pos) with
| Def(p, _) ->
Anchor p
| Ref(m', p, _) ->
let url = url_for_module m' in (* can raise Not_found *)
if p = "" then
Link url
else if Str.string_match re_sane_path p 0 then
Link(url ^ "#" ^ p)
else
Nolink
with Not_found ->
Nolink
(** Keywords *)
module StringSet = Set.Make(String)
let mkset l = List.fold_right StringSet.add l StringSet.empty
let coq_keywords = mkset [
(* "The following character sequences are keywords defined in the
main Coq grammar that cannot be used as identifiers"
(reference manual) *)
"Axiom"; "CoFixpoint"; "Definition"; "Fixpoint"; "Hypothesis";
"Parameter"; "Prop"; "SProp"; "Set"; "Theorem"; "Type"; "Variable";
"as"; "at"; "cofix"; "else"; "end"; "fix"; "for"; "forall"; "fun";
"if"; "in"; "let"; "match"; "return"; "then"; "where"; "with";
(* "The following are keywords defined in notations or plugins
loaded in the prelude" (reference manual) *)
"IF"; "by"; "exists"; "exists2"; "using";
(* The commands from the "Command Index" part of the reference manual.
Some commands I don't expect to see in .v files were removed. *)
"Abort"; "About"; "Admitted"; "Arguments"; "Axiom"; "Axioms";
"Canonical"; "Cd"; "Check"; "Class"; "Close"; "CoFixpoint";
"CoInductive"; "Coercion"; "Collection"; "Combined"; "Comments";
"Compute"; "Conjecture"; "Conjectures"; "Constraint"; "Context";
"Corollary"; "Defined"; "Definition"; "End"; "Eval"; "Example";
"Existential"; "Export"; "Fact"; "Fail"; "Fixpoint"; "Focus"; "From";
"Function"; "Functional"; "Goal"; "Hint"; "Hypotheses"; "Hypothesis";
"Implicit"; "Import"; "Include"; "Inductive"; "Infix"; "Instance";
"Lemma"; "Let"; "Ltac"; "Ltac2"; "Module"; "Next"; "Notation";
"Obligation"; "Obligations"; "Opaque"; "Open"; "Parameter";
"Parameters"; "Proof"; "Proposition"; "Qed"; "Record"; "Remark";
"Require"; "Reserved"; "Scheme"; "Scope"; "Section"; "Set";
"Strategy"; "Structure"; "SubClass"; "Tactic"; "Theorem";
"Transparent"; "Type"; "Universe"; "Variable"; "Variables"; "Variant";
"using"; "with"
]
(** HTML generation *)
let oc = ref stdout
let character = function
| '<' -> output_string !oc "<"
| '>' -> output_string !oc ">"
| '&' -> output_string !oc "&"
| c -> output_char !oc c
let section_level = function
| "*" -> 1
| "**" -> 2
| _ -> 3
let start_section sect =
fprintf !oc "<h%d>" (section_level sect)
let end_section sect =
fprintf !oc "</h%d>\n" (section_level sect)
let start_doc_right () =
fprintf !oc "<span class=\"docright\">(* "
let end_doc_right () =
fprintf !oc " *)</span>"
let enum_depth = ref 0
let set_enum_depth d =
if !enum_depth < d then begin
fprintf !oc "<ul>\n";
fprintf !oc "<li>\n";
incr enum_depth;
end
else if !enum_depth > d then begin
fprintf !oc "</li>\n";
fprintf !oc "</ul>\n";
decr enum_depth;
end
else if !enum_depth > 0 then begin
fprintf !oc "</li>\n";
fprintf !oc "<li>\n"
end
let start_doc () =
fprintf !oc "<div class=\"doc\">"
let end_doc () =
set_enum_depth 0;
fprintf !oc "</div>\n"
let ident pos id =
if StringSet.mem id coq_keywords then
fprintf !oc "<span class=\"kwd\">%s</span>" id
else if id = "_" then
fprintf !oc "_"
else match crossref !current_module pos with
| Nolink ->
fprintf !oc "<span class=\"id\">%s</span>" id
| Link p ->
fprintf !oc "<span class=\"id\"><a href=\"%s\">%s</a></span>" p id
| Anchor p ->
fprintf !oc "<span class=\"id\"><a name=\"%s\">%s</a></span>" p id
let space s =
for _ = 1 to String.length s do fprintf !oc " " done
let newline () =
fprintf !oc "<br/>\n"
let dashes = function
| "-" -> set_enum_depth 1
| "--" -> set_enum_depth 2
| "---" -> set_enum_depth 3
| "----" -> set_enum_depth 4
| _ -> fprintf !oc "<hr/>\n"
let start_verbatim () =
fprintf !oc "<pre>\n"
let end_verbatim () =
fprintf !oc "</pre>\n"
let start_comment () =
fprintf !oc "<span class=\"comment\">(*"
let end_comment () =
fprintf !oc "*)</span>"
let start_bracket () =
fprintf !oc "<span class=\"bracket\">"
let end_bracket () =
fprintf !oc "</span>"
let start_string () =
fprintf !oc "<span class=\"string\">\""
let end_string () =
fprintf !oc "\"</span>"
let in_proof = ref false
let start_proof s kwd =
in_proof := true;
fprintf !oc "<details>\n";
space s;
fprintf !oc "<summary class=\"toggleproof\">%s</summary>\n" kwd;
fprintf !oc "<div class=\"proofscript\">\n"
let end_proof kwd =
fprintf !oc "%s</div></details>\n" kwd;
in_proof := false
(* Like Str.global_replace but don't interpret '\1' etc in replacement text *)
let global_replace re subst txt =
Str.global_substitute re (fun _ -> subst) txt
let start_html_page modname =
output_string !oc
(global_replace (Str.regexp "\\$NAME") modname Resources.header)
let end_html_page () =
output_string !oc Resources.footer
}
let space = [' ' '\t']
let utf8 = ['\192'-'\255'] ['\128'-'\191']*
let identstart = ['A'-'Z' 'a'-'z' '_'] | utf8
let identnext = ['A'-'Z' 'a'-'z' '_' '0'-'9' '\''] | utf8
let ident = identstart identnext*
let path = ident ("." ident)*
let start_proof = ("Proof" space* ".") | ("Proof" space+ "with") | ("Next" space+ "Obligation.")
let end_proof = "Qed." | "Defined." | "Save." | "Admitted." | "Abort."
let globkind = ['a'-'z']+
let xref = (['A'-'Z' 'a'-'z' '0'-'9' '_' '.'] | utf8)+ | "<>"
let integer = ['0'-'9']+
rule coq_bol = parse
| (space* as s) (start_proof as sp)
{ start_proof s sp;
skip_newline lexbuf }
| space* "(** " ("*"+ as sect)
{ start_section sect;
doc lexbuf;
end_section sect;
skip_newline lexbuf }
| space* "(** "
{ start_doc();
doc lexbuf;
end_doc();
skip_newline lexbuf }
| (space* as s) "(*"
{ if !in_proof then (space s; start_comment());
comment lexbuf;
if !in_proof then coq lexbuf else skip_newline lexbuf }
| eof
{ () }
| space* as s
{ space s;
coq lexbuf }
and skip_newline = parse
| space* "\n"
{ coq_bol lexbuf }
| ""
{ coq lexbuf }
and coq = parse
| end_proof as ep
{ end_proof ep;
skip_newline lexbuf }
| "(**r "
{ start_doc_right();
doc lexbuf;
end_doc_right();
coq lexbuf }
| "(*"
{ if !in_proof then start_comment();
comment lexbuf;
coq lexbuf }
| path as id
{ ident (Lexing.lexeme_start lexbuf) id; coq lexbuf }
| "\""
{ start_string();
string lexbuf;
end_string();
coq lexbuf }
| "\n"
{ newline(); coq_bol lexbuf }
| eof
{ () }
| _ as c
{ character c; coq lexbuf }
and string = parse
| "\"\""
{ character '\"'; character '\"'; string lexbuf }
| "\""
{ () }
| eof
{ () }
| _ as c
{ character c; string lexbuf }
and bracket = parse
| ']'
{ () }
| '['
{ character '['; bracket lexbuf; character ']'; bracket lexbuf }
| path as id
{ ident (Lexing.lexeme_start lexbuf) id; bracket lexbuf }
| "\""
{ start_string();
string lexbuf;
end_string();
coq lexbuf }
| eof
{ () }
| _ as c
{ character c; bracket lexbuf }
and comment = parse
| "*)"
{ if !in_proof then end_comment() }
| "(*"
{ if !in_proof then start_comment();
comment lexbuf; comment lexbuf }
| eof
{ () }
| "\n"
{ if !in_proof then newline();
comment lexbuf }
| space* as s
{ if !in_proof then space s;
comment lexbuf }
| eof
{ () }
| _ as c
{ if !in_proof then character c;
comment lexbuf }
and doc_bol = parse
| "<<" space* "\n"
{ start_verbatim();
verbatim lexbuf;
end_verbatim();
doc_bol lexbuf }
| "-"+ as d
{ dashes d; doc lexbuf }
| "\n"
{ set_enum_depth 0; doc_bol lexbuf }
| ""
{ doc lexbuf }
and doc = parse
| "*)"
{ () }
| "\n"
{ character '\n'; doc_bol lexbuf }
| "["
{ start_bracket(); bracket lexbuf; end_bracket(); doc lexbuf }
| "#" ([^ '\n' '#']* as html) "#"
{ output_string !oc html; doc lexbuf }
| eof
{ () }
| _ as c
{ character c; doc lexbuf }
and verbatim = parse
| "\n>>" space* "\n"
{ () }
| eof
{ () }
| _ as c
{ character c; verbatim lexbuf }
and globfile = parse
| eof
{ () }
| "F" (path as m) space* "\n"
{ current_module := m; add_module m;
globfile lexbuf }
| "R" (integer as pos) ":" (integer)
space+ (xref as dp)
space+ (xref as sp)
space+ (xref as id)
space+ (globkind as ty)
space* "\n"
{ add_reference !current_module (int_of_string pos) dp sp id ty;
globfile lexbuf }
| (globkind as ty)
space+ (integer as pos) ":" (integer)
space+ (xref as sp)
space+ (xref as id)
space* "\n"
{ add_definition !current_module (int_of_string pos) sp id ty;
globfile lexbuf }
| [^ '\n']* "\n"
{ globfile lexbuf }
{
let make_redirect fromfile toURL =
let oc = open_out fromfile in
output_string oc
(global_replace (Str.regexp "\\$URL") toURL Resources.redirect);
close_out oc
let output_dir = ref Filename.current_dir_name
let logical_name_base = ref ""
let generate_css = ref true
let use_short_names = ref false
let generate_redirects = ref false
let module_name_of_file_name f =
let components = Str.split (Str.regexp "/") f in
String.concat "." (List.filter (fun s -> s <> "." && s <> "..") components)
let process_v_file f =
let pref_f = Filename.chop_suffix f ".v" in
let base_f = Filename.basename pref_f in
let module_name = !logical_name_base ^ module_name_of_file_name pref_f in
current_module := module_name;
let friendly_name = if !use_short_names then base_f else module_name in
let ic = open_in f in
oc := open_out (Filename.concat !output_dir (module_name ^ ".html"));
enum_depth := 0; in_proof := false;
start_html_page friendly_name;
coq_bol (Lexing.from_channel ic);
end_html_page();
close_out !oc; oc := stdout;
close_in ic;
if !generate_redirects && !logical_name_base <> "" then
make_redirect (Filename.concat !output_dir (base_f ^ ".html"))
(module_name ^ ".html")
let process_glob_file f =
current_module := "";
let ic = open_in f in
globfile (Lexing.from_channel ic);
close_in ic
let write_file txt filename =
let oc = open_out filename in
output_string oc txt;
close_out oc
let _ =
let v_files = ref [] and glob_files = ref [] in
let process_file f =
if Filename.check_suffix f ".v" then
v_files := f :: !v_files
else if Filename.check_suffix f ".glob" then
glob_files := f :: !glob_files
else begin
eprintf "Don't know what to do with file %s\n" f; exit 2
end in
Arg.parse (Arg.align [
"-base", Arg.String (fun s -> logical_name_base := s ^ "."),
"<coqdir> Set the name space for the modules being processed";
"-coqlib", Arg.String (fun s -> add_documentation_url "Coq" s),
"<url> Set base URL for Coq standard library";
"-d", Arg.Set_string output_dir,
"<dir> Output files to directory <dir> (default: current directory)";
"-external",
(let x = ref "" in
Arg.Tuple [
Arg.Set_string x;
Arg.String (fun y -> add_documentation_url y !x)
]),
"<url> <coqdir> Set base URL for linking references whose names start with <coqdir>";
"-no-css", Arg.Clear generate_css,
" Do not add coq2html.css to the output directory";
"-redirect", Arg.Set generate_redirects,
" Generate redirection files modname.html -> coqdir.modname.html";
"-short-names", Arg.Set use_short_names,
" Use short, unqualified module names in the output"
])
process_file
"Usage: coq2html [options] file.glob ... file.v ...\nOptions are:";
if !v_files = [] then begin
eprintf "No .v file provided, aborting\n";
exit 2
end;
if (try not (Sys.is_directory !output_dir) with Sys_error _ -> true)
then begin
eprintf "Error: output directory %s does not exist or is not a directory.\n" !output_dir;
exit 2
end;
List.iter process_glob_file (List.rev !glob_files);
List.iter process_v_file (List.rev !v_files);
if !generate_css then
write_file Resources.css (Filename.concat !output_dir "coq2html.css")
}