let regexp ident_letter = [ 'a' - 'z' 'A' - 'Z' ]
+ (* must be in sync with "is_ligature_char" below *)
let regexp ligature_char = [ "'`~!?@*()[]<>-+=|:;.,/\"" ]
let regexp ligature = ligature_char ligature_char+
+(* [is_ligature_char c] is true iff [c] is one of the characters listed in
+ * the ligature_char regexp, i.e. a character that may be part of a ligature *)
+let is_ligature_char =
+  (* must be in sync with "regexp ligature_char" above *)
+  let chars = "'`~!?@*()[]<>-+=|:;.,/\"" in
+  (* String.contains is the stdlib membership test; same result as catching
+   * Not_found around String.index *)
+  (fun char -> String.contains chars char)
+
let regexp ident_decoration = '\'' | '?' | '`'
let regexp ident_cont = ident_letter | xml_digit | '_'
let regexp ident = ident_letter ident_cont* ident_decoration*
let _ =
List.iter (fun k -> Hashtbl.add level2_ast_keywords k ())
[ "CProp"; "Prop"; "Type"; "Set"; "let"; "rec"; "corec"; "match";
- "with"; "in"; "and"; "to"; "as"; "on" ]
+ "with"; "in"; "and"; "to"; "as"; "on"; "return" ]
let add_level2_ast_keyword k = Hashtbl.add level2_ast_keywords k ()
let remove_level2_ast_keyword k = Hashtbl.remove level2_ast_keywords k
("<>", <:unicode<neq>>); (":=", <:unicode<def>>);
]
+let regexp uri_step = [ 'a' - 'z' 'A' - 'Z' '0' - '9' '_' '-' ]+
+
let regexp uri =
("cic:/" | "theory:/") (* schema *)
- ident ('/' ident)* (* path *)
+(* the path was ident ('/' ident)* ; unlike ident, a uri_step may start with
+ * a digit or '_' and may contain '-', but takes no ident decorations *)
+ uri_step ('/' uri_step)* (* path *)
('.' ident)+ (* ext *)
("#xpointer(" number ('/' number)+ ")")? (* xpointer *)
lexer
| ligature ->
let lexeme = Ulexing.utf8_lexeme lexbuf in
- (match Hashtbl.find_all ligatures lexeme with
+ (match List.rev (Hashtbl.find_all ligatures lexeme) with
| [] -> (* ligature not found, rollback and try default lexer *)
Ulexing.rollback lexbuf;
k lexbuf
- | ligs -> (* ligatures found, use the default one *)
- let default_lig = List.hd (List.rev ligs) in
+ | default_lig :: _ -> (* ligatures found, use the default one *)
return_symbol lexbuf default_lig)
| eof -> return_eoi lexbuf
| _ -> (* not a ligature, rollback and try default lexer *)
let level2_ast_lexer = mk_lexer level2_ast_token
let level2_meta_lexer = mk_lexer level2_meta_token
+(* [lookup_ligatures lexeme] returns the list of symbols found for [lexeme].
+ * If [lexeme] starts with a backslash, the rest of it is passed to
+ * Utf8Macro.expand and the single result is returned; otherwise all the
+ * bindings of [lexeme] in the ligatures table are returned, oldest binding
+ * first. The result is [] for the empty lexeme and whenever Invalid_argument
+ * or Utf8Macro.Macro_not_found is raised during the lookup. *)
+let lookup_ligatures lexeme =
+  if String.length lexeme = 0 then
+    (* explicit check: do not rely on the bounds check of lexeme.[0], which
+     * is not performed when the file is compiled with -unsafe *)
+    []
+  else
+    try
+      if lexeme.[0] = '\\'
+      then [ Utf8Macro.expand (String.sub lexeme 1 (String.length lexeme - 1)) ]
+      else List.rev (Hashtbl.find_all ligatures lexeme)
+    with Invalid_argument _ | Utf8Macro.Macro_not_found _ -> []
+