(* [indtyuri_of_uri uri] splits an inductive-type URI at its first sharp sign.
   It returns a pair made of:
   - the URI built by UriManager.uri_of_string from the text before the
     sharp sign;
   - the integer read from the text that starts three characters after the
     sharp sign and runs to the end of the string, minus 1.
   The offset of three matches the fixed text (sharp sign, digit 1, slash)
   that the indtyuri pattern places before the number.
   In the version on the + lines, a Failure raised inside the try is turned
   into CicTextualParser0.LexerFailure; the bound name msg is not used.
   NOTE(review): String.index is evaluated before the try, so an input with
   no sharp sign is not converted to LexerFailure. Presumably the lexer
   pattern guarantees that one is present; confirm against other callers. *)
let indtyuri_of_uri uri =
let index_sharp = String.index uri '#' in
(* First character of the type number: skips the sharp sign and the two
   characters that follow it. *)
let index_num = index_sharp + 3 in
- (UriManager.uri_of_string (String.sub uri 0 index_sharp),
- int_of_string (String.sub uri index_num (String.length uri - index_num)) - 1
- )
+ try
+ (UriManager.uri_of_string (String.sub uri 0 index_sharp),
+ int_of_string(String.sub uri index_num (String.length uri - index_num)) - 1
+ )
+ with
+ Failure msg ->
+ raise (CicTextualParser0.LexerFailure "Not an inductive URI")
;;
(* [indconuri_of_uri uri] splits a constructor URI into three parts and
   returns them as a triple:
   - the URI built by UriManager.uri_of_string from the text before the
     first sharp sign;
   - the integer found between the three characters that start at the sharp
     sign and the last slash of the string, minus 1;
   - the integer found after the last slash (this one is not decremented).
   The layout matches the indconuri pattern: fixed text, a number, a slash,
   and a second number.
   In the version on the + lines, a Failure raised inside the try is turned
   into CicTextualParser0.LexerFailure; the bound name msg is not used.
   NOTE(review): String.index and String.rindex are evaluated before the
   try, so an input lacking a sharp sign or a slash is not converted to
   LexerFailure. Presumably the lexer pattern rules this out; confirm. *)
let indconuri_of_uri uri =
let index_sharp = String.index uri '#' in
(* Last slash: separates the type number from the constructor number. *)
let index_div = String.rindex uri '/' in
let index_con = index_div + 1 in
- (UriManager.uri_of_string (String.sub uri 0 index_sharp),
- int_of_string
- (String.sub uri (index_sharp + 3) (index_div - index_sharp - 3)) - 1,
- int_of_string
- (String.sub uri index_con (String.length uri - index_con))
- )
+ try
+ (UriManager.uri_of_string (String.sub uri 0 index_sharp),
+ int_of_string
+ (String.sub uri (index_sharp + 3) (index_div - index_sharp - 3)) - 1,
+ int_of_string
+ (String.sub uri index_con (String.length uri - index_con))
+ )
+ with
+ Failure msg ->
+ raise (CicTextualParser0.LexerFailure "Not a constructor URI")
+ ;;
+
+ (* TeX unquoting: replace each backslash-underscore pair in str by a plain underscore *)
+ let unquote str =
+ Str.global_replace (Str.regexp "\\\\_") "_" str
;;
}
(* Named regular expressions used by the token rule below. *)
let dollar = '$'
(* A decimal number: either a nonzero digit followed by any digits, or the
   single digit 0 (so no leading zeros). *)
let num = ['1'-'9']['0'-'9']* | '0'
-let alfa = ['A'-'Z' 'a'-'z' '_' ''' '-'] | "\\_"
-let ident = alfa (alfa | num)*
(* On the + lines an identifier must start with an ASCII letter; the
   following characters may be letters, underscore, apostrophe, dash, a
   backslash-underscore pair, or a number. On the - lines an identifier
   could start with any alfa character. *)
+let letter = ['A'-'Z' 'a'-'z']
+let alfa = letter | ['_' ''' '-'] | "\\_"
+let ident = letter (alfa | num)*
(* A leading slash, zero or more identifiers each followed by a slash, then
   a final identifier and a dot. The patterns after it append the kind
   suffix, and for inductive types and constructors one or two numbers. *)
let baseuri = '/'(ident '/')* ident '.'
let conuri = baseuri "con"
let varuri = baseuri "var"
let indtyuri = baseuri "ind#1/" num
let indconuri = baseuri "ind#1/" num "/" num
(* Input skipped by the token rule: space, tab, newline, tilde and the
   backslash-semicolon sequence; the + line also skips braces and the
   backslash-rm sequence. *)
-let blanks = [' ' '\t' '\n' '~'] | "\\;"
+let blanks = [' ' '\t' '\n' '~' '{' '}'] | "\\;" | "\\rm"
(* Main lexer rule. Blanks are skipped by calling token again; the other
   cases return one token each. On the + lines every identifier and URI
   lexeme is passed through unquote before use, and URI lexemes are
   prefixed with the cic: scheme before being converted.
   NOTE(review): L and U are module names bound outside this view;
   presumably aliases for Lexing and UriManager. Confirm. *)
rule token =
parse
blanks { token lexbuf } (* skip blanks *)
| "\\Set" { SET }
| "\\Prop" { PROP }
| "\\Type" { TYPE }
- | ident { ID (L.lexeme lexbuf) }
- | conuri { CONURI (U.uri_of_string ("cic:" ^ L.lexeme lexbuf)) }
- | varuri { VARURI (U.uri_of_string ("cic:" ^ L.lexeme lexbuf)) }
- | indtyuri { INDTYURI (indtyuri_of_uri ("cic:" ^ L.lexeme lexbuf)) }
- | indconuri { INDCONURI (indconuri_of_uri("cic:" ^ L.lexeme lexbuf)) }
+ | ident { ID (unquote (L.lexeme lexbuf)) }
+ | conuri { CONURI
+ (U.uri_of_string ("cic:" ^ (unquote (L.lexeme lexbuf)))) }
+ | varuri { VARURI
+ (U.uri_of_string ("cic:" ^ (unquote (L.lexeme lexbuf)))) }
+ | indtyuri { INDTYURI
+ (indtyuri_of_uri ("cic:" ^ (unquote (L.lexeme lexbuf)))) }
+ | indconuri { INDCONURI
+ (indconuri_of_uri("cic:" ^ (unquote (L.lexeme lexbuf)))) }
| num { NUM (int_of_string (L.lexeme lexbuf)) }
(* NOTE(review): the action of the next case is cut off in this view (the
   remainder of the hunk is not shown), so it is left undocumented. *)
| '?' num { let lexeme = L.lexeme lexbuf in
META
| eof { EOF }
(* Arithmetical operators *)
| '+' { PLUS }
+ | '-' { MINUS }
| '*' { TIMES }
| '=' { EQ }
{}