This commit was manufactured by cvs2svn to create branch 'moogle'.

[helm.git] / helm / ocaml / cic_disambiguation / cicTextualLexer2.ml
diff --git a/helm/ocaml/cic_disambiguation/cicTextualLexer2.ml b/helm/ocaml/cic_disambiguation/cicTextualLexer2.ml

deleted file mode 100644 (file)

index 22c911e..0000000
--- a/helm/ocaml/cic_disambiguation/cicTextualLexer2.ml
+++ /dev/null
@@ -1,139 +0,0 @@
-(* Copyright (C) 2004, HELM Team.
- * 
- * This file is part of HELM, an Hypertextual, Electronic
- * Library of Mathematics, developed at the Computer Science
- * Department, University of Bologna, Italy.
- * 
- * HELM is free software; you can redistribute it and/or
- * modify it under the terms of the GNU General Public License
- * as published by the Free Software Foundation; either version 2
- * of the License, or (at your option) any later version.
- * 
- * HELM is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
- * GNU General Public License for more details.
- *
- * You should have received a copy of the GNU General Public License
- * along with HELM; if not, write to the Free Software
- * Foundation, Inc., 59 Temple Place - Suite 330, Boston,
- * MA  02111-1307, USA.
- * 
- * For details, see the HELM World-Wide-Web page,
- * http://helm.cs.unibo.it/
- *)
-
-exception Error of int * int * string
-
-exception Not_an_extended_ident
-
-let regexp alpha = [ 'a' - 'z' 'A' - 'Z' ]
-let regexp digit = [ '0' - '9' ]
-let regexp blank = [ ' ' '\t' '\n' ]
-
-let regexp blanks = blank+
-let regexp num = digit+
-let regexp tex_token = '\\' alpha+
-let regexp symbol = [^ 'a' - 'z' 'A' - 'Z' '0' - '9' ' ' '\t' '\n' ]
-let regexp ident_cont = alpha | num | '_' | '\''
-let regexp ident_cont' = ident_cont | tex_token
-let regexp ident = (alpha ident_cont*) | ('_' ident_cont+)
-let regexp ident' = ((alpha | tex_token) ident_cont'*) | ('_' ident_cont'+)
-let regexp paren = [ '(' '[' '{' ')' ']' '}' ]
-let regexp implicit = '?'
-let regexp meta = '?' num
-let regexp qstring = '"' [^ '"']* '"'
-let regexp uri =
-  (*      schema      *) (*     path     *) (*  ext   *) (*    xpointer     *)
-  ("cic:/" | "theory:/") ident ('/' ident)* ('.' ident)+ ('#' num ('/' num)*)?
-(* let regexp catchall = .* *)
-
-let keywords = Hashtbl.create 17
-let _ =
-  List.iter (fun keyword -> Hashtbl.add keywords keyword ("", keyword))
-    [ "Prop"; "Type"; "Set"; "let"; "Let"; "rec"; "using"; "match"; "with" ]
-
-let error lexbuf msg =
-  raise (Error (Ulexing.lexeme_start lexbuf, Ulexing.lexeme_end lexbuf, msg))
-let error_at_end lexbuf msg =
-  raise (Error (Ulexing.lexeme_end lexbuf, Ulexing.lexeme_end lexbuf, msg))
-
-let return lexbuf token = (token, Ulexing.loc lexbuf)
-
-(*
-let parse_ext_ident ident =
-  let len = String.length ident in
-  let buf = Buffer.create len in
-  let in_tex_token = ref false in
-  let tex_token = Buffer.create 10 in
-  try
-    for i = 0 to len - 1 do
-      match ident.[i] with
-      | '\' when not !in_tex_token ->
-          if i < len - 1 &&
-          in_tex_token := true
-    done
-  with Invalid_argument -> assert false
-
-let rec token' = lexer
-  | ident' ->
-      (try
-        let ident = parse_ext_ident (Ulexing.utf8_lexeme lexbuf) in
-        return lexbuf ("IDENT'", ident)
-      with Not_an_extended_ident ->
-        Ulexing.rollback lexbuf;
-        token lexbuf)
-  | _ ->
-      Ulexing.rollback lexbuf;
-      token lexbuf
-
-and token = lexer
-*)
-let rec token = lexer
-  | blanks -> token lexbuf
-  | uri -> return lexbuf ("URI", Ulexing.utf8_lexeme lexbuf)
-  | ident ->
-      let lexeme = Ulexing.utf8_lexeme lexbuf in
-      (try
-        return lexbuf (Hashtbl.find keywords lexeme)
-      with Not_found -> return lexbuf ("IDENT", lexeme))
-  | num -> return lexbuf ("NUM", Ulexing.utf8_lexeme lexbuf)
-  | paren -> return lexbuf ("PAREN", Ulexing.utf8_lexeme lexbuf)
-  | meta -> return lexbuf ("META", Ulexing.utf8_lexeme lexbuf)
-  | implicit -> return lexbuf ("IMPLICIT", Ulexing.utf8_lexeme lexbuf)
-  | qstring ->
-      let lexeme = Ulexing.utf8_lexeme lexbuf in
-      let s = String.sub lexeme 1 (String.length lexeme - 2) in
-      return lexbuf ("QSTRING", s)
-  | symbol -> return lexbuf ("SYMBOL", Ulexing.utf8_lexeme lexbuf)
-  | tex_token ->
-      let macro =
-        Ulexing.utf8_sub_lexeme lexbuf 1 (Ulexing.lexeme_length lexbuf - 1)
-      in
-      (try
-        return lexbuf ("SYMBOL", CicTextualParser2Macro.expand macro)
-      with CicTextualParser2Macro.Macro_not_found _ ->
-        return lexbuf ("SYMBOL", Ulexing.utf8_lexeme lexbuf))
-  | eof -> return lexbuf ("EOI", "")
-  | _ -> error lexbuf "Invalid character"
-
-let tok_func stream =
-  let lexbuf = Ulexing.from_utf8_stream stream in
-  Token.make_stream_and_location
-    (fun () ->
-      try
-       token lexbuf
-      with
-      | Ulexing.Error -> error_at_end lexbuf "Unexpected character"
-      | Ulexing.InvalidCodepoint i -> error_at_end lexbuf "Invalid code point")
-
-let cic_lexer =
-  { 
-    Token.tok_func = tok_func;
-    Token.tok_using = (fun _ -> ());
-    Token.tok_removing = (fun _ -> ()); 
-    Token.tok_match = Token.default_match;
-    Token.tok_text = Token.lexer_text;
-    Token.tok_comm = None;
-  }
-