(* Copyright (C) 2005, HELM Team.
 *
 * This file is part of HELM, an Hypertextual, Electronic
 * Library of Mathematics, developed at the Computer Science
 * Department, University of Bologna, Italy.
 *
 * HELM is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version 2
 * of the License, or (at your option) any later version.
 *
 * HELM is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with HELM; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place - Suite 330, Boston,
 * MA  02111-1307, USA.
 *
 * For details, see the HELM World-Wide-Web page,
 * http://helm.cs.unibo.it/
 *)

open Printf

open CicNotationEnv
open CicNotationPt

(** Raised by the parsing entry points of this module: carries the location
    reported by the parser and a human readable message. *)
exception Parse_error of Token.flocation * string

(** Raised when a precedence outside [min_precedence .. max_precedence] is
    requested; carries the offending precedence. *)
exception Level_not_found of int

(** The extensible grammar shared by every entry below, built on the
    notation lexer. *)
let grammar = Grammar.gcreate CicNotationLexer.notation_lexer

(** Bounds (inclusive) and default for the precedence levels of the term
    grammar. *)
let min_precedence = 0
let max_precedence = 100
let default_precedence = 50

(** Grammar entries.  The first three are the public entry points for the
    three notation levels; [l2_pattern] is the entry that gets extended at
    run time with user notations. *)
let level1_pattern = Grammar.Entry.create grammar "level1_pattern"
let level2_pattern = Grammar.Entry.create grammar "level2_pattern"
let level3_term = Grammar.Entry.create grammar "level3_term"
let l2_pattern = Grammar.Entry.create grammar "l2_pattern"
let notation = Grammar.Entry.create grammar "notation"
  (* maps level 1 to level 2 *)
let interpretation = Grammar.Entry.create grammar "interpretation"
  (* maps level 2 to level 3 *)
let phrase = Grammar.Entry.create grammar "phrase"

(* NOTE(review): placeholder.  A second [return_term] is defined further down
 * in this file, before the EXTEND block, and shadows this one; nothing in
 * between refers to it. *)
let return_term loc term = ()

(** [fail floc msg] aborts with [Failure], prefixing [msg] with the character
    range obtained from [floc].
    [loc_of_floc] is not defined in this file; presumably it comes from one
    of the opened modules -- TODO confirm.
    @raise Failure always. *)
let fail floc msg =
  let (x, y) = loc_of_floc floc in
  failwith (sprintf "Error at characters %d - %d: %s" x y msg)

(** Shadows the standard [int_of_string] so that a malformed numeric lexeme
    produces a message naming the offending string.
    The message used to mention [string_of_int], which is the opposite
    conversion; it now names the function that actually failed.
    @raise Failure if [s] is not a valid integer literal. *)
let int_of_string s =
  try
    Pervasives.int_of_string s
  with Failure _ ->
    failwith (sprintf "Lexer failure: int_of_string \"%s\" failed" s)

(** {2
Grammar extension} *)

(** Terminal symbols of the run-time grammar: each one is a [Gramext.Stoken]
    whose token class is "SYMBOL", "IDENT" or "NUMBER" and whose text is
    [s]. *)
let symbol s = Gramext.Stoken ("SYMBOL", s)
let ident s = Gramext.Stoken ("IDENT", s)
let number s = Gramext.Stoken ("NUMBER", s)

(** The recursive occurrence of the entry being extended ([Gramext.Sself]). *)
let term = Gramext.Sself

(** Turns a level 1 literal into the grammar symbol matching it.  Note that a
    [`Keyword] is matched as a token of class "IDENT". *)
let g_symbol_of_literal =
  function
  | `Symbol s -> symbol s
  | `Keyword s -> ident s
  | `Number s -> number s

(** What a grammar symbol of a production contributes to the environment
    handed to the semantic action:
    - [NoBinding]: nothing (used below for literals and layout symbols);
    - [Binding (name, ty)]: one variable of the given type;
    - [Env decls]: a whole environment (used below for magic patterns). *)
type binding =
  | NoBinding
  | Binding of string * value_type
  | Env of (string * value_type) list

(** [make_action action bindings] builds the [Gramext.action] for a production
    whose symbols are described, in order, by [bindings].

    The result is a chain of nested functions, one per binding, built by
    walking [List.rev bindings]; each function receives the value parsed for
    its symbol and pushes the matching entry on the environment [vl].  Once
    the bindings are exhausted the innermost function receives the location
    and calls [action vl loc].

    Side effect: every step writes a trace line on stderr. *)
let make_action action bindings =
  let rec aux (vl : CicNotationEnv.t) =
    function
      [] ->
        prerr_endline "aux: make_action";
        Gramext.action (fun (loc: location) -> action vl loc)
    | NoBinding :: tl ->
        prerr_endline "aux: none";
        (* the parsed value is dropped, the environment is unchanged *)
        Gramext.action (fun _ -> aux vl tl)
    (* LUCA: DEFCON 2 BEGIN *)
    | Binding (name, TermType) :: tl ->
        prerr_endline "aux: term";
        Gramext.action
          (fun (v:term) -> aux ((name, (TermType, (TermValue v)))::vl) tl)
    | Binding (name, StringType) :: tl ->
        prerr_endline "aux: string";
        Gramext.action
          (fun (v:string) ->
            aux ((name, (StringType, (StringValue v))) :: vl) tl)
    | Binding (name, NumType) :: tl ->
        prerr_endline "aux: num";
        Gramext.action
          (fun (v:string) -> aux ((name, (NumType, (NumValue v))) :: vl) tl)
    | Binding (name, OptType t) :: tl ->
        prerr_endline "aux: opt";
        Gramext.action
          (fun (v:'a option) ->
            aux ((name, (OptType t, (OptValue v))) :: vl) tl)
    | Binding (name, ListType t) :: tl ->
        prerr_endline "aux: list";
        Gramext.action
          (fun (v:'a list) ->
            aux ((name, (ListType t, (ListValue v))) :: vl) tl)
    | Env _ :: tl ->
        prerr_endline "aux: env";
        (* the parsed value is itself an environment: prepend it whole *)
        Gramext.action (fun (v:CicNotationEnv.t) -> aux (v @ vl) tl)
    (* LUCA: DEFCON 2 END *)
  in
    aux [] (List.rev bindings)

(** Collects, in order, the [(name, type)] declarations carried by a list of
    bindings: [NoBinding] contributes nothing, [Binding] one pair and [Env]
    all of its pairs. *)
let flatten_opt =
  let rec aux acc =
    function
      [] -> List.rev acc
    | NoBinding :: tl -> aux acc tl
    (* names are pushed reversed because [acc] is reversed at the end *)
    | Env names :: tl -> aux (List.rev names @ acc) tl
    | Binding (name, ty) :: tl -> aux ((name, ty) :: acc) tl
  in
  aux []

  (* given a level 1 pattern computes the new RHS of "term" grammar entry *)
(** [extract_term_production pattern] returns a list of
    [(binding, grammar symbol)] pairs, one per symbol of the production
    derived from [pattern].

    Unsupported terms are printed on stderr and then hit [assert false];
    [Ascription] and [FreshVar] variables also hit [assert false]. *)
let extract_term_production pattern =
  let rec aux = function
    | AttributedTerm (_, t) -> aux t
    | Literal l -> aux_literal l
    | Layout l -> aux_layout l
    | Magic m -> aux_magic m
    | Variable v -> aux_variable v
    | t ->
        prerr_endline (CicNotationPp.pp_term t);
        assert false
  (* literals become plain tokens that bind nothing *)
  and aux_literal =
    function
    | `Symbol s -> [NoBinding, symbol s]
    | `Keyword s -> [NoBinding, ident s]
    | `Number s -> [NoBinding, number s]
  (* layouts are flattened into their sub-patterns, separated (or prefixed)
   * by the corresponding backslash symbol; breaks vanish and boxes are
   * concatenated *)
  and aux_layout = function
    | Sub (p1, p2) -> aux p1 @ [NoBinding, symbol "\\SUB"] @ aux p2
    | Sup (p1, p2) -> aux p1 @ [NoBinding, symbol "\\SUP"] @ aux p2
    | Below (p1, p2) -> aux p1 @ [NoBinding, symbol "\\BELOW"] @ aux p2
    | Above (p1, p2) -> aux p1 @ [NoBinding, symbol "\\ABOVE"] @ aux p2
    | Frac (p1, p2) -> aux p1 @ [NoBinding, symbol "\\FRAC"] @ aux p2
    | Atop (p1, p2) -> aux p1 @ [NoBinding, symbol "\\ATOP"] @ aux p2
    | Over (p1, p2) -> aux p1 @ [NoBinding, symbol "\\OVER"] @ aux p2
    | Root (p1, p2) ->
        (* second component first: this mirrors the level 1 rule for
         * "\\ROOT", which builds [Root (arg, index)] from
         * "\\ROOT" index "\\OF" arg *)
        [NoBinding, symbol "\\ROOT"] @ aux p2 @ [NoBinding, symbol "\\OF"]
        @ aux p1
    | Sqrt p -> [NoBinding, symbol "\\SQRT"] @ aux p
    | Break -> []
    | Box (_, pl) -> List.flatten (List.map aux pl)
  (* magic patterns become a single symbol, built with [Gramext.srules],
   * whose semantic value is an environment (hence the [Env] binding) *)
  and aux_magic magic =
    match magic with
    | Opt p ->
        let p_bindings, p_atoms, p_names, p_action = inner_pattern p in
        (* [opt_binding_some], [opt_binding_of_name] and [opt_declaration]
         * are not defined in this file; presumably they come from
         * CicNotationEnv -- TODO confirm *)
        let action (env_opt : CicNotationEnv.t option) (loc : location) =
          match env_opt with
          | Some env -> List.map opt_binding_some env
          | None -> List.map opt_binding_of_name p_names
        in
        [ Env (List.map opt_declaration p_names),
          Gramext.srules
            [ [ Gramext.Sopt (Gramext.srules [ p_atoms, p_action ]) ],
              Gramext.action action ] ]
    | List0 (p, _)
    | List1 (p, _) ->
        let p_bindings, p_atoms, p_names, p_action = inner_pattern p in
        (* starting environment, one entry per name of the inner pattern;
         * [list_binding_of_name] and [list_declaration] are not defined in
         * this file -- presumably from CicNotationEnv, TODO confirm *)
        let env0 = List.map list_binding_of_name p_names in
        (* conses [v] on the [ListValue] bound to [n] in [env]; any entry
         * that is not a [ListValue] hits [assert false] *)
        let grow_env_entry env n v =
          prerr_endline "grow_env_entry";
          List.map
            (function
              | (n', (ty, ListValue vl)) as entry ->
                  if n' = n then n', (ty, ListValue (v :: vl)) else entry
              | _ -> assert false)
            env
        in
        (* pushes every value of the single-iteration environment [env_i]
         * on the matching list of [env] *)
        let grow_env env_i env =
          prerr_endline "grow_env";
          List.fold_left
            (fun env (n, (_, v)) -> grow_env_entry env n v)
            env env_i
        in
        (* fold_right plus consing: the last iteration is pushed first, so
         * each resulting list keeps the order of [env_list] *)
        let action (env_list : CicNotationEnv.t list) (loc : location) =
          prerr_endline "list action";
          List.fold_right grow_env env_list env0
        in
        (* picks the repetition operator, with or without separator *)
        let g_symbol s =
          match magic with
          | List0 (_, None) -> Gramext.Slist0 s
          | List1 (_, None) -> Gramext.Slist1 s
          | List0 (_, Some l) -> Gramext.Slist0sep (s, g_symbol_of_literal l)
          | List1 (_, Some l) -> Gramext.Slist1sep (s, g_symbol_of_literal l)
          | _ -> assert false
        in
        [ Env (List.map list_declaration p_names),
          Gramext.srules
            [ [ g_symbol (Gramext.srules [ p_atoms, p_action ]) ],
              Gramext.action action ] ]
    | _ -> assert false
  (* variables become a token (with empty text) or the recursive entry, and
   * bind their own name *)
  and aux_variable =
    function
    | NumVar s -> [Binding (s, NumType), number ""]
    | TermVar s -> [Binding (s, TermType), term]
    | IdentVar s -> [Binding (s, StringType), ident ""]
    | Ascription (p, s) -> assert false (* TODO *)
    | FreshVar _ -> assert false
  (* production for the body of a magic pattern: returns its bindings, its
   * grammar symbols, its declared names and an action that simply returns
   * the environment built while parsing it *)
  and inner_pattern p =
    let p_bindings, p_atoms = List.split (aux p) in
    let p_names = flatten_opt p_bindings in
    let _ = prerr_endline ("inner names: " ^ String.concat " " (List.map fst p_names)) in
    let action =
      make_action (fun (env : CicNotationEnv.t) (loc : location) -> env)
        p_bindings
    in
    p_bindings, p_atoms, p_names, action
  in
  aux pattern

(** Name of the grammar level for [precedence] (its decimal representation).
    @raise Level_not_found if [precedence] is smaller than [min_precedence]
    or greater than [max_precedence]. *)
let level_of_int precedence =
  if precedence < min_precedence || precedence > max_precedence then
    raise (Level_not_found precedence);
  string_of_int precedence

(** Identifier of an added rule: the list of its grammar symbols, as returned
    by [extend] and accepted by [delete]. *)
type rule_id = Token.t Gramext.g_symbol list

(** [extend level1_pattern ?precedence ?associativity action] adds to the
    [l2_pattern] entry, at the level named after [precedence], the production
    extracted from [level1_pattern].  When the rule fires, [action] is called
    with the environment of parsed values and the location.

    Returns the symbols of the new rule.  Writes the number of bindings on
    stderr.
    @raise Level_not_found via [level_of_int] on out of range precedence.

    NOTE(review): [p_names] is computed but never used. *)
let extend level1_pattern ?(precedence = default_precedence) ?associativity
  action
=
  let p_bindings, p_atoms =
    List.split (extract_term_production level1_pattern)
  in
  let level = level_of_int precedence in
  let p_names = flatten_opt p_bindings in
  let _ =
    prerr_endline (string_of_int (List.length p_bindings));
    Grammar.extend
      [ Grammar.Entry.obj (l2_pattern: 'a Grammar.Entry.e),
        Some (Gramext.Level level),
        [ None,
          associativity,
          [ p_atoms,
            (make_action
              (fun (env: CicNotationEnv.t) (loc: location) -> (action env loc))
              p_bindings) ]]]
  in
  p_atoms

(** Removes from [l2_pattern] the rule made of the symbols [atoms]. *)
let delete atoms = Grammar.delete_rule l2_pattern atoms

(** {2 Grammar} *)

(** A singleton list stands for its only element; any other list is wrapped
    in a horizontal box. *)
let boxify = function
  | [ a ] -> a
  | l -> Layout (Box (H, l))

(** [fold_binder binder pt_names body] nests one [Binder] node per bound name
    around [body].  [pt_names] is a list of clusters [(names, ty)]; every name
    of a cluster gets the type [ty] of the cluster, and the first name of the
    first cluster ends up outermost. *)
let fold_binder binder pt_names body =
  let fold_cluster binder terms ty body =
    List.fold_right
      (fun term body -> Binder (binder, (term, ty), body))
      terms body  (* terms are names: either Ident or FreshVar *)
  in
  List.fold_right
    (fun (names, ty) body -> fold_cluster binder names ty body)
    pt_names body

(** Wraps [term] in an [AttributedTerm] carrying the location [loc]. *)
let return_term loc term = AttributedTerm (`Loc loc, term)

let _ = (* create empty precedence level for "l2_pattern" *)
  (* builds, in increasing order, one empty level per integer from [first] to
   * [last]; each level is named after its number *)
  let mk_level_list first last =
    let rec aux acc = function
      | i when i < first -> acc
      | i -> aux ((Some (string_of_int i), None, []) :: acc) (i - 1)
    in
    aux [] last
  in
  Grammar.extend
    [ Grammar.Entry.obj (l2_pattern: 'a Grammar.Entry.e),
      None,
      mk_level_list min_precedence max_precedence ]

(* Static part of the grammar.
 * NOTE(review): the unicode quotations used as SYMBOL arguments below carry no
 * entity name in this copy of the file, which suggests the text was damaged;
 * the comment next to each one shows the intended glyph.  Verify against the
 * upstream source before building. *)
EXTEND
  GLOBAL: level1_pattern level2_pattern level3_term
          l2_pattern
          notation interpretation
          phrase;

(* {{{ Grammar for concrete syntax patterns, notation level 1 *)
  level1_pattern: [ [ p = l1_simple_pattern -> p ] ];
  l1_pattern: [ [ p = LIST1 l1_simple_pattern -> p ] ];
  literal: [
    [ s = SYMBOL -> `Symbol s
    | k = KEYWORD -> `Keyword k
    | n = NUMBER -> `Number n
    ]
  ];
  sep:       [ [ SYMBOL "\\SEP";      sep = literal -> sep ] ];
(*   row_sep:   [ [ SYMBOL "\\ROWSEP";   sep = literal -> sep ] ];
  field_sep: [ [ SYMBOL "\\FIELDSEP"; sep = literal -> sep ] ]; *)
  (* repetition and optionality; lists take an optional separator *)
  l1_magic_pattern: [
    [ SYMBOL "\\LIST0"; p = l1_simple_pattern; sep = OPT sep -> List0 (p, sep)
    | SYMBOL "\\LIST1"; p = l1_simple_pattern; sep = OPT sep -> List1 (p, sep)
    | SYMBOL "\\OPT";   p = l1_simple_pattern -> Opt p
    ]
  ];
  l1_pattern_variable: [
    [ SYMBOL "\\TERM"; id = IDENT -> TermVar id
    | SYMBOL "\\NUM"; id = IDENT -> NumVar id
    | SYMBOL "\\IDENT"; id = IDENT -> IdentVar id
    ]
  ];
  l1_simple_pattern:
    [ "layout" LEFTA
      [ p1 = SELF; SYMBOL "\\SUB"; p2 = SELF ->
          return_term loc (Layout (Sub (p1, p2)))
      | p1 = SELF; SYMBOL "\\SUP"; p2 = SELF ->
          return_term loc (Layout (Sup (p1, p2)))
      | p1 = SELF; SYMBOL "\\BELOW"; p2 = SELF ->
          return_term loc (Layout (Below (p1, p2)))
      | p1 = SELF; SYMBOL "\\ABOVE"; p2 = SELF ->
          return_term loc (Layout (Above (p1, p2)))
      | p1 = SELF; SYMBOL "\\OVER"; p2 = SELF ->
          return_term loc (Layout (Over (p1, p2)))
      | p1 = SELF; SYMBOL "\\ATOP"; p2 = SELF ->
          return_term loc (Layout (Atop (p1, p2)))
(*       | SYMBOL "\\ARRAY"; p = SELF; csep = OPT field_sep; rsep = OPT row_sep ->
          return_term loc (Array (p, csep, rsep)) *)
      | SYMBOL "\\FRAC"; p1 = SELF; p2 = SELF ->
          return_term loc (Layout (Frac (p1, p2)))
      | SYMBOL "\\SQRT"; p = SELF -> return_term loc (Layout (Sqrt p))
      (* the argument is stored first, the index second.
       * NOTE(review): the semicolon closing this action looks
       * unintentional -- confirm the preprocessor accepts it *)
      | SYMBOL "\\ROOT"; index = SELF; SYMBOL "\\OF"; arg = SELF ->
          return_term loc (Layout (Root (arg, index)));
      | SYMBOL "\\HBOX"; DELIM "\\["; p = l1_pattern; DELIM "\\]" ->
          return_term loc (Layout (Box (H, p)))
      | SYMBOL "\\VBOX"; DELIM "\\["; p = l1_pattern; DELIM "\\]" ->
          return_term loc (Layout (Box (V, p)))
      | SYMBOL "\\BREAK" -> return_term loc (Layout Break)
      (* plain grouping: see [boxify] for the single element case *)
      | DELIM "\\["; p = l1_pattern; DELIM "\\]" ->
          return_term loc (boxify p)
      | p = SELF; SYMBOL "\\AS"; id = IDENT ->
          return_term loc (Variable (Ascription (p, id)))
      ]
    | "simple" NONA
      [ i = IDENT -> return_term loc (Ident (i, None))
      | m = l1_magic_pattern -> return_term loc (Magic m)
      | v = l1_pattern_variable -> return_term loc (Variable v)
      | l = literal -> return_term loc (Literal l)
      ]
    ];
(* }}} *)

(* {{{ Grammar for ast patterns, notation level 2 *)
  level2_pattern: [ [ p = l2_pattern -> p ] ];
  sort: [
    [ SYMBOL "\\PROP" -> `Prop
    | SYMBOL "\\SET" -> `Set
    | SYMBOL "\\TYPE" -> `Type
    ]
  ];
  explicit_subst: [
    [ SYMBOL "\\subst";  (* to avoid catching frequent "a [1]" cases *)
      SYMBOL "[";
      substs = LIST1 [
        i = IDENT; SYMBOL <:unicode> (* ≔ *); t = l2_pattern -> (i, t)
      ] SEP SYMBOL ";";
      SYMBOL "]" ->
        substs
    ]
  ];
  (* one slot of a meta substitution: an underscore yields [None] *)
  meta_subst: [
    [ s = SYMBOL "_" -> None
    | p = l2_pattern -> Some p ]
  ];
  meta_substs: [
    [ SYMBOL "["; substs = LIST0 meta_subst; SYMBOL "]" -> substs ]
  ];
  possibly_typed_name: [
    [ SYMBOL "("; id = bound_name; SYMBOL ":"; typ = l2_pattern; SYMBOL ")" ->
        id, Some typ
    | id = bound_name -> id, None
    ]
  ];
  (* left hand side of a match branch: a bare identifier, or a parenthesised
   * identifier followed by at least one variable *)
  match_pattern: [
    [ id = IDENT -> id, []
    | SYMBOL "("; id = IDENT; vars = LIST1 possibly_typed_name; SYMBOL ")" ->
        id, vars
    ]
  ];
  binder: [
    [ SYMBOL <:unicode> (* Π *) -> `Pi
    | SYMBOL <:unicode> (* ∃ *) -> `Exists
    | SYMBOL <:unicode> (* ∀ *) -> `Forall
    | SYMBOL <:unicode> (* λ *) -> `Lambda
    ]
  ];
  bound_name: [
    [ i = IDENT -> Ident (i, None)
    | SYMBOL "\\FRESH"; i = IDENT -> Variable (FreshVar i)
    ]
  ];
  (* either one unparenthesised cluster of comma separated names with an
   * optional type, or one or more parenthesised clusters; the result is
   * always a list of (names, optional type) clusters *)
  bound_names: [
    [ vars = LIST1 bound_name SEP SYMBOL ",";
      ty = OPT [ SYMBOL ":"; p = l2_pattern -> p ] ->
        [ vars, ty ]
    | clusters = LIST1 [
        SYMBOL "(";
        vars = LIST1 bound_name SEP SYMBOL ",";
        ty = OPT [ SYMBOL ":"; p = l2_pattern -> p ];
        SYMBOL ")" ->
          vars, ty
      ] ->
        clusters
    ]
  ];
  induction_kind: [
    [ IDENT "rec" -> `Inductive
    | IDENT "corec" -> `CoInductive
    ]
  ];
  (* mutually recursive definitions separated by "and"; each one yields
   * ((name, optional type), body, index) where the arguments have been
   * abstracted in the body (lambda) and in the type (pi) *)
  let_defs: [
    [ defs = LIST1 [
        name = bound_name; args = bound_names;
        index_name = OPT [ IDENT "on"; id = bound_name -> id ];
        ty = OPT [ SYMBOL ":" ; p = l2_pattern -> p ];
        SYMBOL <:unicode> (* ≝ *); body = l2_pattern ->
          let body = fold_binder `Lambda args body in
          let ty =
            match ty with
            | None -> None
            | Some ty -> Some (fold_binder `Pi args ty)
          in
          (* looks [name] up in one cluster, counting from [p]: returns the
           * position if found, paired with the position the scan stopped
           * at (the offset past the cluster when the name is absent) *)
          let rec position_of name p = function
            | [] -> None, p
            | n :: _ when n = name -> Some p, p
            | _ :: tl -> position_of name (p + 1) tl
          in
          (* position of [name] among all the arguments, counted across the
           * clusters; [n] is the number of arguments already skipped *)
          let rec find_arg name n = function
            | [] ->
                fail loc (sprintf "Argument %s not found"
                  (CicNotationPp.pp_term name))
            | (l,_) :: tl ->
                (match position_of name 0 l with
                | None, len -> find_arg name (n + len) tl
                | Some where, len -> n + where)
          in
          (* without an "on" clause the index is 0 *)
          let index =
            match index_name with
            | None -> 0
            | Some name -> find_arg name 0 args
          in
          (name, ty), body, index
      ] SEP IDENT "and" ->
        defs
    ]
  ];
  l2_pattern_variable: [
    [ SYMBOL "\\TERM"; id = IDENT -> TermVar id
    | SYMBOL "\\NUM"; id = IDENT -> NumVar id
    | SYMBOL "\\IDENT"; id = IDENT -> IdentVar id
    | SYMBOL "\\FRESH"; id = IDENT -> FreshVar id
    ]
  ];
  l2_magic_pattern: [
    [ SYMBOL "\\FOLD";
      kind = [ IDENT "left" -> `Left | IDENT "right" -> `Right ];
      DELIM "\\["; base = l2_pattern; DELIM "\\]";
      SYMBOL "\\LAMBDA"; id = IDENT;
      DELIM "\\["; recursive = l2_pattern; DELIM "\\]" ->
        Fold (kind, base, [id], recursive)
    | SYMBOL "\\DEFAULT";
      DELIM "\\["; some = l2_pattern; DELIM "\\]";
      DELIM "\\["; none = l2_pattern; DELIM "\\]" ->
        Default (some, none)
    ]
  ];
  (* The rules below fill four of the levels created empty above. *)
  l2_pattern: LEVEL "10"  (* let in *)
    [ "10" NONA
      (* NOTE(review): this rule matches a bare "in" token while the next one
       * uses IDENT "in" -- confirm which token the lexer produces *)
      [ IDENT "let"; var = possibly_typed_name; SYMBOL <:unicode> (* ≝ *);
        p1 = l2_pattern; "in"; p2 = l2_pattern ->
          return_term loc (LetIn (var, p1, p2))
      | IDENT "let"; k = induction_kind; defs = let_defs; IDENT "in";
        body = l2_pattern ->
          return_term loc (LetRec (k, defs, body))
      ]
    ];
  l2_pattern: LEVEL "20"  (* binder *)
    [ "20" RIGHTA
      [ b = binder; names = bound_names; SYMBOL "."; body = l2_pattern ->
          return_term loc (fold_binder b names body)
      ]
    ];
  l2_pattern: LEVEL "70"  (* apply *)
    [ "70" LEFTA
      [ p1 = l2_pattern; p2 = l2_pattern ->
          (* flattens the head, looking through one location attribute, so
           * that nested applications become a single [Appl] *)
          let rec aux = function
            | Appl (hd :: tl)
            | AttributedTerm (_, Appl (hd :: tl)) ->
                aux hd @ tl
            | term -> [term]
          in
          return_term loc (Appl (aux p1 @ [p2]))
      ]
    ];
  l2_pattern: LEVEL "90"  (* simple *)
    [ "90" NONA
      [ id = IDENT -> return_term loc (Ident (id, None))
      | id = IDENT; s = explicit_subst -> return_term loc (Ident (id, Some s))
      | u = URI -> return_term loc (Uri (u, None))
      (* also writes a trace line on stderr *)
      | n = NUMBER -> prerr_endline "number"; return_term loc (Num (n, 0))
      | IMPLICIT -> return_term loc (Implicit)
      | m = META -> return_term loc (Meta (int_of_string m, []))
      | m = META; s = meta_substs -> return_term loc (Meta (int_of_string m, s))
      | s = sort -> return_term loc (Sort s)
      (* pattern matching: optional bracketed out type, scrutinee, optional
       * inductive type name, then branches separated by "|" *)
      | outtyp = OPT [ SYMBOL "["; ty = l2_pattern; SYMBOL "]" -> ty ];
        IDENT "match"; t = l2_pattern;
        indty_ident = OPT [ SYMBOL ":"; id = IDENT -> id ];
        IDENT "with"; SYMBOL "[";
        patterns = LIST0 [
          lhs = match_pattern; SYMBOL <:unicode> (* ⇒ *); rhs = l2_pattern ->
            lhs, rhs
        ] SEP SYMBOL "|";
        SYMBOL "]" ->
          return_term loc (Case (t, indty_ident, outtyp, patterns))
      (* a type cast is encoded as an application of the "cast" symbol *)
      | SYMBOL "("; p1 = l2_pattern; SYMBOL ":"; p2 = l2_pattern; SYMBOL ")" ->
          return_term loc (Appl [ Symbol ("cast", 0); p1; p2 ])
      (* plain parentheses return the inner term without a new location *)
      | SYMBOL "("; p = l2_pattern; SYMBOL ")" -> p
      | v = l2_pattern_variable -> return_term loc (Variable v)
      | m = l2_magic_pattern -> return_term loc (Magic m)
      ]
    ];
(* }}} *)

(* {{{ Grammar for interpretation, notation level 3 *)
  argument: [
    [ id = IDENT -> IdentArg id
    | SYMBOL <:unicode> (* η *); SYMBOL "."; a = SELF -> EtaArg (None, a)
    | SYMBOL <:unicode> (* η *); id = IDENT; SYMBOL "."; a = SELF ->
        EtaArg (Some id, a)
    ]
  ];
  level3_term: [
    [ u = URI -> UriPattern u
    | a = argument -> ArgPattern a
    | SYMBOL "("; terms = LIST1 SELF; SYMBOL ")" ->
        (* LIST1 never yields the empty list; a single parenthesised term is
         * returned as is *)
        (match terms with
        | [] -> assert false
        | [term] -> term
        | terms -> ApplPattern terms)
    ]
  ];
(* }}} *)

(* {{{ Notation glues *)
  associativity: [
    [ IDENT "left";  IDENT "associative" -> Gramext.LeftA
    | IDENT "right"; IDENT "associative" -> Gramext.RightA
    | IDENT "non"; IDENT "associative" -> Gramext.NonA
    ]
  ];
  precedence: [
    [ IDENT "with"; IDENT "precedence"; n = NUMBER -> int_of_string n ]
  ];
  notation: [
    [ p1 = level1_pattern;
      assoc = OPT associativity; prec = OPT precedence;
      IDENT "for";
      p2 = level2_pattern ->
        (p1, assoc, prec, p2)
    ]
  ];
  interpretation: [
    [ s = SYMBOL; args = LIST1 argument; SYMBOL "="; t = level3_term ->
        (s, args, t)
    ]
  ];
(* }}} *)

(* {{{ Top-level phrases *)
  (* every phrase is terminated by a "." symbol *)
  phrase: [
    [ IDENT "print"; p2 = level2_pattern; SYMBOL "." -> Print p2
    | IDENT "notation"; (l1, assoc, prec, l2) = notation; SYMBOL "." ->
        Notation (l1, assoc, prec, l2)
    | IDENT "interpretation"; (symbol, args, l3) = interpretation; SYMBOL "." ->
        Interpretation ((symbol, args), l3)
    | IDENT "render"; u = URI; SYMBOL "." -> Render (UriManager.uri_of_string u)
    ]
  ];
(* }}} *)
END

(** {2 API implementation} *)

(** Runs [f ()] and turns located parser exceptions into [Parse_error]: the
    message of a [Stream.Error] is used as is, any other wrapped exception is
    rendered with [Printexc.to_string].  Exceptions that are not
    [Stdpp.Exc_located] propagate unchanged.
    @raise Parse_error on any [Stdpp.Exc_located]. *)
let exc_located_wrapper f =
  try
    f ()
  with
  | Stdpp.Exc_located (floc, Stream.Error msg) ->
      raise (Parse_error (floc, msg))
  | Stdpp.Exc_located (floc, exn) ->
      raise (Parse_error (floc, (Printexc.to_string exn)))

(** Parses [stream] with the [level1_pattern] entry.
    @raise Parse_error see [exc_located_wrapper]. *)
let parse_syntax_pattern stream =
  exc_located_wrapper
    (fun () -> Grammar.Entry.parse level1_pattern stream)

(** Parses [stream] with the [level2_pattern] entry.
    @raise Parse_error see [exc_located_wrapper]. *)
let parse_ast_pattern stream =
  exc_located_wrapper
    (fun () -> Grammar.Entry.parse level2_pattern stream)

(** Parses [stream] with the [level3_term] entry.
    @raise Parse_error see [exc_located_wrapper]. *)
let parse_interpretation stream =
  exc_located_wrapper
    (fun () -> Grammar.Entry.parse level3_term stream)

(** Parses [stream] with the [phrase] entry.
    @raise Parse_error see [exc_located_wrapper]. *)
let parse_phrase stream =
  exc_located_wrapper
    (fun () -> Grammar.Entry.parse phrase stream)

(** {2 Debugging} *)

(** Prints the current contents of the [l2_pattern] entry on the standard
    formatter, then flushes both the formatter and stdout. *)
let print_l2_pattern () =
  Grammar.print_entry Format.std_formatter (Grammar.Entry.obj l2_pattern);
  Format.pp_print_flush Format.std_formatter ();
  flush stdout

(* vim:set encoding=utf8 foldmethod=marker: *)