1 (* Copyright (C) 2000, HELM Team.
3 * This file is part of HELM, an Hypertextual, Electronic
4 * Library of Mathematics, developed at the Computer Science
5 * Department, University of Bologna, Italy.
7 * HELM is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU General Public License
9 * as published by the Free Software Foundation; either version 2
10 * of the License, or (at your option) any later version.
12 * HELM is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
17 * You should have received a copy of the GNU General Public License
18 * along with HELM; if not, write to the Free Software
19 * Foundation, Inc., 59 Temple Place - Suite 330, Boston,
22 * For details, see the HELM World-Wide-Web page,
23 * http://cs.unibo.it/helm/.
26 (******************************************************************************)
30 (* Claudio Sacerdoti Coen <sacerdot@cs.unibo.it> *)
33 (* This is the main (top level) module of a parser for cic objects from xml *)
34 (* files to the internal representation. It uses the modules cicParser2 *)
35 (* (objects level) and cicParser3 (terms level) *)
37 (******************************************************************************)
39 exception Getter_failure of string * string
40 exception Parser_failure of string
42 (** tries to recover from a parse error caused by the parsing of a getter
43 * error message (e.g. Key_not_found exception). Unfortunately we have to
44 * re-parse xml document to extract exception data *)
45 let try_recover exn filename =
49 Pxp_ev_parser.create_entity_manager ~is_document:true
50 PxpHelmConf.pxp_config (Pxp_types.from_file filename)
53 Pxp_ev_parser.create_pull_parser PxpHelmConf.pxp_config
54 (`Entry_document []) entity_manager
59 | Some (Pxp_types.E_start_tag ("html", attrs, _, _)) ->
60 let exn = List.assoc "helm:exception" attrs in
62 try List.assoc "helm:exception_arg" attrs with Not_found -> ""
64 rc := Some (Getter_failure (exn, arg))
68 with _ -> raise (Parser_failure (Printexc.to_string exn)));
70 | None -> raise (Parser_failure (Printexc.to_string exn))
71 | Some exn -> raise exn
73 let parse_document filename =
75 Pxp_tree_parser.parse_document_entity PxpHelmConf.pxp_config
76 (Pxp_types.from_file ~alt:[PxpUrlResolver.url_resolver] filename)
79 raise (try_recover exn filename)
81 (* given the filename of an xml file of a cic object it returns its internal *)
83 let annobj_of_xml filename filenamebody =
85 let doc = parse_document filename in
86 let docroot = doc#root in
87 match filenamebody with
90 let docbody = parse_document filename in
91 docroot,Some docbody#root
93 CicParser2.get_term root rootbody
95 let obj_of_xml filename filenamebody =
96 Deannotate.deannotate_obj (annobj_of_xml filename filenamebody)