(* Copyright (C) 2000, HELM Team. * * This file is part of HELM, an Hypertextual, Electronic * Library of Mathematics, developed at the Computer Science * Department, University of Bologna, Italy. * * HELM is free software; you can redistribute it and/or * modify it under the terms of the GNU General Public License * as published by the Free Software Foundation; either version 2 * of the License, or (at your option) any later version. * * HELM is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with HELM; if not, write to the Free Software * Foundation, Inc., 59 Temple Place - Suite 330, Boston, * MA 02111-1307, USA. * * For details, see the HELM World-Wide-Web page, * http://cs.unibo.it/helm/. *) (******************************************************************************) (* *) (* PROJECT HELM *) (* *) (* Claudio Sacerdoti Coen *) (* 24/01/2000 *) (* *) (* This is the main (top level) module of a parser for cic objects from xml *) (* files to the internal representation. It uses the modules cicParser2 *) (* (objects level) and cicParser3 (terms level) *) (* *) (******************************************************************************) exception Warnings;; class warner = object method warn w = prerr_endline ("WARNING: " ^ w) ; (raise Warnings : unit) end ;; exception EmptyUri of string;; (* given an uri u it returns the list of tokens of the base uri of u *) (* e.g.: token_of_uri "cic:/a/b/c/d.xml" returns ["a" ; "b" ; "c"] *) let tokens_of_uri uri = let uri' = UriManager.string_of_uri uri in let rec chop_list = function [] -> raise (EmptyUri uri') | [fn] -> [] | he::[fn] -> [he] | he::tl -> he::(chop_list tl) in let trimmed_uri = Str.replace_first (Str.regexp "cic:") "" uri' in let list_of_tokens = Str.split (Str.regexp "/") trimmed_uri in chop_list list_of_tokens ;; (* given the filename of an xml file of a cic object it returns its internal *) (* representation. *) let annobj_of_xml filename filenamebody uri = let module Y = Pxp_yacc in try let root, rootbody = (* sets the current base uri to resolve relative URIs *) CicParser3.current_sp := tokens_of_uri uri ; CicParser3.current_uri := uri ; let config = {Y.default_config with Y.warner = new warner} in let doc = Y.parse_document_entity config (Y.from_file ~alt:[PxpUrlResolver.url_resolver] filename) CicParser3.domspec in (* CSC: Until PXP bug is resolved *) PxpUrlResolver.url_resolver#close_all ; let docroot = doc#root in match filenamebody with None -> docroot,None | Some filename -> let docbody = Y.parse_document_entity config (Y.from_file ~alt:[PxpUrlResolver.url_resolver] filename) CicParser3.domspec in (* CSC: Until PXP bug is resolved *) PxpUrlResolver.url_resolver#close_all ; docroot,Some docbody#root in CicParser2.get_term root rootbody with e -> prerr_endline ("Filenames: " ^ filename ^ (match filenamebody with None -> "" | Some s -> ", " ^ s)) ; prerr_endline ("Exception: " ^ Pxp_types.string_of_exn e) ; raise e ;; let obj_of_xml filename filenamebody uri = Deannotate.deannotate_obj (annobj_of_xml filename filenamebody uri) ;;