(Lazy.force Http_getter_env.rdf_dir) escaped_prefix baseuri extension
in
let patch_fun =
- if patch then Http_getter_common.patch_xml ~via_http () else (fun x -> x)
+ if patch then
+ Http_getter_common.patch_xml ~xmlbases:(uri, url) ~via_http ()
+ else
+ (fun x -> x)
in
let basename = Pcre.replace ~pat:"\\.gz$" downloadname in
let contype = "text/xml" in
let patch_entity = patch_system "ENTITY"
let patch_doctype = patch_system "DOCTYPE"
+(* [patch_xmlbase xmlbases baseurl baseuri s] adds the attributes
+   [xml:base="baseurl"] and [helm:base="baseuri"] to the opening tag that
+   starts line [s] (leading whitespace allowed) and returns the patched line.
+   Lines that do not start with an opening tag are returned unchanged.
+
+   [xmlbases] is the caller's "patch still pending" cell: it is reset to
+   [None] as soon as a line has actually been modified, so that the
+   attributes are inserted only once. *)
+let patch_xmlbase =
+  (* The tag name ends at whitespace, '/' or '>', and the delimiter may be
+     "/>" as well as ">".  This keeps the new attributes inside the opening
+     tag for lines such as "<a>some text" and "<a/>", where a name pattern
+     that only stops at a space would overrun the end of the tag. *)
+  let rex = Pcre.regexp "^(\\s*<\\w[^\\s/>]*)(\\s|/?>)" in
+  fun xmlbases baseurl baseuri s ->
+    let s' =
+      Pcre.replace ~rex
+        ~templ:(sprintf "$1 xml:base=\"%s\" helm:base=\"%s\"$2" baseurl baseuri)
+        s
+    in
+    (* A changed line means the opening tag was found and patched. *)
+    if s <> s' then xmlbases := None;
+    s'
+
let patch_dtd = patch_entity
-let patch_xml ?via_http () line =
- patch_doctype ?via_http () (patch_entity ?via_http () line)
+(* [patch_xml ?via_http ?xmlbases ()] builds a line-patching function.
+   Every line goes through the ENTITY and DOCTYPE patchers.  While a
+   [(uri, url)] pair is still pending in the internal cell, the result is
+   also handed to [patch_xmlbase], which clears the cell once it has
+   modified a line. *)
+let patch_xml ?via_http ?xmlbases () =
+  let pending = ref xmlbases in
+  fun line ->
+    let patched = patch_doctype ?via_http () (patch_entity ?via_http () line) in
+    match !pending with
+    | Some (base_uri, base_url) ->
+      patch_xmlbase pending base_url base_uri patched
+    | None -> patched
let return_file
~fname ?contype ?contenc
val uri_of_string: string -> uri
-val patch_xml : ?via_http:bool -> unit -> string -> string
+ (** [patch_xml ?via_http ?xmlbases ()] returns a function that patches one
+     line of XML at a time: each line is run through the ENTITY and DOCTYPE
+     patchers.  The returned function keeps internal state when [xmlbases]
+     is given, so build a fresh one for each document.
+     @param xmlbases (xml base URI * xml base URL).  When given, the first
+     line recognised as starting with an opening tag additionally receives
+     the attributes [xml:base] (set to the URL) and [helm:base] (set to the
+     URI); later lines are not given these attributes. *)
+val patch_xml :
+ ?via_http:bool -> ?xmlbases:(string * string) -> unit -> string -> string
val patch_dtd : ?via_http:bool -> unit -> string -> string
(* TODO via_http not yet supported for patch_xsl *)
val patch_xsl : ?via_http:bool -> unit -> string -> string