X-Git-Url: http://matita.cs.unibo.it/gitweb/?a=blobdiff_plain;f=helm%2Focaml%2Fmetadata%2FmetadataConstraints.ml;h=15177ddb1331d04b118eea1838e8a9dd2cbc9c45;hb=aca103d3c3d740efcc0bcc2932922cff77facb49;hp=fb782494a6a0c99318a9850a991260b6040f9be1;hpb=9ab46e3c1b1766cce0299604cd07db6356c8b9a9;p=helm.git diff --git a/helm/ocaml/metadata/metadataConstraints.ml b/helm/ocaml/metadata/metadataConstraints.ml index fb782494a..15177ddb1 100644 --- a/helm/ocaml/metadata/metadataConstraints.ml +++ b/helm/ocaml/metadata/metadataConstraints.ml @@ -24,9 +24,10 @@ *) open Printf +open MetadataTypes -let critical_value = 6 -let just_factor = 3 +let critical_value = 7 +let just_factor = 4 module StringSet = Set.Make (String) module SetSet = Set.Make (StringSet) @@ -36,6 +37,17 @@ type term_signature = (string * string list) option * StringSet.t type cardinality_condition = | Eq of int | Gt of int + | Lt of int + +type rating_criterion = + [ `Hits (** order by number of hits, most used objects first *) + ] + +let default_tables = + (library_obj_tbl,library_rel_tbl,library_sort_tbl,library_count_tbl) + +let current_tables () = + (obj_tbl (),rel_tbl (),sort_tbl (), count_tbl ()) let tbln n = "table" ^ string_of_int n @@ -59,88 +71,133 @@ let mk_positions positions cur_tbl = | `MainConclusion None | `MainHypothesis None -> sprintf "%s.h_position = \"%s\"" cur_tbl pos_str - | `MainConclusion (Some d) - | `MainHypothesis (Some d) -> - sprintf "(%s.h_position = \"%s\" and %s.h_depth = %d)" - cur_tbl pos_str cur_tbl d) + | `MainConclusion (Some r) + | `MainHypothesis (Some r) -> + let depth = MetadataPp.pp_relation r in + sprintf "(%s.h_position = \"%s\" and %s.h_depth %s)" + cur_tbl pos_str cur_tbl depth) (positions :> MetadataTypes.position list)) ^ ")" -let add_card_constr tbl (n,from,where) = function - | None -> (n,from,where) - | Some (Eq card) -> - let cur_tbl = tbln n in - (n+1, - (sprintf "%s as %s" tbl cur_tbl :: from), - (sprintf "%s.no=%d" cur_tbl card :: - (if n=0 then [] - else [sprintf "table0.source = %s.source" cur_tbl]) @ - where)) - | Some (Gt card) -> +let explode_card_constr = function + | Eq card -> "=", card + | Gt card -> ">", card + | Lt card -> "<", card + +let add_card_constr tbl col where = function + | None -> where + | Some constr -> + let op, card = explode_card_constr constr in + (* count(_utente).hypothesis = 3 *) + (sprintf "%s.%s %s %d" tbl col op card :: where) + +let add_diff_constr tbl where = function + | None -> where + | Some constr -> + let op, card = explode_card_constr constr in + (sprintf "%s.hypothesis - %s.conclusion %s %d" tbl tbl op card :: where) + +let add_all_constr ?(tbl=library_count_tbl) (n,from,where) concl full diff = + match (concl, full, diff) with + | None, None, None -> (n,from,where) + | _ -> let cur_tbl = tbln n in - (n+1, - (sprintf "%s as %s" tbl cur_tbl :: from), - (sprintf "%s.no>%d" cur_tbl card :: - (if n=0 then [] - else [sprintf "table0.source = %s.source" cur_tbl]) @ - where)) - -let at_least ~(dbh:Dbi.connection) ?concl_card ?full_card + let from = (sprintf "%s as %s" tbl cur_tbl) :: from in + let where = add_card_constr cur_tbl "conclusion" where concl in + let where = add_card_constr cur_tbl "statement" where full in + let where = add_diff_constr cur_tbl where diff in + (n+2,from, + (if n > 0 then + sprintf "table0.source = %s.source" cur_tbl :: where + else + where)) + + +let add_constraint ?(start=0) ?(tables=default_tables) (n,from,where) metadata = + let obj_tbl,rel_tbl,sort_tbl,count_tbl = tables + in + let cur_tbl = tbln n in + let start_table = tbln start in + match metadata with + | `Obj (uri, positions) -> + let from = (sprintf "%s as %s" obj_tbl cur_tbl) :: from in + let where = + (sprintf "(%s.h_occurrence = \"%s\")" cur_tbl uri) :: + mk_positions positions cur_tbl :: + (if n=start then [] + else [sprintf "%s.source = %s.source" start_table cur_tbl]) @ + where + in + ((n+2), from, where) + | `Rel positions -> + let from = (sprintf "%s as %s" rel_tbl cur_tbl) :: from in + let where = + mk_positions positions cur_tbl :: + (if n=start then [] + else [sprintf "%s.source = %s.source" start_table cur_tbl]) @ + where + in + ((n+2), from, where) + | `Sort (sort, positions) -> + let sort_str = CicPp.ppsort sort in + let from = (sprintf "%s as %s" sort_tbl cur_tbl) :: from in + let where = + (sprintf "%s.h_sort = \"%s\"" cur_tbl sort_str ) :: + mk_positions positions cur_tbl :: + (if n=start then + [] + else + [sprintf "%s.source = %s.source" start_table cur_tbl ]) @ where + in + ((n+2), from, where) + +let exec ~(dbd:Mysql.dbd) ?rating (n,from,where) = + let from = String.concat ", " from in + let where = String.concat " and " where in + let query = + match rating with + | None -> sprintf "select table0.source from %s where %s" from where + | Some `Hits -> + sprintf + ("select table0.source from %s, hits where %s + and table0.source = hits.source order by hits.no desc") + from where + in +(* prerr_endline query; *) + let result = Mysql.exec dbd query in + Mysql.map result + (fun row -> match row.(0) with Some s -> s | _ -> assert false) + + +let at_least ~(dbd:Mysql.dbd) ?concl_card ?full_card ?diff ?rating tables (metadata: MetadataTypes.constr list) = + let obj_tbl,rel_tbl,sort_tbl, count_tbl = tables + in if (metadata = []) && concl_card = None && full_card = None then failwith "MetadataQuery.at_least: no constraints given"; - let add_constraint (n,from,where) metadata = - let cur_tbl = tbln n in - match metadata with - | `Obj (uri, positions) -> - let tbl = MetadataTypes.obj_tbl in - let from = (sprintf "%s as %s" tbl cur_tbl) :: from in - let where = - (sprintf "%s.h_occurrence = \"%s\"" cur_tbl uri) :: - mk_positions positions cur_tbl :: - (if n=0 then [] - else [sprintf "table0.source = %s.source" cur_tbl]) @ - where - in - ((n+1), from, where) - | `Rel positions -> - let tbl = MetadataTypes.rel_tbl in - let from = (sprintf "%s as %s" tbl cur_tbl) :: from in - let where = - mk_positions positions cur_tbl :: - (if n=0 then [] - else [sprintf "table0.source = %s.source" cur_tbl]) @ - where - in - ((n+1), from, where) - | `Sort (sort, positions) -> - let tbl = MetadataTypes.sort_tbl in - let sort_str = MetadataPp.pp_sort sort in - let from = (sprintf "%s as %s" tbl cur_tbl) :: from in - let where = - (sprintf "%s.h_sort = \"%s\"" cur_tbl sort_str) :: - mk_positions positions cur_tbl :: - (if n=0 then [] - else [sprintf "table0.source = %s.source" cur_tbl]) @ - where - in - ((n+1), from, where) - in - let (n,from,where) = List.fold_left add_constraint (0,[],[]) metadata in let (n,from,where) = - add_card_constr MetadataTypes.conclno_tbl (n,from,where) concl_card + List.fold_left (add_constraint ~tables) (0,[],[]) metadata in let (n,from,where) = - add_card_constr MetadataTypes.conclno_hyp_tbl (n,from,where) full_card + add_all_constr ~tbl:count_tbl (n,from,where) concl_card full_card diff in - let from = String.concat ", " from in - let where = String.concat " and " where in - let query = sprintf "select table0.source from %s where %s" from where in - let query = dbh#prepare query in - query#execute []; - List.map (function [`String s] -> s | _ -> assert false) (query#fetchall ()) - + exec ~dbd ?rating (n,from,where) + +let at_least + ~(dbd:Mysql.dbd) ?concl_card ?full_card ?diff ?rating + (metadata: MetadataTypes.constr list) += + if are_tables_ownerized () then + (at_least + ~dbd ?concl_card ?full_card ?diff ?rating default_tables metadata) @ + (at_least + ~dbd ?concl_card ?full_card ?diff ?rating (current_tables ()) metadata) + else + at_least + ~dbd ?concl_card ?full_card ?diff ?rating default_tables metadata + + (** Prefix handling *) let filter_by_card n = @@ -374,61 +431,74 @@ let must_of_prefix ?(where = `Conclusion) m s = let escape = Str.global_replace (Str.regexp_string "\'") "\\'" -let get_constants (dbh:Dbi.connection) ~where uri = +let get_constants (dbd:Mysql.dbd) ~where uri = let uri = escape uri in let positions = match where with - | `Conclusion -> ["\"MainConclusion\""; "\"InConclusion\""] + | `Conclusion -> [ MetadataTypes.mainconcl_pos; MetadataTypes.inconcl_pos ] | `Statement -> - ["\"MainConclusion\""; "\"InConclusion\""; "\"InHypothesis\""; - "\"MainHypothesis\""] + [ MetadataTypes.mainconcl_pos; MetadataTypes.inconcl_pos; + MetadataTypes.inhyp_pos; MetadataTypes.mainhyp_pos ] in let query = - dbh#prepare - (sprintf "select h_occurrence from refObj where source=\"%s\" and (%s)" - uri (String.concat " or " positions)) + let pos_predicate = + String.concat " OR " + (List.map (fun pos -> sprintf "(h_position = \"%s\")" pos) positions) + in + sprintf ("SELECT h_occurrence FROM %s WHERE source=\"%s\" AND (%s) UNION "^^ + "SELECT h_occurrence FROM %s WHERE source=\"%s\" AND (%s)") + (MetadataTypes.obj_tbl ()) uri pos_predicate + MetadataTypes.library_obj_tbl uri pos_predicate + in - query#execute []; - query#fold_left (* transform the result in a set *) - (fun set fields -> - let uri = match fields with [`String uri] -> uri | _ -> assert false in - StringSet.add uri set) - StringSet.empty - -let at_most ~(dbh:Dbi.connection) ?(where = `Conclusion) only u = - let inconcl = get_constants dbh ~where u in + let result = Mysql.exec dbd query in + let set = ref StringSet.empty in + Mysql.iter result + (fun col -> + match col.(0) with + | Some uri -> set := StringSet.add uri !set + | _ -> assert false); + !set + +let at_most ~(dbd:Mysql.dbd) ?(where = `Conclusion) only u = + let inconcl = get_constants dbd ~where u in StringSet.subset inconcl only (* Special handling of equality. The problem is filtering out theorems just * containing variables (e.g. all the theorems in cic:/Coq/Ring/). Really * ad-hoc, no better solution found at the moment *) +let myspeciallist_of_facts = + [0,"cic:/Coq/Init/Logic/eq.ind#xpointer(1/1/1)"] let myspeciallist = [0,"cic:/Coq/Init/Logic/eq.ind#xpointer(1/1/1)"; - 0,"cic:/Coq/Init/Logic/sym_eq.con"; + (* 0,"cic:/Coq/Init/Logic/sym_eq.con"; *) 0,"cic:/Coq/Init/Logic/trans_eq.con"; 0,"cic:/Coq/Init/Logic/f_equal.con"; 0,"cic:/Coq/Init/Logic/f_equal2.con"; 0,"cic:/Coq/Init/Logic/f_equal3.con"] -let compute_exactly ~(dbh:Dbi.connection) where main prefixes = + +let compute_exactly ~(dbd:Mysql.dbd) ?(facts=false) ~where main prefixes = List.concat (List.map (fun (m,s) -> - if (m = 0) then - myspeciallist + if ((m = 0) && (main = HelmLibraryObjects.Logic.eq_XURI)) then + (if facts then myspeciallist_of_facts + else myspeciallist) else let res = let must = must_of_prefix ~where main s in match where with - | `Conclusion -> at_least ~dbh ~concl_card:(Eq (m+1)) must - | `Statement -> at_least ~dbh ~full_card:(Eq (m+1)) must + | `Conclusion -> at_least ~dbd ~concl_card:(Eq (m+1)) must + | `Statement -> at_least ~dbd ~full_card:(Eq (m+1)) must in List.map (fun uri -> (m, uri)) res) prefixes) (* critical value reached, fallback to "only" constraints *) -let compute_with_only ~(dbh:Dbi.connection) ?(where = `Conclusion) main - prefixes constants + +let compute_with_only ~(dbd:Mysql.dbd) ?(facts=false) ?(where = `Conclusion) + main prefixes constants = let max_prefix_length = match prefixes with @@ -448,26 +518,27 @@ let compute_with_only ~(dbh:Dbi.connection) ?(where = `Conclusion) main let must = must_of_prefix ~where main s in (let res = match where with - | `Conclusion -> at_least ~dbh ~concl_card:(Gt (m+1)) must - | `Statement -> at_least ~dbh ~full_card:(Gt (m+1)) must + | `Conclusion -> at_least ~dbd ~concl_card:(Gt (m+1)) must + | `Statement -> at_least ~dbd ~full_card:(Gt (m+1)) must in (* we tag the uri with m+1, for sorting purposes *) List.map (fun uri -> (m+1, uri)) res)) maximal_prefixes) in - List.filter (function (_,uri) -> at_most ~dbh ~where constants uri) all in - let equal_to = compute_exactly ~dbh where main prefixes in + List.filter (function (_,uri) -> at_most ~dbd ~where constants uri) all in + let equal_to = compute_exactly ~dbd ~facts ~where main prefixes in greater_than @ equal_to (* real match query implementation *) -let cmatch ~(dbh:Dbi.connection) t = + +let cmatch ~(dbd:Mysql.dbd) ?(facts=false) t = let (main, constants) = signature_of t in match main with | None -> [] | Some (main, types) -> (* the type of eq is not counted in constants_no *) let types_no = List.length types in - let constants_no = StringSet.cardinal constants + types_no in + let constants_no = StringSet.cardinal constants in if (constants_no > critical_value) then let prefixes = prefixes just_factor t in (match prefixes with @@ -475,26 +546,31 @@ let cmatch ~(dbh:Dbi.connection) t = let all_constants = List.fold_right StringSet.add types (StringSet.add main constants) in - compute_with_only ~dbh main all_concl all_constants + compute_with_only ~dbd ~facts main all_concl all_constants | _, _ -> []) else (* in this case we compute all prefixes, and we do not need to apply the only constraints *) let prefixes = - if constants_no = types_no then - Some main, [0, []; types_no, types] + if constants_no = 0 then + (if types_no = 0 then + Some main, [0, []] + else + Some main, [0, []; types_no, types]) else - prefixes constants_no t + prefixes (constants_no+types_no+1) t in (match prefixes with Some main, all_concl -> + compute_exactly ~dbd ~facts ~where:`Conclusion main all_concl +(* List.concat (List.map (fun (m,s) -> let must = must_of_prefix ~where:`Conclusion main s in - let res = at_least ~dbh ~concl_card:(Eq (m+1)) must in + let res = at_least ~dbd ~concl_card:(Eq (m+1)) must in List.map (fun uri -> (m, uri)) res) - all_concl) + all_concl) *) | _, _ -> []) let power_upto upto consts = @@ -515,7 +591,8 @@ let power consts = type where = [ `Conclusion | `Statement ] -let sigmatch ~(dbh:Dbi.connection) ?(where = `Conclusion) (main, constants) = +let sigmatch ~(dbd:Mysql.dbd) + ?(facts=false) ?(where = `Conclusion) (main, constants) = match main with None -> [] | Some (main, types) -> @@ -529,22 +606,26 @@ let sigmatch ~(dbh:Dbi.connection) ?(where = `Conclusion) (main, constants) = let all_constants = List.fold_right StringSet.add types (StringSet.add main constants) in - compute_with_only ~dbh ~where main subsets all_constants + compute_with_only ~dbd ~where main subsets all_constants else let subsets = let subsets = power constants in let types_no = List.length types in + if types_no > 0 then (0,[]) :: List.map (function (n,l) -> (n+types_no,types@l)) subsets + else subsets in - compute_exactly ~dbh where main subsets + compute_exactly ~dbd ~facts ~where main subsets (* match query wrappers *) -let cmatch' = cmatch -let cmatch ~dbh term = + +let cmatch'= cmatch + +let cmatch ~dbd ?(facts=false) term = List.map snd (List.sort (fun x y -> Pervasives.compare (fst y) (fst x)) - (cmatch' ~dbh term)) + (cmatch' ~dbd ~facts term)) let constants_of = signature_concl