isabelle: comparison src/HOL/Tools/Sledgehammer/sledgehammer

equal deleted inserted replaced

-:cb564ff43c28
+:4274b25ff4e7
 val mash_unlearn : Proof.context -> unit
 val nickname_of : thm -> string
 val suggested_facts :
 (string * 'a) list -> ('b * thm) list -> (('b * thm) * 'a) list
 val mesh_facts :
-int -> ((('a * thm) * real) list * ('a * thm) list) list -> ('a * thm) list
+int -> (real * ((('a * thm) * real) list * ('a * thm) list)) list
+-> ('a * thm) list
 val theory_ord : theory * theory -> order
 val thm_ord : thm * thm -> order
 val goal_of_thm : theory -> thm -> thm
 val run_prover_for_mash :
 Proof.context -> params -> string -> fact list -> thm -> prover_result
 val atp_dependencies_of :
 Proof.context -> params -> string -> int -> fact list -> unit Symtab.table
 -> thm -> bool * string list option
 val weight_mash_facts : ('a * thm) list -> (('a * thm) * real) list
 val mash_suggested_facts :
-Proof.context -> params -> string -> int -> term list -> term
+Proof.context -> params -> string -> int -> term list -> term -> fact list
--> fact list -> fact list * fact list
+-> fact list
 val mash_learn_proof :
 Proof.context -> params -> string -> term -> ('a * thm) list -> thm list
 -> unit
 val mash_learn :
 Proof.context -> params -> fact_override -> thm list -> bool -> unit
 val empty_state = {fact_G = Graph.empty, dirty = SOME []}
 local
-val version = "*** MaSh version 20121204a ***"
+val version = "*** MaSh version 20121205a ***"
 exception Too_New of unit
 fun extract_node line =
 case space_explode ":" line of
 val tab = Symtab.empty |> fold add_fact facts
 fun find_sugg (name, weight) =
 Symtab.lookup tab name |> Option.map (rpair weight)
 in map_filter find_sugg suggs end
-fun sum_avg [] = 0
+fun scaled_avg [] = 0
-| sum_avg xs =
+| scaled_avg xs =
 Real.ceil (100000000.0 * fold (curry (op +)) xs 0.0) div length xs
-fun normalize_scores [] = []
+fun avg [] = 0.0
-| normalize_scores ((fact, score) :: tail) =
+| avg xs = fold (curry (op +)) xs 0.0 / Real.fromInt (length xs)
-(fact, 1.0) :: map (apsnd (curry Real.* (1.0 / score))) tail
+fun normalize_scores _ [] = []
-fun mesh_facts max_facts [(sels, unks)] =
+| normalize_scores max_facts xs =
+let val avg = avg (map snd (take max_facts xs)) in
+map (apsnd (curry Real.* (1.0 / avg))) xs
+end
+fun mesh_facts max_facts [(_, (sels, unks))] =
 map fst (take max_facts sels) @ take (max_facts - length sels) unks
 | mesh_facts max_facts mess =
 let
-val mess = mess |> map (apfst (normalize_scores #> `length))
+val mess =
+mess |> map (apsnd (apfst (normalize_scores max_facts #> `length)))
 val fact_eq = Thm.eq_thm o pairself snd
-fun score_at sels = try (nth sels) #> Option.map snd
+fun score_in fact (global_weight, ((sel_len, sels), unks)) =
-fun score_in fact ((sel_len, sels), unks) =
+let
-case find_index (curry fact_eq fact o fst) sels of
+fun score_at j =
-~1 => (case find_index (curry fact_eq fact) unks of
+case try (nth sels) j of
-~1 => score_at sels sel_len
+SOME (_, score) => SOME (global_weight * score)
-| _ => NONE)
+| NONE => NONE
-| rank => score_at sels rank
+in
-fun weight_of fact = mess |> map_filter (score_in fact) |> sum_avg
+case find_index (curry fact_eq fact o fst) sels of
+~1 => (case find_index (curry fact_eq fact) unks of
+~1 => score_at sel_len
+| _ => NONE)
+| rank => score_at rank
+end
+fun weight_of fact = mess |> map_filter (score_in fact) |> scaled_avg
 val facts =
-fold (union fact_eq o map fst o take max_facts o snd o fst) mess []
+fold (union fact_eq o map fst o take max_facts o snd o fst o snd) mess
+[]
 in
 facts |> map (`weight_of) |> sort (int_ord o swap o pairself fst)
 |> map snd |> take max_facts
 end
 fun thy_feature_of s = ("y" ^ s, 1.0 (* FUDGE *))
 fun term_feature_of s = ("c" ^ s, 1.0 (* FUDGE *))
 fun type_feature_of s = ("t" ^ s, 1.0 (* FUDGE *))
 fun class_feature_of s = ("s" ^ s, 1.0 (* FUDGE *))
 fun status_feature_of status = (string_of_status status, 1.0 (* FUDGE *))
-val local_feature = ("local", 20.0 (* FUDGE *))
+val local_feature = ("local", 1.0 (* FUDGE *))
 val lams_feature = ("lams", 1.0 (* FUDGE *))
 val skos_feature = ("skos", 1.0 (* FUDGE *))
 fun theory_ord p =
 if Theory.eq_thy p then
 | patternify_term _ 0 _ = []
 | patternify_term args depth (t $ u) =
 let
 val ps = patternify_term (u :: args) depth t
 val qs = "" :: patternify_term [] (depth - 1) u
-in map_product (fn p => fn "" => p | q => "(" ^ q ^ ")") ps qs end
+in map_product (fn p => fn "" => p | q => p ^ "(" ^ q ^ ")") ps qs end
 | patternify_term _ _ _ = []
 val add_term_pattern =
 union (op = o pairself fst) o map term_feature_of oo patternify_term []
 fun add_term_patterns ~1 _ = I
 | add_term_patterns depth t =
 else
 (maxs, Graph.Keys.fold (insert_new seen)
 (Graph.imm_preds fact_G new) news))
 in find_maxes Symtab.empty ([], Graph.maximals fact_G) end
-(* Generate more suggestions than requested, because some might be thrown out
-later for various reasons and "meshing" gives better results with some
-slack. *)
-fun max_suggs_of max_facts = max_facts + Int.min (50, max_facts)
 fun is_fact_in_graph fact_G (_, th) =
 can (Graph.get_node fact_G) (nickname_of th)
-fun interleave 0 _ _ = []
-| interleave n [] ys = take n ys
-| interleave n xs [] = take n xs
-| interleave 1 (x :: _) _ = [x]
-| interleave n (x :: xs) (y :: ys) = x :: y :: interleave (n - 2) xs ys
 (* factor that controls whether unknown global facts should be included *)
 val include_unk_global_factor = 15
-val weight_mash_facts = weight_mepo_facts (* use MePo weights for now *)
+(* use MePo weights for now *)
+val weight_raw_mash_facts = weight_mepo_facts
+val weight_mash_facts = weight_raw_mash_facts
+(* FUDGE *)
+fun weight_of_proximity_fact rank =
+Math.pow (1.3, 15.5 - 0.05 * Real.fromInt rank) + 15.0
+fun weight_proximity_facts facts =
+facts ~~ map weight_of_proximity_fact (0 upto length facts - 1)
 fun mash_suggested_facts ctxt ({overlord, ...} : params) prover max_facts hyp_ts
 concl_t facts =
 let
 val thy = Proof_Context.theory_of ctxt
 let
 val parents = maximal_in_graph fact_G facts
 val feats =
 features_of ctxt prover thy (Local, General) (concl_t :: hyp_ts)
 in
-(fact_G, mash_QUERY ctxt overlord (max_suggs_of max_facts)
+(fact_G, mash_QUERY ctxt overlord max_facts (parents, feats))
-(parents, feats))
 end)
 val (chained, unchained) =
 List.partition (fn ((_, (scope, _)), _) => scope = Chained) facts
-val sels =
+val raw_mash =
 facts |> suggested_facts suggs
 (* The weights currently returned by "mash.py" are too spaced out to
 make any sense. *)
 |> map fst
-|> filter_out (member (Thm.eq_thm_prop o pairself snd) chained)
+val proximity =
-val (unk_global, unk_local) =
+chained @ (facts |> subtract (Thm.eq_thm_prop o pairself snd) chained
-unchained |> filter_out (is_fact_in_graph fact_G)
+|> sort (thm_ord o pairself snd o swap))
-|> List.partition (fn ((_, (scope, _)), _) => scope = Global)
+val unknown = facts |> filter_out (is_fact_in_graph fact_G)
-val (small_unk_global, big_unk_global) =
+val mess =
-([], unk_global)
+[(0.667 (* FUDGE *), (weight_raw_mash_facts raw_mash, unknown)),
-|> include_unk_global_factor * length unk_global <= max_facts ? swap
+(0.333 (* FUDGE *), (weight_proximity_facts proximity, []))]
-in
+in mesh_facts max_facts mess end
-(interleave max_facts (chained @ unk_local @ small_unk_global) sels,
-big_unk_global)
-end
 fun add_wrt_fact_graph ctxt (name, parents, feats, deps) (adds, graph) =
 let
 fun maybe_add_from from (accum as (parents, graph)) =
 try_graph ctxt "updating graph" accum (fn () =>
 end
 fun is_mash_enabled () = (getenv "MASH" = "yes")
 fun mash_can_suggest_facts ctxt = not (Graph.is_empty (#fact_G (mash_get ctxt)))
+(* Generate more suggestions than requested, because some might be thrown out
+later for various reasons. *)
+fun generous_max_facts max_facts = max_facts + Int.min (50, max_facts)
 (* The threshold should be large enough so that MaSh doesn't kick in for Auto
 Sledgehammer and Try. *)
 val min_secs_for_learning = 15
 fun relevant_facts ctxt (params as {learn, fact_filter, timeout, ...}) prover
 fun mepo () =
 mepo_suggested_facts ctxt params prover max_facts NONE hyp_ts concl_t
 facts
 |> weight_mepo_facts
 fun mash () =
-mash_suggested_facts ctxt params prover max_facts hyp_ts concl_t facts
+mash_suggested_facts ctxt params prover (generous_max_facts max_facts)
-|>> weight_mash_facts
+hyp_ts concl_t facts
+|> weight_mash_facts
 val mess =
-[] |> (if fact_filter <> mashN then cons (mepo (), []) else I)
+[] |> (if fact_filter <> mashN then cons (0.5, (mepo (), [])) else I)
-|> (if fact_filter <> mepoN then cons (mash ()) else I)
+|> (if fact_filter <> mepoN then cons (0.5, (mash (), [])) else I)
 in
 mesh_facts max_facts mess
 |> not (null add_ths) ? prepend_facts add_ths
 end

changeset 50383	4274b25ff4e7
parent 50382	cb564ff43c28
child 50389	ad0ac9112d2c