src/HOL/Tools/ATP/atp_systems.ML
author blanchet
Tue Jun 26 11:14:39 2012 +0200 (2012-06-26)
changeset 48130 defbcdc60fd6
parent 48129 933d43c31689
child 48131 1016664b8feb
permissions -rw-r--r--
tuning
blanchet@38047
     1
(*  Title:      HOL/Tools/ATP/atp_systems.ML
wenzelm@28592
     2
    Author:     Fabian Immler, TU Muenchen
blanchet@36371
     3
    Author:     Jasmin Blanchette, TU Muenchen
wenzelm@28592
     4
blanchet@36376
     5
Setup for supported ATPs.
wenzelm@28592
     6
*)
wenzelm@28592
     7
blanchet@36376
     8
signature ATP_SYSTEMS =
wenzelm@28592
     9
sig
blanchet@47038
    10
  type term_order = ATP_Problem.term_order
blanchet@45301
    11
  type atp_format = ATP_Problem.atp_format
blanchet@47976
    12
  type formula_role = ATP_Problem.formula_role
blanchet@39491
    13
  type failure = ATP_Proof.failure
blanchet@38023
    14
blanchet@46409
    15
  type slice_spec = int * atp_format * string * string * bool
blanchet@40059
    16
  type atp_config =
blanchet@47055
    17
    {exec : string list * string,
blanchet@47055
    18
     required_vars : string list list,
blanchet@42646
    19
     arguments :
blanchet@43473
    20
       Proof.context -> bool -> string -> Time.time
blanchet@47038
    21
       -> term_order * (unit -> (string * int) list)
blanchet@47038
    22
          * (unit -> (string * real) list) -> string,
blanchet@42578
    23
     proof_delims : (string * string) list,
blanchet@42578
    24
     known_failures : (failure * string) list,
blanchet@47976
    25
     prem_role : formula_role,
blanchet@43473
    26
     best_slices :
blanchet@47962
    27
       Proof.context -> (real * (bool * (slice_spec * string))) list,
blanchet@47962
    28
     best_max_mono_iters : int,
blanchet@47962
    29
     best_max_new_mono_instances : int}
blanchet@38023
    30
blanchet@47962
    31
  val default_max_mono_iters : int
blanchet@47962
    32
  val default_max_new_mono_instances : int
blanchet@44099
    33
  val force_sos : bool Config.T
blanchet@47032
    34
  val term_order : string Config.T
blanchet@43566
    35
  val e_smartN : string
blanchet@43566
    36
  val e_autoN : string
blanchet@43566
    37
  val e_fun_weightN : string
blanchet@43566
    38
  val e_sym_offset_weightN : string
blanchet@47032
    39
  val e_selection_heuristic : string Config.T
blanchet@42646
    40
  val e_default_fun_weight : real Config.T
blanchet@42646
    41
  val e_fun_weight_base : real Config.T
blanchet@42646
    42
  val e_fun_weight_span : real Config.T
blanchet@42646
    43
  val e_default_sym_offs_weight : real Config.T
blanchet@42646
    44
  val e_sym_offs_weight_base : real Config.T
blanchet@42646
    45
  val e_sym_offs_weight_span : real Config.T
blanchet@46643
    46
  val alt_ergoN : string
blanchet@46643
    47
  val dummy_thfN : string
blanchet@40059
    48
  val eN : string
blanchet@44590
    49
  val e_sineN : string
blanchet@44590
    50
  val e_tofofN : string
blanchet@45338
    51
  val iproverN : string
blanchet@45338
    52
  val iprover_eqN : string
blanchet@44590
    53
  val leo2N : string
blanchet@44590
    54
  val satallaxN : string
blanchet@44590
    55
  val snarkN : string
blanchet@40059
    56
  val spassN : string
blanchet@40059
    57
  val vampireN : string
blanchet@42938
    58
  val waldmeisterN : string
blanchet@44423
    59
  val z3_tptpN : string
blanchet@40060
    60
  val remote_prefix : string
blanchet@41738
    61
  val remote_atp :
blanchet@41738
    62
    string -> string -> string list -> (string * string) list
blanchet@47976
    63
    -> (failure * string) list -> formula_role
blanchet@47606
    64
    -> (Proof.context -> slice_spec * string) -> string * (unit -> atp_config)
blanchet@47606
    65
  val add_atp : string * (unit -> atp_config) -> theory -> theory
blanchet@47606
    66
  val get_atp : theory -> string -> (unit -> atp_config)
blanchet@41727
    67
  val supported_atps : theory -> string list
blanchet@40059
    68
  val is_atp_installed : theory -> string -> bool
blanchet@35867
    69
  val refresh_systems_on_tptp : unit -> unit
blanchet@47055
    70
  val effective_term_order : Proof.context -> string -> term_order
blanchet@35867
    71
  val setup : theory -> theory
wenzelm@28592
    72
end;
wenzelm@28592
    73
blanchet@36376
    74
structure ATP_Systems : ATP_SYSTEMS =
wenzelm@28592
    75
struct
wenzelm@28596
    76
blanchet@42577
    77
open ATP_Problem
blanchet@39491
    78
open ATP_Proof
blanchet@46320
    79
open ATP_Problem_Generate
boehmes@32864
    80
blanchet@40059
    81
(* ATP configuration *)
boehmes@32864
    82
blanchet@47962
    83
val default_max_mono_iters = 3 (* FUDGE *)
blanchet@47962
    84
val default_max_new_mono_instances = 200 (* FUDGE *)
blanchet@47962
    85
blanchet@46409
    86
(* Problem-generation settings of one slice, in order: preferred number of
   facts, ATP input format, preferred type system (encoding), preferred lambda
   translation scheme, and whether uncurried aliases should be generated. *)
type slice_spec = int * atp_format * string * string * bool
blanchet@46409
    87
blanchet@40059
    88
type atp_config =
blanchet@47055
    89
  {exec : string list * string,
blanchet@47055
    90
   required_vars : string list list,
blanchet@42646
    91
   arguments :
blanchet@43473
    92
     Proof.context -> bool -> string -> Time.time
blanchet@47038
    93
     -> term_order * (unit -> (string * int) list)
blanchet@47038
    94
        * (unit -> (string * real) list) -> string,
blanchet@42578
    95
   proof_delims : (string * string) list,
blanchet@42578
    96
   known_failures : (failure * string) list,
blanchet@47976
    97
   prem_role : formula_role,
blanchet@47962
    98
   best_slices : Proof.context -> (real * (bool * (slice_spec * string))) list,
blanchet@47962
    99
   best_max_mono_iters : int,
blanchet@47962
   100
   best_max_new_mono_instances : int}
wenzelm@28596
   101
blanchet@42723
   102
(* "best_slices" must be found empirically, taking a holistic approach since
blanchet@46407
   103
   the ATPs are run in parallel. The "real" component gives the fraction of the
blanchet@46409
   104
   time available given to the slice and should add up to 1.0. The first "bool"
blanchet@42723
   105
   component indicates whether the slice's strategy is complete; the "int", the
blanchet@43569
   106
   preferred number of facts to pass; the first "string", the preferred type
blanchet@45521
   107
   system (which should be sound or quasi-sound); the second "string", the
blanchet@46409
   108
   preferred lambda translation scheme; the second "bool", whether uncurried
blanchet@46409
   109
   aliases should be generated; the third "string", extra information to
blanchet@45521
   110
   the prover (e.g., SOS or no SOS).
blanchet@42723
   111
blanchet@42723
   112
   The last slice should be the most "normal" one, because it will get all the
blanchet@43569
   113
   time available if the other slices fail early and also because it is used if
blanchet@43569
   114
   slicing is disabled (e.g., by the minimizer). *)
blanchet@42710
   115
blanchet@38061
   116
(* (failure, marker text) pairs for problems with Perl itself, its HTTP
   library, or the HTTP connection. Used to interpret the output of the
   "remote_atp" script in "get_systems" and appended to SPASS's known
   failures. *)
val known_perl_failures =
blanchet@38094
   117
  [(CantConnect, "HTTP error"),
blanchet@38094
   118
   (NoPerl, "env: perl"),
blanchet@38065
   119
   (NoLibwwwPerl, "Can't locate HTTP")]
wenzelm@28596
   120
blanchet@45203
   121
(* Table of (failure, marker) pairs for the SZS status words. Each status word
   is passed through "wrap" to obtain the marker text (e.g., to put a fixed
   prefix in front of it). *)
fun known_szs_failures wrap =
  map (fn (failure, status) => (failure, wrap status))
    [(Unprovable, "CounterSatisfiable"),
     (Unprovable, "Satisfiable"),
     (GaveUp, "GaveUp"),
     (GaveUp, "Unknown"),
     (GaveUp, "Incomplete"),
     (ProofMissing, "Theorem"),
     (ProofMissing, "Unsatisfiable"),
     (TimedOut, "Timeout"),
     (Inappropriate, "Inappropriate"),
     (OutOfResources, "ResourceOut"),
     (OutOfResources, "MemoryOut"),
     (Interrupted, "Forced"),
     (Interrupted, "User")]
blanchet@45203
   135
blanchet@45203
   136
val known_szs_status_failures = known_szs_failures (prefix "SZS status ")
blanchet@45203
   137
val known_says_failures = known_szs_failures (prefix " says ")
blanchet@45203
   138
blanchet@40059
   139
(* named ATPs *)
blanchet@40059
   140
blanchet@46643
   141
val alt_ergoN = "alt_ergo"
blanchet@47055
   142
val dummy_thfN = "dummy_thf" (* for experiments *)
blanchet@40059
   143
val eN = "e"
blanchet@44590
   144
val e_sineN = "e_sine"
blanchet@44590
   145
val e_tofofN = "e_tofof"
blanchet@45338
   146
val iproverN = "iprover"
blanchet@45338
   147
val iprover_eqN = "iprover_eq"
blanchet@44099
   148
val leo2N = "leo2"
blanchet@44099
   149
val satallaxN = "satallax"
blanchet@44590
   150
val snarkN = "snark"
blanchet@40059
   151
val spassN = "spass"
blanchet@40059
   152
val vampireN = "vampire"
blanchet@44590
   153
val waldmeisterN = "waldmeister"
blanchet@44423
   154
val z3_tptpN = "z3_tptp"
blanchet@40060
   155
val remote_prefix = "remote_"
blanchet@38001
   156
blanchet@38023
   157
(* Theory data: table from ATP name to a (configuration thunk, stamp) pair.
   When two theories are merged, entries are compared by their stamp only
   (via "eq_snd"); a "Symtab.DUP" raised by the merge is reported as a
   "Duplicate ATP" error. *)
structure Data = Theory_Data
(
  type T = ((unit -> atp_config) * stamp) Symtab.table
  val empty = Symtab.empty
  fun extend tab = tab
  fun merge (tab1, tab2) : T =
    Symtab.merge (eq_snd (op =)) (tab1, tab2)
    handle Symtab.DUP name => error ("Duplicate ATP: " ^ quote name ^ ".")
)
blanchet@38017
   166
blanchet@43981
   167
(* Converts "time" to whole seconds, rounding any started second up, and
   returns at least "lower_bound". *)
fun to_secs lower_bound time =
  let
    val millis = Time.toMilliseconds time
    val rounded_up_secs = (millis + 999) div 1000
  in Int.max (lower_bound, rounded_up_secs) end
blanchet@36142
   168
blanchet@43473
   169
val sosN = "sos"
blanchet@43473
   170
val no_sosN = "no_sos"
blanchet@43473
   171
blanchet@44099
   172
val force_sos = Attrib.setup_config_bool @{binding atp_force_sos} (K false)
blanchet@44099
   173
blanchet@47032
   174
val smartN = "smart"
blanchet@47073
   175
(* val kboN = "kbo" *)
blanchet@47032
   176
val lpoN = "lpo"
blanchet@47034
   177
val xweightsN = "_weights"
blanchet@47034
   178
val xprecN = "_prec"
blanchet@47034
   179
val xsimpN = "_simp" (* SPASS-specific *)
blanchet@47032
   180
blanchet@47038
   181
(* Possible values for "atp_term_order":
blanchet@47049
   182
   "smart", "(kbo|lpo)(_weights)?(_prec|_simp)?" *)
blanchet@47032
   183
val term_order =
blanchet@47032
   184
  Attrib.setup_config_string @{binding atp_term_order} (K smartN)
blanchet@47032
   185
blanchet@46643
   186
(* Alt-Ergo *)
blanchet@46643
   187
blanchet@48130
   188
val alt_ergo_tff1 = TFF (Polymorphic, TPTP_Explicit)
blanchet@46643
   189
blanchet@46643
   190
(* Alt-Ergo, invoked through the "why3" executable (looked up via WHY3_HOME)
   with "--format tff1 --prover alt-ergo". No proof delimiters are configured;
   the output marker ": Valid" is classified as ProofMissing. A single slice
   with 100 facts is used. *)
val alt_ergo_config : atp_config =
blanchet@47055
   191
  {exec = (["WHY3_HOME"], "why3"),
blanchet@47055
   192
   required_vars = [],
blanchet@46643
   193
   arguments =
blanchet@46643
   194
     fn _ => fn _ => fn _ => fn timeout => fn _ =>
blanchet@46643
   195
        "--format tff1 --prover alt-ergo --timelimit " ^
blanchet@46643
   196
        string_of_int (to_secs 1 timeout),
blanchet@46643
   197
   proof_delims = [],
blanchet@46643
   198
   known_failures =
blanchet@46643
   199
     [(ProofMissing, ": Valid"),
blanchet@46643
   200
      (TimedOut, ": Timeout"),
blanchet@46643
   201
      (GaveUp, ": Unknown")],
blanchet@47976
   202
   prem_role = Hypothesis,
blanchet@46643
   203
   best_slices = fn _ =>
blanchet@46643
   204
     (* FUDGE *)
blanchet@47962
   205
     [(1.0, (false, ((100, alt_ergo_tff1, "poly_native", liftingN, false), "")))],
blanchet@47962
   206
   best_max_mono_iters = default_max_mono_iters,
blanchet@47962
   207
   best_max_new_mono_instances = default_max_new_mono_instances}
blanchet@46643
   208
blanchet@47646
   209
val alt_ergo = (alt_ergoN, fn () => alt_ergo_config)
blanchet@46643
   210
blanchet@46643
   211
blanchet@40059
   212
(* E *)
wenzelm@28596
   213
blanchet@47055
   214
(* True iff the E_VERSION setting sorts strictly after "1.2".
   NOTE(review): this is a plain string comparison via "string_ord", not a
   numeric version comparison, so a version such as "1.10" would presumably
   sort before "1.2" -- confirm before relying on it for two-digit minors. *)
fun is_new_e_version () =
  (case string_ord (getenv "E_VERSION", "1.2") of
    GREATER => true
  | _ => false)
blanchet@44420
   215
blanchet@36369
   216
val tstp_proof_delims =
blanchet@42962
   217
  [("# SZS output start CNFRefutation.", "# SZS output end CNFRefutation"),
blanchet@42962
   218
   ("% SZS output start CNFRefutation", "% SZS output end CNFRefutation")]
blanchet@36369
   219
blanchet@43473
   220
val e_smartN = "smart"
blanchet@42646
   221
val e_autoN = "auto"
blanchet@42646
   222
val e_fun_weightN = "fun_weight"
blanchet@42646
   223
val e_sym_offset_weightN = "sym_offset_weight"
blanchet@41725
   224
blanchet@47032
   225
val e_selection_heuristic =
blanchet@47032
   226
  Attrib.setup_config_string @{binding atp_e_selection_heuristic} (K e_smartN)
blanchet@41770
   227
(* FUDGE *)
blanchet@42646
   228
val e_default_fun_weight =
blanchet@42646
   229
  Attrib.setup_config_real @{binding atp_e_default_fun_weight} (K 20.0)
blanchet@42646
   230
val e_fun_weight_base =
blanchet@42646
   231
  Attrib.setup_config_real @{binding atp_e_fun_weight_base} (K 0.0)
blanchet@42646
   232
val e_fun_weight_span =
blanchet@42646
   233
  Attrib.setup_config_real @{binding atp_e_fun_weight_span} (K 40.0)
blanchet@42646
   234
val e_default_sym_offs_weight =
blanchet@42646
   235
  Attrib.setup_config_real @{binding atp_e_default_sym_offs_weight} (K 1.0)
blanchet@42646
   236
val e_sym_offs_weight_base =
blanchet@42646
   237
  Attrib.setup_config_real @{binding atp_e_sym_offs_weight_base} (K ~20.0)
blanchet@42646
   238
val e_sym_offs_weight_span =
blanchet@42646
   239
  Attrib.setup_config_real @{binding atp_e_sym_offs_weight_span} (K 60.0)
blanchet@41725
   240
blanchet@47038
   241
(* Selects "fw" for the "fun_weight" heuristic and "sow" for the
   "sym_offset_weight" heuristic; any other heuristic name raises Fail. *)
fun e_selection_heuristic_case heuristic fw sow =
  let val choices = [(e_fun_weightN, fw), (e_sym_offset_weightN, sow)] in
    (case List.find (fn (name, _) => name = heuristic) choices of
      SOME (_, choice) => choice
    | NONE => raise Fail ("unexpected " ^ quote heuristic))
  end
blanchet@41725
   245
blanchet@47038
   246
(* Maps the weight "w" to "w * span + base", where span and base are the
   configuration options belonging to the given heuristic, rounds the result
   up to an integer and renders it as a signed decimal string. *)
fun scaled_e_selection_weight ctxt heuristic w =
  let
    val span =
      Config.get ctxt
        (e_selection_heuristic_case heuristic
             e_fun_weight_span e_sym_offs_weight_span)
    val base =
      Config.get ctxt
        (e_selection_heuristic_case heuristic
             e_fun_weight_base e_sym_offs_weight_base)
  in signed_string_of_int (Real.ceil (w * span + base)) end
blanchet@41313
   252
blanchet@47038
   253
(* Builds E's clause-selection options. For the "auto" heuristic this is just
   "-xAuto"; otherwise a fixed option string (supplied by Stephan Schulz) is
   produced whose -H argument embeds the heuristic's weight function name, its
   default weight, and one ",symbol:weight" entry per pair returned by
   "sel_weights ()". The pieces are computed in the order in which they appear
   in the final string. *)
fun e_selection_weight_arguments ctxt heuristic sel_weights =
  if heuristic <> e_autoN then
    let
      val weight_fun_name =
        e_selection_heuristic_case heuristic "FunWeight" "SymOffsetWeight"
      val default_weight =
        signed_string_of_int (Real.ceil (Config.get ctxt
          (e_selection_heuristic_case heuristic
               e_default_fun_weight e_default_sym_offs_weight)))
      fun weight_entry (s, w) =
        "," ^ s ^ ":" ^ scaled_e_selection_weight ctxt heuristic w
      val weight_entries = implode (map weight_entry (sel_weights ()))
    in
      (* supplied by Stephan Schulz *)
      String.concat
        ["--split-clauses=4 --split-reuse-defs --simul-paramod --forward-context-sr \
         \--destructive-er-aggressive --destructive-er --presat-simplify \
         \--prefer-initial-clauses -winvfreqrank -c1 -Ginvfreqconjmax -F1 \
         \--delete-bad-limit=150000000 -WSelectMaxLComplexAvoidPosPred -H'(4*",
         weight_fun_name,
         "(SimulateSOS, ",
         default_weight,
         ",20,1.5,1.5,1",
         weight_entries,
         "),3*ConjectureGeneralSymbolWeight(PreferNonGoals,200,100,200,50,50,1,100,\
         \1.5,1.5,1),1*Clauseweight(PreferProcessed,1,1,1),1*\
         \FIFOWeight(PreferProcessed))'"]
    end
  else
    "-xAuto"
blanchet@41313
   275
blanchet@47038
   276
(* Renders (symbol, weight) pairs as a comma-separated "symbol:weight" list. *)
fun e_ord_weights ord_info =
  let fun entry (sym, weight) = sym ^ ":" ^ string_of_int weight
  in space_implode "," (map entry ord_info) end
blanchet@47038
   278
(* Renders the symbols of "info" as a "<"-separated chain, in list order. A
   list with exactly one entry yields the empty string. *)
fun e_ord_precedence info =
  (case info of
    [_] => ""
  | _ => space_implode "<" (map (fn (sym, _) => sym) info))
blanchet@47038
   280
blanchet@47039
   281
(* Produces the "--order-weights" and/or "--precedence" options for E, as
   requested by the two flags. The "ord_info" thunk is only forced when at
   least one of the flags is set, and then exactly once. *)
fun e_term_order_info_arguments gen_weights gen_prec ord_info =
  if not gen_weights andalso not gen_prec then
    ""
  else
    let
      val info = ord_info ()
      val weights_arg =
        if gen_weights then "--order-weights='" ^ e_ord_weights info ^ "' "
        else ""
      val prec_arg =
        if gen_prec then "--precedence='" ^ e_ord_precedence info ^ "' "
        else ""
    in weights_arg ^ prec_arg end
blanchet@47038
   289
blanchet@47032
   290
(* The selection heuristic actually used for E: the configured
   "atp_e_selection_heuristic" for new E versions, and "auto" otherwise. *)
fun effective_e_selection_heuristic ctxt =
  if not (is_new_e_version ()) then e_autoN
  else Config.get ctxt e_selection_heuristic
blanchet@42443
   292
blanchet@47505
   293
(* Name passed to E's "--term-ordering" option for KBO: "KBO6" for new E
   versions, "KBO" otherwise. *)
fun e_kbo () =
  (case is_new_e_version () of
    true => "KBO6"
  | false => "KBO")
blanchet@47505
   294
blanchet@40059
   295
(* E, run as "eproof" (looked up via E_HOME). The third argument of
   "arguments" is the selection heuristic, which "best_slices" supplies as each
   slice's extra string. With the "smart" heuristic the time is split over
   three slices using "fun_weight" and "sym_offset_weight"; otherwise a single
   slice with the effective heuristic is used. *)
val e_config : atp_config =
blanchet@47055
   296
  {exec = (["E_HOME"], "eproof"),
blanchet@47055
   297
   required_vars = [],
blanchet@43354
   298
   arguments =
blanchet@47038
   299
     fn ctxt => fn _ => fn heuristic => fn timeout =>
blanchet@47038
   300
        fn ({is_lpo, gen_weights, gen_prec, ...}, ord_info, sel_weights) =>
blanchet@47038
   301
        "--tstp-in --tstp-out --output-level=5 --silent " ^
blanchet@47038
   302
        e_selection_weight_arguments ctxt heuristic sel_weights ^ " " ^
blanchet@47039
   303
        e_term_order_info_arguments gen_weights gen_prec ord_info ^ " " ^
blanchet@47505
   304
        "--term-ordering=" ^ (if is_lpo then "LPO4" else e_kbo ()) ^ " " ^
blanchet@47038
   305
        "--cpu-limit=" ^ string_of_int (to_secs 2 timeout),
blanchet@42962
   306
   proof_delims = tstp_proof_delims,
blanchet@36265
   307
   known_failures =
blanchet@45203
   308
     [(TimedOut, "Failure: Resource limit exceeded (time)"),
blanchet@47972
   309
      (TimedOut, "time limit exceeded")] @
blanchet@47972
   310
     known_szs_status_failures,
blanchet@47976
   311
   prem_role = Conjecture,
blanchet@42646
   312
   best_slices = fn ctxt =>
blanchet@47038
   313
     let val heuristic = effective_e_selection_heuristic ctxt in
blanchet@43474
   314
       (* FUDGE *)
blanchet@47038
   315
       if heuristic = e_smartN then
blanchet@46449
   316
         [(0.333, (true, ((500, FOF, "mono_tags??", combsN, false), e_fun_weightN))),
blanchet@46449
   317
          (0.334, (true, ((50, FOF, "mono_guards??", combsN, false), e_fun_weightN))),
blanchet@46449
   318
          (0.333, (true, ((1000, FOF, "mono_tags??", combsN, false), e_sym_offset_weightN)))]
blanchet@43473
   319
       else
blanchet@47038
   320
         [(1.0, (true, ((500, FOF, "mono_tags??", combsN, false), heuristic)))]
blanchet@47962
   321
     end,
blanchet@47962
   322
   best_max_mono_iters = default_max_mono_iters,
blanchet@47962
   323
   best_max_new_mono_instances = default_max_new_mono_instances}
blanchet@38454
   324
blanchet@47646
   325
val e = (eN, fn () => e_config)
wenzelm@28596
   326
wenzelm@28596
   327
blanchet@44099
   328
(* LEO-II *)
blanchet@44099
   329
blanchet@48004
   330
(* LEO-II supports definitions, but it performs significantly better on our
blanchet@48004
   331
   benchmarks when they are not used. *)
blanchet@48004
   332
val leo2_thf0 =
blanchet@48130
   333
  THF (Monomorphic, TPTP_Explicit, THF_Without_Choice, THF_Without_Defs)
blanchet@44754
   334
blanchet@44099
   335
(* LEO-II, run as "leo" (looked up via LEO2_HOME). The arguments pass E's
   "eprover" and "epclextract" from "$E_HOME" via "--foatp"/"--atp". The
   monomorphization bounds are set below the defaults (one iteration fewer,
   half as many new instances). *)
val leo2_config : atp_config =
blanchet@47055
   336
  {exec = (["LEO2_HOME"], "leo"),
blanchet@47055
   337
   required_vars = [],
blanchet@44099
   338
   arguments =
blanchet@47916
   339
     fn _ => fn _ => fn _ => fn timeout => fn _ =>
blanchet@48084
   340
        "--foatp e --atp e=\"$E_HOME\"/eprover \
blanchet@48084
   341
        \--atp epclextract=\"$E_HOME\"/epclextract \
blanchet@48084
   342
        \--proofoutput 1 --timeout " ^
blanchet@48084
   343
        string_of_int (to_secs 1 timeout),
blanchet@44099
   344
   proof_delims = tstp_proof_delims,
blanchet@45207
   345
   known_failures =
blanchet@47974
   346
     [(TimedOut, "CPU time limit exceeded, terminating"),
blanchet@47972
   347
      (GaveUp, "No.of.Axioms")] @
blanchet@47972
   348
     known_szs_status_failures,
blanchet@47976
   349
   prem_role = Hypothesis,
blanchet@47914
   350
   best_slices =
blanchet@44099
   351
     (* FUDGE *)
blanchet@48097
   352
     K [(1.0, (true, ((40, leo2_thf0, "mono_native_higher", keep_lamsN, false), "")))],
blanchet@47962
   353
   best_max_mono_iters = default_max_mono_iters - 1 (* FUDGE *),
blanchet@47962
   354
   best_max_new_mono_instances = default_max_new_mono_instances div 2 (* FUDGE *)}
blanchet@39491
   355
blanchet@47646
   356
val leo2 = (leo2N, fn () => leo2_config)
blanchet@44099
   357
blanchet@44099
   358
blanchet@44099
   359
(* Satallax *)
blanchet@44099
   360
blanchet@48004
   361
val satallax_thf0 =
blanchet@48130
   362
  THF (Monomorphic, TPTP_Explicit, THF_With_Choice, THF_With_Defs)
blanchet@44754
   363
blanchet@44099
   364
(* Satallax (looked up via SATALLAX_HOME), run with "-p hocore". The proof
   delimiters bracket the "Higher-Order Unsat Core" section of the output. The
   monomorphization bounds are set below the defaults (one iteration fewer,
   half as many new instances). *)
val satallax_config : atp_config =
blanchet@47055
   365
  {exec = (["SATALLAX_HOME"], "satallax"),
blanchet@47055
   366
   required_vars = [],
blanchet@44099
   367
   arguments =
blanchet@44099
   368
     fn _ => fn _ => fn _ => fn timeout => fn _ =>
blanchet@45162
   369
        "-p hocore -t " ^ string_of_int (to_secs 1 timeout),
blanchet@45162
   370
   proof_delims =
blanchet@45162
   371
     [("% Higher-Order Unsat Core BEGIN", "% Higher-Order Unsat Core END")],
blanchet@45203
   372
   known_failures = known_szs_status_failures,
blanchet@47981
   373
   prem_role = Hypothesis,
blanchet@44416
   374
   best_slices =
blanchet@44754
   375
     (* FUDGE *)
blanchet@47985
   376
     K [(1.0, (true, ((60, satallax_thf0, "mono_native_higher", keep_lamsN, false), "")))],
blanchet@47962
   377
   best_max_mono_iters = default_max_mono_iters - 1 (* FUDGE *),
blanchet@47962
   378
   best_max_new_mono_instances = default_max_new_mono_instances div 2 (* FUDGE *)}
blanchet@44099
   379
blanchet@47646
   380
val satallax = (satallaxN, fn () => satallax_config)
blanchet@44099
   381
blanchet@44099
   382
blanchet@44099
   383
(* SPASS *)
blanchet@42725
   384
blanchet@48005
   385
val spass_H1SOS = "-Heuristic=1 -SOS"
blanchet@48005
   386
val spass_H2LR0LT0 = "-Heuristic=2 -LR=0 -LT=0"
blanchet@48005
   387
val spass_H2SOS = "-Heuristic=2 -SOS"
blanchet@48005
   388
val spass_H2NuVS0 = "-Heuristic=2 -RNuV=1 -Sorts=0"
blanchet@48005
   389
val spass_H2NuVS0Red2 = "-Heuristic=2 -RNuV=1 -Sorts=0 -RFRew=2 -RBRew=2 -RTaut=2"
blanchet@47055
   390
blanchet@48005
   391
(* FIXME: Make "SPASS_NEW_HOME" legacy. *)
blanchet@48005
   392
(* SPASS (executable "SPASS", looked up via SPASS_NEW_HOME or SPASS_HOME). The
   third argument of "arguments" holds extra command-line options taken from
   the slice's extra string; when nonempty, they are put in front of the fixed
   "-Isabelle=1 -TimeLimit=..." options. All slices are marked as incomplete
   strategies. *)
val spass_config : atp_config =
blanchet@48005
   393
  {exec = (["SPASS_NEW_HOME", "SPASS_HOME"], "SPASS"),
blanchet@48005
   394
   required_vars = [],
blanchet@48005
   395
   arguments = fn _ => fn _ => fn extra_options => fn timeout => fn _ =>
blanchet@48005
   396
     ("-Isabelle=1 -TimeLimit=" ^ string_of_int (to_secs 1 timeout))
blanchet@48005
   397
     |> extra_options <> "" ? prefix (extra_options ^ " "),
blanchet@36369
   398
   proof_delims = [("Here is a proof", "Formulae used in the proof")],
blanchet@36289
   399
   known_failures =
blanchet@48005
   400
     [(OldSPASS, "Unrecognized option Isabelle"),
blanchet@47950
   401
      (GaveUp, "SPASS beiseite: Completion found"),
blanchet@36370
   402
      (TimedOut, "SPASS beiseite: Ran out of time"),
blanchet@36965
   403
      (OutOfResources, "SPASS beiseite: Maximal number of loops exceeded"),
blanchet@37413
   404
      (MalformedInput, "Undefined symbol"),
blanchet@37414
   405
      (MalformedInput, "Free Variable"),
blanchet@44391
   406
      (Unprovable, "No formulae and clauses found in input file"),
blanchet@47972
   407
      (InternalError, "Please report this error")] @
blanchet@47972
   408
      known_perl_failures,
blanchet@47976
   409
   prem_role = Conjecture,
blanchet@48005
   410
   best_slices = fn _ =>
blanchet@42723
   411
     (* FUDGE *)
blanchet@48129
   412
     [(0.1667, (false, ((150, DFG, "mono_native", combsN, true), ""))),
blanchet@48129
   413
      (0.1667, (false, ((500, DFG, "mono_native", liftingN, true), spass_H2SOS))),
blanchet@48129
   414
      (0.1666, (false, ((50, DFG,  "mono_native", liftingN, true), spass_H2LR0LT0))),
blanchet@48129
   415
      (0.1000, (false, ((250, DFG, "mono_native", combsN, true), spass_H2NuVS0))),
blanchet@48129
   416
      (0.1000, (false, ((1000, DFG, "mono_native", liftingN, true), spass_H1SOS))),
blanchet@48129
   417
      (0.1000, (false, ((150, DFG, "poly_guards??", liftingN, false), spass_H2NuVS0Red2))),
blanchet@48129
   418
      (0.1000, (false, ((300, DFG, "mono_native", combsN, true), spass_H2SOS))),
blanchet@48129
   419
      (0.1000, (false, ((100, DFG, "mono_native", combs_and_liftingN, true), spass_H2NuVS0)))],
blanchet@47962
   420
   best_max_mono_iters = default_max_mono_iters,
blanchet@47962
   421
   best_max_new_mono_instances = default_max_new_mono_instances}
blanchet@38454
   422
blanchet@48005
   423
val spass = (spassN, fn () => spass_config)
blanchet@38454
   424
blanchet@37509
   425
(* Vampire *)
blanchet@37509
   426
blanchet@48007
   427
(* Vampire 1.8 has TFF support, but the support was buggy until revision
blanchet@48007
   428
   1435 (or shortly before). *)
blanchet@47055
   429
(* True iff the VAMPIRE_VERSION setting sorts strictly after "1.8".
   NOTE(review): this is a plain string comparison via "string_ord", not a
   numeric version comparison, so a version such as "1.10" would presumably
   sort before "1.8" -- confirm before relying on it for two-digit minors. *)
fun is_new_vampire_version () =
  (case string_ord (getenv "VAMPIRE_VERSION", "1.8") of
    GREATER => true
  | _ => false)
blanchet@44420
   431
blanchet@48130
   432
val vampire_tff0 = TFF (Monomorphic, TPTP_Implicit)
blanchet@44589
   433
blanchet@40059
   434
(* Vampire (looked up via VAMPIRE_HOME), run in CASC mode. The slice's extra
   string selects SOS: when it equals "sosN", "--sos on " is put in front of
   the arguments. "best_slices" uses TFF0 slices for new Vampire versions and
   FOF slices otherwise; if "atp_force_sos" is set, only the first slice is
   kept and it is given the whole time (fraction 1.0). *)
val vampire_config : atp_config =
blanchet@47055
   435
  {exec = (["VAMPIRE_HOME"], "vampire"),
blanchet@47055
   436
   required_vars = [],
blanchet@43569
   437
   arguments = fn _ => fn _ => fn sos => fn timeout => fn _ =>
blanchet@44417
   438
     "--mode casc -t " ^ string_of_int (to_secs 1 timeout) ^
blanchet@45234
   439
     " --proof tptp --output_axiom_names on\
blanchet@45234
   440
     \ --forced_options propositional_to_bdd=off\
blanchet@44417
   441
     \ --thanks \"Andrei and Krystof\" --input_file"
blanchet@43473
   442
     |> sos = sosN ? prefix "--sos on ",
blanchet@37509
   443
   proof_delims =
blanchet@37509
   444
     [("=========== Refutation ==========",
blanchet@37509
   445
       "======= End of refutation ======="),
blanchet@38033
   446
      ("% SZS output start Refutation", "% SZS output end Refutation"),
blanchet@38033
   447
      ("% SZS output start Proof", "% SZS output end Proof")],
blanchet@37509
   448
   known_failures =
blanchet@43050
   449
     [(GaveUp, "UNPROVABLE"),
blanchet@43050
   450
      (GaveUp, "CANNOT PROVE"),
blanchet@37509
   451
      (Unprovable, "Satisfiability detected"),
blanchet@38647
   452
      (Unprovable, "Termination reason: Satisfiable"),
blanchet@47972
   453
      (Interrupted, "Aborted by signal SIGINT")] @
blanchet@47972
   454
     known_szs_status_failures,
blanchet@47976
   455
   prem_role = Conjecture,
blanchet@42725
   456
   best_slices = fn ctxt =>
blanchet@42723
   457
     (* FUDGE *)
blanchet@47055
   458
     (if is_new_vampire_version () then
blanchet@47948
   459
        [(0.333, (false, ((500, vampire_tff0, "mono_native", combs_or_liftingN, false), sosN))),
blanchet@47948
   460
         (0.333, (false, ((150, vampire_tff0, "poly_guards??", combs_or_liftingN, false), sosN))),
blanchet@47055
   461
         (0.334, (true, ((50, vampire_tff0, "mono_native", combs_or_liftingN, false), no_sosN)))]
blanchet@47055
   462
      else
blanchet@46449
   463
        [(0.333, (false, ((150, FOF, "poly_guards??", combs_or_liftingN, false), sosN))),
blanchet@46449
   464
         (0.333, (false, ((500, FOF, "mono_tags??", combs_or_liftingN, false), sosN))),
blanchet@47055
   465
         (0.334, (true, ((50, FOF, "mono_guards??", combs_or_liftingN, false), no_sosN)))])
blanchet@44099
   466
     |> (if Config.get ctxt force_sos then hd #> apfst (K 1.0) #> single
blanchet@47962
   467
         else I),
blanchet@47962
   468
   best_max_mono_iters = default_max_mono_iters,
blanchet@47962
   469
   best_max_new_mono_instances = default_max_new_mono_instances}
blanchet@38454
   470
blanchet@47646
   471
val vampire = (vampireN, fn () => vampire_config)
blanchet@37509
   472
blanchet@38454
   473
blanchet@41740
   474
(* Z3 with TPTP syntax *)
blanchet@41740
   475
blanchet@48130
   476
val z3_tff0 = TFF (Monomorphic, TPTP_Implicit)
blanchet@44589
   477
blanchet@44423
   478
(* Z3 reading TPTP input (looked up via Z3_HOME, run with "MBQI=true -tptp").
   No proof delimiters are configured. Four monomorphic TFF0 slices are used,
   with 250, 125, 62 and 31 facts and time fractions 0.5, 0.25, 0.125 and
   0.125. *)
val z3_tptp_config : atp_config =
blanchet@47055
   479
  {exec = (["Z3_HOME"], "z3"),
blanchet@47055
   480
   required_vars = [],
blanchet@43354
   481
   arguments = fn _ => fn _ => fn _ => fn timeout => fn _ =>
blanchet@44420
   482
     "MBQI=true -tptp -t:" ^ string_of_int (to_secs 1 timeout),
blanchet@41740
   483
   proof_delims = [],
blanchet@45203
   484
   known_failures = known_szs_status_failures,
blanchet@47976
   485
   prem_role = Hypothesis,
blanchet@42723
   486
   best_slices =
blanchet@44423
   487
     (* FUDGE *)
blanchet@46435
   488
     K [(0.5, (false, ((250, z3_tff0, "mono_native", combsN, false), ""))),
blanchet@46435
   489
        (0.25, (false, ((125, z3_tff0, "mono_native", combsN, false), ""))),
blanchet@46435
   490
        (0.125, (false, ((62, z3_tff0, "mono_native", combsN, false), ""))),
blanchet@47962
   491
        (0.125, (false, ((31, z3_tff0, "mono_native", combsN, false), "")))],
blanchet@47962
   492
   best_max_mono_iters = default_max_mono_iters,
blanchet@47962
   493
   best_max_new_mono_instances = default_max_new_mono_instances}
blanchet@41740
   494
blanchet@47646
   495
val z3_tptp = (z3_tptpN, fn () => z3_tptp_config)
blanchet@41740
   496
blanchet@44590
   497
blanchet@44754
   498
(* Not really a prover: Experimental Polymorphic TFF and THF output *)
blanchet@44590
   499
blanchet@44754
   500
(* Configuration for the "scripts/dummy_atp" script (looked up via
   ISABELLE_ATP), parameterized by the output format and type encoding. It
   takes no command-line arguments and has a single slice of 200 facts, using
   "keep_lamsN" for higher-order formats and "combsN" otherwise. *)
fun dummy_config format type_enc : atp_config =
blanchet@47055
   501
  {exec = (["ISABELLE_ATP"], "scripts/dummy_atp"),
blanchet@47055
   502
   required_vars = [],
blanchet@44590
   503
   arguments = K (K (K (K (K "")))),
blanchet@44590
   504
   proof_delims = [],
blanchet@45203
   505
   known_failures = known_szs_status_failures,
blanchet@47976
   506
   prem_role = Hypothesis,
blanchet@45521
   507
   best_slices =
blanchet@46407
   508
     K [(1.0, (false, ((200, format, type_enc,
blanchet@46407
   509
                        if is_format_higher_order format then keep_lamsN
blanchet@47962
   510
                        else combsN, false), "")))],
blanchet@47962
   511
   best_max_mono_iters = default_max_mono_iters,
blanchet@47962
   512
   best_max_new_mono_instances = default_max_new_mono_instances}
blanchet@44590
   513
blanchet@48004
   514
val dummy_thf_format =
blanchet@48130
   515
  THF (Polymorphic, TPTP_Explicit, THF_With_Choice, THF_With_Defs)
blanchet@46435
   516
val dummy_thf_config = dummy_config dummy_thf_format "poly_native_higher"
blanchet@47646
   517
val dummy_thf = (dummy_thfN, fn () => dummy_thf_config)
blanchet@44754
   518
blanchet@41740
   519
blanchet@40059
   520
(* Remote ATP invocation via SystemOnTPTP *)
wenzelm@28596
   521
blanchet@38061
   522
val systems = Synchronized.var "atp_systems" ([] : string list)
immler@31835
   523
immler@31835
   524
(* Runs the "remote_atp" script with "-w" and returns its output split into
   lines. If the script exits with a nonzero return code, an error is raised:
   the message of a known Perl failure if one is recognized in the output, or
   else the trimmed output itself followed by a period. *)
fun get_systems () =
  let
    val (output, return_code) =
      Isabelle_System.bash_output
          "\"$ISABELLE_ATP/scripts/remote_atp\" -w 2>&1"
  in
    if return_code = 0 then
      split_lines output
    else
      (case extract_known_failure known_perl_failures output of
        SOME failure => error (string_for_failure failure)
      | NONE => error (trim_line output ^ "."))
  end
immler@31835
   532
blanchet@42537
   533
(* Looks up a system in the list "systems". The candidate versions are tried
   in order, each time searching for the first entry that starts with
   "<name>---<version>"; if none matches (or no versions are given), the first
   entry that starts with "<name>---" is returned, if any. *)
fun find_system name versions systems =
  let
    fun first_with_prefix pfx = find_first (String.isPrefix pfx) systems
    fun try_versions [] = first_with_prefix (name ^ "---")
      | try_versions (version :: rest) =
        (case first_with_prefix (name ^ "---" ^ version) of
          NONE => try_versions rest
        | found => found)
  in try_versions versions end
blanchet@38690
   539
blanchet@38690
   540
(* Resolves name/versions against the cached system list.  If the cache is
   empty, get_systems is called first and its result becomes the new cache
   contents.  Returns a pair of the find_system result and the system list
   that was searched.  Note that an empty list returned by get_systems leaves
   the cache empty, so the next call queries again. *)
fun get_system name versions =
blanchet@38589
   541
  Synchronized.change_result systems
blanchet@38589
   542
      (fn systems => (if null systems then get_systems () else systems)
blanchet@42955
   543
                     |> `(`(find_system name versions)))
boehmes@32864
   544
blanchet@38690
   545
(* Like get_system, but returns the matching system string directly and
   raises an error if there is none.  The error message depends on the
   system list: an empty list, or one with only empty lines and lines
   starting with "%", yields "SystemOnTPTP is not available."; exactly one
   remaining line is reported as the reason for unavailability; several
   remaining lines are taken to be the available systems and are listed
   alongside the requested name. *)
fun the_system name versions =
blanchet@38690
   546
  case get_system name versions of
blanchet@42955
   547
    (SOME sys, _) => sys
blanchet@46480
   548
  | (NONE, []) => error ("SystemOnTPTP is not available.")
blanchet@42955
   549
  | (NONE, syss) =>
blanchet@46480
   550
    case syss |> filter_out (String.isPrefix "%")
blanchet@46480
   551
              |> filter_out (curry (op =) "") of
blanchet@46480
   552
      [] => error ("SystemOnTPTP is not available.")
blanchet@46480
   553
    | [msg] => error ("SystemOnTPTP is not available: " ^ msg ^ ".")
blanchet@46480
   554
    | syss =>
blanchet@46480
   555
      error ("System " ^ quote name ^ " is not available at SystemOnTPTP.\n" ^
blanchet@46480
   556
             "(Available systems: " ^ commas_quote syss ^ ".)")
immler@31835
   557
blanchet@41148
   558
(* Upper bound, in seconds, on the "-t" timeout that remote_config passes to
   the remote_atp script. *)
val max_remote_secs = 240 (* give Geoff Sutcliffe's servers a break *)
blanchet@41148
   559
blanchet@38690
   560
(* Builds the atp_config for a prover run through "scripts/remote_atp"
   (located via ISABELLE_ATP).  The argument string consists of an optional
   "-c" with the quoted command (omitted when the command is empty), "-s"
   with the system resolved by the_system, and "-t" with the timeout in
   seconds capped at max_remote_secs.  Because the_system is called inside
   the arguments function, the system lookup (and any resulting error) only
   happens when the arguments are actually computed.  The given proof
   delimiters are merged with tstp_proof_delims, and the given known
   failures are extended with the Perl and "says" failure tables.  The
   single slice has weight 1.0 and comes from best_slice applied to the
   context. *)
fun remote_config system_name system_versions proof_delims known_failures
blanchet@47976
   561
                  prem_role best_slice : atp_config =
blanchet@47055
   562
  {exec = (["ISABELLE_ATP"], "scripts/remote_atp"),
blanchet@47055
   563
   required_vars = [],
blanchet@47074
   564
   arguments = fn _ => fn _ => fn command => fn timeout => fn _ =>
blanchet@47074
   565
     (if command <> "" then "-c " ^ quote command ^ " " else "") ^
blanchet@47074
   566
     "-s " ^ the_system system_name system_versions ^ " " ^
blanchet@47074
   567
     "-t " ^ string_of_int (Int.min (max_remote_secs, to_secs 1 timeout)),
blanchet@42962
   568
   proof_delims = union (op =) tstp_proof_delims proof_delims,
blanchet@45203
   569
   known_failures = known_failures @ known_perl_failures @ known_says_failures,
blanchet@47976
   570
   prem_role = prem_role,
blanchet@47962
   571
   best_slices = fn ctxt => [(1.0, (false, best_slice ctxt))],
blanchet@47962
   572
   best_max_mono_iters = default_max_mono_iters,
blanchet@47962
   573
   best_max_new_mono_instances = default_max_new_mono_instances}
blanchet@42443
   574
blanchet@43500
   575
(* Derives a remote configuration from an existing atp_config: the proof
   delimiters, known failures and premise role are taken over from the given
   configuration, and everything else is supplied by remote_config. *)
fun remotify_config system_name system_versions best_slice
blanchet@47976
   576
        ({proof_delims, known_failures, prem_role, ...} : atp_config)
blanchet@47912
   577
        : atp_config =
blanchet@38690
   578
  remote_config system_name system_versions proof_delims known_failures
blanchet@47976
   579
                prem_role best_slice
blanchet@38023
   580
blanchet@40059
   581
(* Creates a registrable entry for a prover that has no local configuration
   to derive from: the name is prefixed with remote_prefix, and the
   configuration is a thunk that calls remote_config when forced. *)
fun remote_atp name system_name system_versions proof_delims known_failures
blanchet@47976
   582
               prem_role best_slice =
blanchet@40060
   583
  (remote_prefix ^ name,
blanchet@47912
   584
   fn () => remote_config system_name system_versions proof_delims
blanchet@47976
   585
                          known_failures prem_role best_slice)
blanchet@43500
   586
(* Creates the remote counterpart of an existing (name, config) entry: the
   name is prefixed with remote_prefix, and the configuration function is
   post-composed with remotify_config. *)
fun remotify_atp (name, config) system_name system_versions best_slice =
blanchet@43500
   587
  (remote_prefix ^ name,
blanchet@47606
   588
   remotify_config system_name system_versions best_slice o config)
wenzelm@28592
   589
blanchet@48130
   590
(* Monomorphic TFF format with the TPTP_Explicit flag; used by the remote
   SNARK and ToFoF entries. *)
val explicit_tff0 = TFF (Monomorphic, TPTP_Explicit)
blanchet@44589
   591
blanchet@43500
   592
(* Remote counterparts of provers that also have a local configuration.
   Each entry gives the system name as known to SystemOnTPTP, the versions
   to look for in order of preference (see find_system), and a constant
   slice.  The slice values are marked FUDGE, i.e. presumably hand-tuned. *)
val remote_e =
blanchet@43500
   593
  remotify_atp e "EP" ["1.0", "1.1", "1.2"]
blanchet@47074
   594
      (K ((750, FOF, "mono_tags??", combsN, false), "") (* FUDGE *))
blanchet@44099
   595
val remote_leo2 =
blanchet@44099
   596
  remotify_atp leo2 "LEO-II" ["1.2.8", "1.2.6"]
blanchet@47074
   597
      (K ((100, leo2_thf0, "mono_native_higher", liftingN, false), "") (* FUDGE *))
blanchet@44099
   598
val remote_satallax =
blanchet@47074
   599
  remotify_atp satallax "Satallax" ["2.3", "2.2", "2"]
blanchet@47076
   600
      (K ((100, satallax_thf0, "mono_native_higher", keep_lamsN, false), "") (* FUDGE *))
blanchet@43500
   601
val remote_vampire =
blanchet@48077
   602
  remotify_atp vampire "Vampire" ["2.6", "2.5", "1.8"]
blanchet@47074
   603
      (K ((250, vampire_tff0, "mono_native", combs_or_liftingN, false), "") (* FUDGE *))
blanchet@44423
   604
val remote_z3_tptp =
blanchet@44754
   605
  remotify_atp z3_tptp "Z3" ["3.0"]
blanchet@47074
   606
      (K ((250, z3_tff0, "mono_native", combsN, false), "") (* FUDGE *))
blanchet@44092
   607
(* Provers that are only available remotely, built directly with remote_atp.
   The arguments are, in order: the registered name (before remote_prefix is
   added), the SystemOnTPTP system name, the preferred versions, extra proof
   delimiters, known failures, the premise role, and a constant slice.  An
   empty version list makes find_system accept any version of the system. *)
val remote_e_sine =
blanchet@47912
   608
  remote_atp e_sineN "SInE" ["0.4"] [] (#known_failures e_config) Conjecture
blanchet@47074
   609
      (K ((500, FOF, "mono_guards??", combsN, false), "") (* FUDGE *))
blanchet@45338
   610
val remote_iprover =
blanchet@47912
   611
  remote_atp iproverN "iProver" [] [] [] Conjecture
blanchet@47074
   612
      (K ((150, FOF, "mono_guards??", liftingN, false), "") (* FUDGE *))
blanchet@45338
   613
val remote_iprover_eq =
blanchet@47912
   614
  remote_atp iprover_eqN "iProver-Eq" [] [] [] Conjecture
blanchet@47074
   615
      (K ((150, FOF, "mono_guards??", liftingN, false), "") (* FUDGE *))
blanchet@41740
   616
val remote_snark =
blanchet@42939
   617
  remote_atp snarkN "SNARK" ["20080805r029", "20080805r024"]
blanchet@47912
   618
      [("refutation.", "end_refutation.")] [] Hypothesis
blanchet@47074
   619
      (K ((100, explicit_tff0, "mono_native", liftingN, false), "") (* FUDGE *))
blanchet@44092
   620
val remote_e_tofof =
blanchet@47912
   621
  remote_atp e_tofofN "ToFoF" ["0.1"] [] (#known_failures e_config) Hypothesis
blanchet@47074
   622
      (K ((150, explicit_tff0, "mono_native", liftingN, false), "") (* FUDGE *))
blanchet@42938
   623
val remote_waldmeister =
blanchet@42938
   624
  remote_atp waldmeisterN "Waldmeister" ["710"]
blanchet@45521
   625
      [("#START OF PROOF", "Proved Goals:")]
blanchet@45521
   626
      [(OutOfResources, "Too many function symbols"),
blanchet@47506
   627
       (Inappropriate, "****  Unexpected end of file."),
blanchet@45521
   628
       (Crashed, "Unrecoverable Segmentation Fault")]
blanchet@47912
   629
      Hypothesis
blanchet@47898
   630
      (K ((50, CNF_UEQ, "raw_mono_tags??", combsN, false), "") (* FUDGE *))
blanchet@38454
   631
blanchet@38454
   632
(* Setup *)
blanchet@38454
   633
blanchet@40059
   634
(* Registers a prover in the theory data table under the given name, paired
   with a fresh stamp.  Symtab.update_new refuses to overwrite an existing
   key; the resulting DUP exception is turned into a "Duplicate ATP" error. *)
fun add_atp (name, config) thy =
blanchet@40059
   635
  Data.map (Symtab.update_new (name, (config, stamp ()))) thy
blanchet@40059
   636
  handle Symtab.DUP name => error ("Duplicate ATP: " ^ quote name ^ ".")
blanchet@40059
   637
blanchet@40059
   638
(* Returns the configuration component registered under name, dropping the
   stamp.  A failed lookup is reported as an "Unknown ATP" error. *)
fun get_atp thy name =
blanchet@40059
   639
  the (Symtab.lookup (Data.get thy) name) |> fst
blanchet@40059
   640
  handle Option.Option => error ("Unknown ATP: " ^ name ^ ".")
blanchet@40059
   641
blanchet@41727
   642
(* Names of all provers registered in the given theory's data table. *)
val supported_atps = Symtab.keys o Data.get
blanchet@36371
   643
blanchet@40059
   644
(* Checks the environment for the named prover.  The registered configuration
   thunk is forced, and the result is true iff every variable list -- the
   first component of exec plus each list in required_vars -- contains at
   least one environment variable with a non-empty value. *)
fun is_atp_installed thy name =
blanchet@47606
   645
  let val {exec, required_vars, ...} = get_atp thy name () in
blanchet@47055
   646
    forall (exists (fn var => getenv var <> "")) (fst exec :: required_vars)
blanchet@40059
   647
  end
blanchet@36371
   648
blanchet@40059
   649
(* Unconditionally replaces the cached system list with a fresh result of
   get_systems, discarding whatever was cached before. *)
fun refresh_systems_on_tptp () =
blanchet@40059
   650
  Synchronized.change systems (fn _ => get_systems ())
blanchet@40059
   651
blanchet@47055
   652
(* Computes the term-order record for a prover from the term_order
   configuration option.  If the option equals smartN, weights and
   precedences are generated for spassN only, and every other prover gets a
   record with all flags false.  Otherwise the flags are derived from
   substrings of the option value: is_lpo from lpoN, gen_prec from xprecN,
   gen_simp from xsimpN, and gen_weights from xweightsN, but only when LPO
   is not selected. *)
fun effective_term_order ctxt atp =
blanchet@47055
   653
  let val ord = Config.get ctxt term_order in
blanchet@47055
   654
    if ord = smartN then
blanchet@48005
   655
      if atp = spassN then
blanchet@47073
   656
        {is_lpo = false, gen_weights = true, gen_prec = true, gen_simp = false}
blanchet@47055
   657
      else
blanchet@47055
   658
        {is_lpo = false, gen_weights = false, gen_prec = false,
blanchet@47055
   659
         gen_simp = false}
blanchet@47055
   660
    else
blanchet@47055
   661
      let val is_lpo = String.isSubstring lpoN ord in
blanchet@47055
   662
        {is_lpo = is_lpo,
blanchet@47055
   663
         gen_weights = not is_lpo andalso String.isSubstring xweightsN ord,
blanchet@47055
   664
         gen_prec = String.isSubstring xprecN ord,
blanchet@47055
   665
         gen_simp = String.isSubstring xsimpN ord}
blanchet@47055
   666
      end
blanchet@47055
   667
  end
blanchet@47055
   668
blanchet@47606
   669
(* All (name, config) entries, local and remote, that setup registers. *)
val atps=
blanchet@47949
   670
  [alt_ergo, e, leo2, dummy_thf, satallax, spass, vampire, z3_tptp, remote_e,
blanchet@47949
   671
   remote_e_sine, remote_e_tofof, remote_iprover, remote_iprover_eq,
blanchet@47949
   672
   remote_leo2, remote_satallax, remote_vampire, remote_z3_tptp, remote_snark,
blanchet@47949
   673
   remote_waldmeister]
blanchet@47055
   674
blanchet@47606
   675
(* Theory setup: registers every entry of atps via add_atp, so a duplicate
   name in the list raises the "Duplicate ATP" error. *)
val setup = fold add_atp atps
blanchet@35867
   676
wenzelm@28592
   677
end;