src/HOL/Tools/ATP/atp_systems.ML
author blanchet
Tue Feb 14 20:13:07 2012 +0100 (2012-02-14)
changeset 46481 c7c85ff6de2a
parent 46480 24990fae5f92
child 46643 a88bccd2b567
permissions -rw-r--r--
don't report spurious LEO-II errors
blanchet@38047
     1
(*  Title:      HOL/Tools/ATP/atp_systems.ML
wenzelm@28592
     2
    Author:     Fabian Immler, TU Muenchen
blanchet@36371
     3
    Author:     Jasmin Blanchette, TU Muenchen
wenzelm@28592
     4
blanchet@36376
     5
Setup for supported ATPs.
wenzelm@28592
     6
*)
wenzelm@28592
     7
blanchet@36376
     8
signature ATP_SYSTEMS =
wenzelm@28592
     9
sig
blanchet@45301
    10
  type atp_format = ATP_Problem.atp_format
blanchet@42577
    11
  type formula_kind = ATP_Problem.formula_kind
blanchet@39491
    12
  type failure = ATP_Proof.failure
blanchet@38023
    13
blanchet@46409
    14
  type slice_spec = int * atp_format * string * string * bool
blanchet@40059
    15
  type atp_config =
blanchet@42578
    16
    {exec : string * string,
blanchet@42578
    17
     required_execs : (string * string) list,
blanchet@42646
    18
     arguments :
blanchet@43473
    19
       Proof.context -> bool -> string -> Time.time
blanchet@43354
    20
       -> (unit -> (string * real) list) -> string,
blanchet@42578
    21
     proof_delims : (string * string) list,
blanchet@42578
    22
     known_failures : (failure * string) list,
blanchet@42709
    23
     conj_sym_kind : formula_kind,
blanchet@42709
    24
     prem_kind : formula_kind,
blanchet@43473
    25
     best_slices :
blanchet@46409
    26
       Proof.context -> (real * (bool * (slice_spec * string))) list}
blanchet@38023
    27
blanchet@44099
    28
  val force_sos : bool Config.T
blanchet@43566
    29
  val e_smartN : string
blanchet@43566
    30
  val e_autoN : string
blanchet@43566
    31
  val e_fun_weightN : string
blanchet@43566
    32
  val e_sym_offset_weightN : string
blanchet@42646
    33
  val e_weight_method : string Config.T
blanchet@42646
    34
  val e_default_fun_weight : real Config.T
blanchet@42646
    35
  val e_fun_weight_base : real Config.T
blanchet@42646
    36
  val e_fun_weight_span : real Config.T
blanchet@42646
    37
  val e_default_sym_offs_weight : real Config.T
blanchet@42646
    38
  val e_sym_offs_weight_base : real Config.T
blanchet@42646
    39
  val e_sym_offs_weight_span : real Config.T
blanchet@40059
    40
  val eN : string
blanchet@44590
    41
  val e_sineN : string
blanchet@44590
    42
  val e_tofofN : string
blanchet@45338
    43
  val iproverN : string
blanchet@45338
    44
  val iprover_eqN : string
blanchet@44590
    45
  val leo2N : string
blanchet@45365
    46
  val dummy_tff1N : string
blanchet@45365
    47
  val dummy_thfN : string
blanchet@44590
    48
  val satallaxN : string
blanchet@44590
    49
  val snarkN : string
blanchet@40059
    50
  val spassN : string
blanchet@45301
    51
  val spass_newN : string
blanchet@40059
    52
  val vampireN : string
blanchet@42938
    53
  val waldmeisterN : string
blanchet@44423
    54
  val z3_tptpN : string
blanchet@40060
    55
  val remote_prefix : string
blanchet@41738
    56
  val remote_atp :
blanchet@41738
    57
    string -> string -> string list -> (string * string) list
blanchet@44416
    58
    -> (failure * string) list -> formula_kind -> formula_kind
blanchet@46409
    59
    -> (Proof.context -> slice_spec) -> string * atp_config
blanchet@40059
    60
  val add_atp : string * atp_config -> theory -> theory
blanchet@40059
    61
  val get_atp : theory -> string -> atp_config
blanchet@41727
    62
  val supported_atps : theory -> string list
blanchet@40059
    63
  val is_atp_installed : theory -> string -> bool
blanchet@35867
    64
  val refresh_systems_on_tptp : unit -> unit
blanchet@35867
    65
  val setup : theory -> theory
wenzelm@28592
    66
end;
wenzelm@28592
    67
blanchet@36376
    68
structure ATP_Systems : ATP_SYSTEMS =
wenzelm@28592
    69
struct
wenzelm@28596
    70
blanchet@42577
    71
open ATP_Problem
blanchet@39491
    72
open ATP_Proof
blanchet@46320
    73
open ATP_Problem_Generate
boehmes@32864
    74
blanchet@40059
    75
(* ATP configuration *)
boehmes@32864
    76
blanchet@46409
    77
type slice_spec = int * atp_format * string * string * bool
blanchet@46409
    78
blanchet@40059
    79
type atp_config =
blanchet@42578
    80
  {exec : string * string,
blanchet@42578
    81
   required_execs : (string * string) list,
blanchet@42646
    82
   arguments :
blanchet@43473
    83
     Proof.context -> bool -> string -> Time.time
blanchet@43473
    84
     -> (unit -> (string * real) list) -> string,
blanchet@42578
    85
   proof_delims : (string * string) list,
blanchet@42578
    86
   known_failures : (failure * string) list,
blanchet@42709
    87
   conj_sym_kind : formula_kind,
blanchet@42709
    88
   prem_kind : formula_kind,
blanchet@46409
    89
   best_slices : Proof.context -> (real * (bool * (slice_spec * string))) list}
wenzelm@28596
    90
blanchet@42723
    91
(* "best_slices" must be found empirically, taking a holistic approach since
blanchet@46407
    92
   the ATPs are run in parallel. The "real" component gives the fraction of the
blanchet@46409
    93
   time available given to the slice and should add up to 1.0. The first "bool"
blanchet@42723
    94
   component indicates whether the slice's strategy is complete; the "int", the
blanchet@43569
    95
   preferred number of facts to pass; the first "string", the preferred type
blanchet@45521
    96
   system (which should be sound or quasi-sound); the second "string", the
blanchet@46409
    97
   preferred lambda translation scheme; the second "bool", whether uncurried
blanchet@46409
    98
   aliases should be generated; the third "string", extra information for
blanchet@45521
    99
   the prover (e.g., SOS or no SOS).
blanchet@42723
   100
blanchet@42723
   101
   The last slice should be the most "normal" one, because it will get all the
blanchet@43569
   102
   time available if the other slices fail early and also because it is used if
blanchet@43569
   103
   slicing is disabled (e.g., by the minimizer). *)
blanchet@42710
   104
blanchet@38061
   105
val known_perl_failures =
blanchet@38094
   106
  [(CantConnect, "HTTP error"),
blanchet@38094
   107
   (NoPerl, "env: perl"),
blanchet@38065
   108
   (NoLibwwwPerl, "Can't locate HTTP")]
wenzelm@28596
   109
blanchet@45203
   110
fun known_szs_failures wrap =
blanchet@45203
   111
  [(Unprovable, wrap "CounterSatisfiable"),
blanchet@45203
   112
   (Unprovable, wrap "Satisfiable"),
blanchet@45203
   113
   (GaveUp, wrap "GaveUp"),
blanchet@45203
   114
   (GaveUp, wrap "Unknown"),
blanchet@45203
   115
   (GaveUp, wrap "Incomplete"),
blanchet@45203
   116
   (ProofMissing, wrap "Theorem"),
blanchet@45203
   117
   (ProofMissing, wrap "Unsatisfiable"),
blanchet@45203
   118
   (TimedOut, wrap "Timeout"),
blanchet@45203
   119
   (Inappropriate, wrap "Inappropriate"),
blanchet@45203
   120
   (OutOfResources, wrap "ResourceOut"),
blanchet@45203
   121
   (OutOfResources, wrap "MemoryOut"),
blanchet@45203
   122
   (Interrupted, wrap "Forced"),
blanchet@45203
   123
   (Interrupted, wrap "User")]
blanchet@45203
   124
blanchet@45203
   125
val known_szs_status_failures = known_szs_failures (prefix "SZS status ")
blanchet@45203
   126
val known_says_failures = known_szs_failures (prefix " says ")
blanchet@45203
   127
blanchet@40059
   128
(* named ATPs *)
blanchet@40059
   129
blanchet@40059
   130
val eN = "e"
blanchet@44590
   131
val e_sineN = "e_sine"
blanchet@44590
   132
val e_tofofN = "e_tofof"
blanchet@45338
   133
val iproverN = "iprover"
blanchet@45338
   134
val iprover_eqN = "iprover_eq"
blanchet@44099
   135
val leo2N = "leo2"
blanchet@45365
   136
val dummy_tff1N = "dummy_tff1" (* experimental *)
blanchet@45365
   137
val dummy_thfN = "dummy_thf" (* experimental *)
blanchet@44099
   138
val satallaxN = "satallax"
blanchet@44590
   139
val snarkN = "snark"
blanchet@40059
   140
val spassN = "spass"
blanchet@45365
   141
val spass_newN = "spass_new" (* experimental *)
blanchet@40059
   142
val vampireN = "vampire"
blanchet@44590
   143
val waldmeisterN = "waldmeister"
blanchet@44423
   144
val z3_tptpN = "z3_tptp"
blanchet@40060
   145
val remote_prefix = "remote_"
blanchet@38001
   146
blanchet@38023
   147
structure Data = Theory_Data
blanchet@38023
   148
(
blanchet@40059
   149
  type T = (atp_config * stamp) Symtab.table
blanchet@38023
   150
  val empty = Symtab.empty
blanchet@38023
   151
  val extend = I
blanchet@46407
   152
  fun merge data : T =
blanchet@46407
   153
    Symtab.merge (eq_snd (op =)) data
blanchet@38023
   154
    handle Symtab.DUP name => error ("Duplicate ATP: " ^ quote name ^ ".")
blanchet@38023
   155
)
blanchet@38017
   156
blanchet@43981
   157
(* Converts "time" to whole seconds, rounding any partial second up, and
   never returns less than "min". *)
fun to_secs min time =
  let
    val millis = Time.toMilliseconds time
    val secs_rounded_up = (millis + 999) div 1000
  in
    Int.max (min, secs_rounded_up)
  end
blanchet@36142
   158
blanchet@43473
   159
val sosN = "sos"
blanchet@43473
   160
val no_sosN = "no_sos"
blanchet@43473
   161
blanchet@44099
   162
val force_sos = Attrib.setup_config_bool @{binding atp_force_sos} (K false)
blanchet@44099
   163
blanchet@39491
   164
blanchet@40059
   165
(* E *)
wenzelm@28596
   166
blanchet@44420
   167
(* E counts as "old" when the E_VERSION setting compares LESS than "1.2w"
   under string_ord. *)
fun is_old_e_version () =
  case string_ord (getenv "E_VERSION", "1.2w") of
    LESS => true
  | _ => false
blanchet@44420
   168
blanchet@36369
   169
val tstp_proof_delims =
blanchet@42962
   170
  [("# SZS output start CNFRefutation.", "# SZS output end CNFRefutation"),
blanchet@42962
   171
   ("% SZS output start CNFRefutation", "% SZS output end CNFRefutation")]
blanchet@36369
   172
blanchet@43473
   173
val e_smartN = "smart"
blanchet@42646
   174
val e_autoN = "auto"
blanchet@42646
   175
val e_fun_weightN = "fun_weight"
blanchet@42646
   176
val e_sym_offset_weightN = "sym_offset_weight"
blanchet@41725
   177
blanchet@42646
   178
val e_weight_method =
blanchet@43473
   179
  Attrib.setup_config_string @{binding atp_e_weight_method} (K e_smartN)
blanchet@41770
   180
(* FUDGE *)
blanchet@42646
   181
val e_default_fun_weight =
blanchet@42646
   182
  Attrib.setup_config_real @{binding atp_e_default_fun_weight} (K 20.0)
blanchet@42646
   183
val e_fun_weight_base =
blanchet@42646
   184
  Attrib.setup_config_real @{binding atp_e_fun_weight_base} (K 0.0)
blanchet@42646
   185
val e_fun_weight_span =
blanchet@42646
   186
  Attrib.setup_config_real @{binding atp_e_fun_weight_span} (K 40.0)
blanchet@42646
   187
val e_default_sym_offs_weight =
blanchet@42646
   188
  Attrib.setup_config_real @{binding atp_e_default_sym_offs_weight} (K 1.0)
blanchet@42646
   189
val e_sym_offs_weight_base =
blanchet@42646
   190
  Attrib.setup_config_real @{binding atp_e_sym_offs_weight_base} (K ~20.0)
blanchet@42646
   191
val e_sym_offs_weight_span =
blanchet@42646
   192
  Attrib.setup_config_real @{binding atp_e_sym_offs_weight_span} (K 60.0)
blanchet@41725
   193
blanchet@42443
   194
(* Chooses between two alternatives according to the E weight method name:
   yields "fw" when the method is e_fun_weightN and "sow" when it is
   e_sym_offset_weightN. Any other method name raises Fail. *)
fun e_weight_method_case method fw sow =
blanchet@42646
   195
  if method = e_fun_weightN then fw
blanchet@42646
   196
  else if method = e_sym_offset_weightN then sow
blanchet@43478
   197
  else raise Fail ("unexpected " ^ quote method)
blanchet@41725
   198
blanchet@42646
   199
(* Rescales the weight "w" to "w * span + base", where span and base are the
   configuration options selected for "method" via e_weight_method_case. The
   result is rounded up with Real.ceil and rendered with
   signed_string_of_int. *)
fun scaled_e_weight ctxt method w =
blanchet@42646
   200
  w * Config.get ctxt
blanchet@42646
   201
          (e_weight_method_case method e_fun_weight_span e_sym_offs_weight_span)
blanchet@42646
   202
  + Config.get ctxt
blanchet@42646
   203
        (e_weight_method_case method e_fun_weight_base e_sym_offs_weight_base)
blanchet@41725
   204
  |> Real.ceil |> signed_string_of_int
blanchet@41313
   205
blanchet@42646
   206
fun e_weight_arguments ctxt method weights =
blanchet@42646
   207
  if method = e_autoN then
blanchet@41725
   208
    "-xAutoDev"
blanchet@41725
   209
  else
blanchet@43622
   210
    (* supplied by Stephan Schulz *)
blanchet@41314
   211
    "--split-clauses=4 --split-reuse-defs --simul-paramod --forward-context-sr \
blanchet@41314
   212
    \--destructive-er-aggressive --destructive-er --presat-simplify \
blanchet@41314
   213
    \--prefer-initial-clauses -tKBO6 -winvfreqrank -c1 -Ginvfreqconjmax -F1 \
blanchet@41314
   214
    \--delete-bad-limit=150000000 -WSelectMaxLComplexAvoidPosPred \
blanchet@42443
   215
    \-H'(4*" ^ e_weight_method_case method "FunWeight" "SymOffsetWeight" ^
blanchet@41725
   216
    "(SimulateSOS, " ^
blanchet@42646
   217
    (e_weight_method_case method e_default_fun_weight e_default_sym_offs_weight
blanchet@42646
   218
     |> Config.get ctxt |> Real.ceil |> signed_string_of_int) ^
blanchet@41314
   219
    ",20,1.5,1.5,1" ^
blanchet@42646
   220
    (weights ()
blanchet@42646
   221
     |> map (fn (s, w) => "," ^ s ^ ":" ^ scaled_e_weight ctxt method w)
blanchet@42646
   222
     |> implode) ^
blanchet@41314
   223
    "),3*ConjectureGeneralSymbolWeight(PreferNonGoals,200,100,200,50,50,1,100,\
blanchet@41314
   224
    \1.5,1.5,1),1*Clauseweight(PreferProcessed,1,1,1),1*\
blanchet@41314
   225
    \FIFOWeight(PreferProcessed))'"
blanchet@41313
   226
blanchet@42646
   227
fun effective_e_weight_method ctxt =
blanchet@42646
   228
  if is_old_e_version () then e_autoN else Config.get ctxt e_weight_method
blanchet@42443
   229
blanchet@40059
   230
val e_config : atp_config =
blanchet@38092
   231
  {exec = ("E_HOME", "eproof"),
blanchet@38092
   232
   required_execs = [],
blanchet@43354
   233
   arguments =
blanchet@43567
   234
     fn ctxt => fn _ => fn method => fn timeout => fn weights =>
blanchet@43473
   235
        "--tstp-in --tstp-out -l5 " ^ e_weight_arguments ctxt method weights ^
blanchet@43981
   236
        " -tAutoDev --silent --cpu-limit=" ^ string_of_int (to_secs 2 timeout),
blanchet@42962
   237
   proof_delims = tstp_proof_delims,
blanchet@36265
   238
   known_failures =
blanchet@45203
   239
     known_szs_status_failures @
blanchet@45203
   240
     [(TimedOut, "Failure: Resource limit exceeded (time)"),
blanchet@36370
   241
      (TimedOut, "time limit exceeded"),
blanchet@45203
   242
      (OutOfResources, "# Cannot determine problem status")],
blanchet@43466
   243
   conj_sym_kind = Hypothesis,
blanchet@42709
   244
   prem_kind = Conjecture,
blanchet@42646
   245
   best_slices = fn ctxt =>
blanchet@43473
   246
     let val method = effective_e_weight_method ctxt in
blanchet@43474
   247
       (* FUDGE *)
blanchet@43473
   248
       if method = e_smartN then
blanchet@46449
   249
         [(0.333, (true, ((500, FOF, "mono_tags??", combsN, false), e_fun_weightN))),
blanchet@46449
   250
          (0.334, (true, ((50, FOF, "mono_guards??", combsN, false), e_fun_weightN))),
blanchet@46449
   251
          (0.333, (true, ((1000, FOF, "mono_tags??", combsN, false), e_sym_offset_weightN)))]
blanchet@43473
   252
       else
blanchet@46409
   253
         [(1.0, (true, ((500, FOF, "mono_tags??", combsN, false), method)))]
blanchet@43473
   254
     end}
blanchet@38454
   255
blanchet@40059
   256
val e = (eN, e_config)
wenzelm@28596
   257
wenzelm@28596
   258
blanchet@44099
   259
(* LEO-II *)
blanchet@44099
   260
blanchet@44754
   261
val leo2_thf0 = THF (TPTP_Monomorphic, TPTP_Explicit, THF_Without_Choice)
blanchet@44754
   262
blanchet@44099
   263
val leo2_config : atp_config =
blanchet@44099
   264
  {exec = ("LEO2_HOME", "leo"),
blanchet@44099
   265
   required_execs = [],
blanchet@44099
   266
   arguments =
blanchet@44099
   267
     fn _ => fn _ => fn sos => fn timeout => fn _ =>
blanchet@45300
   268
        "--proofoutput 1 --timeout " ^ string_of_int (to_secs 1 timeout)
blanchet@44099
   269
        |> sos = sosN ? prefix "--sos ",
blanchet@44099
   270
   proof_delims = tstp_proof_delims,
blanchet@45207
   271
   known_failures =
blanchet@45207
   272
     known_szs_status_failures @
blanchet@46481
   273
     [(TimedOut, "CPU time limit exceeded, terminating"),
blanchet@46481
   274
      (GaveUp, "No.of.Axioms")],
blanchet@44099
   275
   conj_sym_kind = Axiom,
blanchet@44099
   276
   prem_kind = Hypothesis,
blanchet@44099
   277
   best_slices = fn ctxt =>
blanchet@44099
   278
     (* FUDGE *)
blanchet@46449
   279
     [(0.667, (false, ((150, leo2_thf0, "mono_native_higher", liftingN, false), sosN))),
blanchet@46449
   280
      (0.333, (true, ((50, leo2_thf0, "mono_native_higher", liftingN, false), no_sosN)))]
blanchet@44099
   281
     |> (if Config.get ctxt force_sos then hd #> apfst (K 1.0) #> single
blanchet@44099
   282
         else I)}
blanchet@39491
   283
blanchet@44099
   284
val leo2 = (leo2N, leo2_config)
blanchet@44099
   285
blanchet@44099
   286
blanchet@44099
   287
(* Satallax *)
blanchet@44099
   288
blanchet@44754
   289
val satallax_thf0 = THF (TPTP_Monomorphic, TPTP_Explicit, THF_With_Choice)
blanchet@44754
   290
blanchet@44099
   291
val satallax_config : atp_config =
blanchet@44099
   292
  {exec = ("SATALLAX_HOME", "satallax"),
blanchet@44099
   293
   required_execs = [],
blanchet@44099
   294
   arguments =
blanchet@44099
   295
     fn _ => fn _ => fn _ => fn timeout => fn _ =>
blanchet@45162
   296
        "-p hocore -t " ^ string_of_int (to_secs 1 timeout),
blanchet@45162
   297
   proof_delims =
blanchet@45162
   298
     [("% Higher-Order Unsat Core BEGIN", "% Higher-Order Unsat Core END")],
blanchet@45203
   299
   known_failures = known_szs_status_failures,
blanchet@44099
   300
   conj_sym_kind = Axiom,
blanchet@44099
   301
   prem_kind = Hypothesis,
blanchet@44416
   302
   best_slices =
blanchet@44754
   303
     (* FUDGE *)
blanchet@46449
   304
     K [(1.0, (true, ((100, satallax_thf0, "mono_native_higher", keep_lamsN, false), "")))]}
blanchet@44099
   305
blanchet@44099
   306
val satallax = (satallaxN, satallax_config)
blanchet@44099
   307
blanchet@44099
   308
blanchet@44099
   309
(* SPASS *)
blanchet@42725
   310
blanchet@36219
   311
(* The "-VarWeight=3" option helps the higher-order problems, probably by
blanchet@44450
   312
   counteracting the presence of explicit application operators. *)
blanchet@40059
   313
val spass_config : atp_config =
blanchet@38092
   314
  {exec = ("ISABELLE_ATP", "scripts/spass"),
blanchet@39002
   315
   required_execs = [("SPASS_HOME", "SPASS"), ("SPASS_HOME", "tptp2dfg")],
blanchet@43569
   316
   arguments = fn _ => fn _ => fn sos => fn timeout => fn _ =>
blanchet@37962
   317
     ("-Auto -PGiven=0 -PProblem=0 -Splits=0 -FullRed=0 -DocProof \
blanchet@43981
   318
      \-VarWeight=3 -TimeLimit=" ^ string_of_int (to_secs 1 timeout))
blanchet@43473
   319
     |> sos = sosN ? prefix "-SOS=1 ",
blanchet@36369
   320
   proof_delims = [("Here is a proof", "Formulae used in the proof")],
blanchet@36289
   321
   known_failures =
blanchet@38061
   322
     known_perl_failures @
blanchet@43050
   323
     [(GaveUp, "SPASS beiseite: Completion found"),
blanchet@36370
   324
      (TimedOut, "SPASS beiseite: Ran out of time"),
blanchet@36965
   325
      (OutOfResources, "SPASS beiseite: Maximal number of loops exceeded"),
blanchet@37413
   326
      (MalformedInput, "Undefined symbol"),
blanchet@37414
   327
      (MalformedInput, "Free Variable"),
blanchet@44391
   328
      (Unprovable, "No formulae and clauses found in input file"),
blanchet@39263
   329
      (InternalError, "Please report this error")],
blanchet@43466
   330
   conj_sym_kind = Hypothesis,
blanchet@42709
   331
   prem_kind = Conjecture,
blanchet@42725
   332
   best_slices = fn ctxt =>
blanchet@42723
   333
     (* FUDGE *)
blanchet@46449
   334
     [(0.333, (false, ((150, DFG DFG_Unsorted, "mono_tags??", liftingN, false), sosN))),
blanchet@46449
   335
      (0.333, (false, ((300, DFG DFG_Unsorted, "poly_tags??", liftingN, false), sosN))),
blanchet@46449
   336
      (0.334, (false, ((50, DFG DFG_Unsorted, "mono_tags??", liftingN, false), no_sosN)))]
blanchet@46449
   337
     |> (if Config.get ctxt force_sos then hd #> apfst (K 1.0) #> single else I)}
blanchet@38454
   338
blanchet@40059
   339
val spass = (spassN, spass_config)
wenzelm@28596
   340
blanchet@46449
   341
val spass_new_H2 = "-Heuristic=2"
blanchet@46455
   342
val spass_new_H2SOS = "-Heuristic=2 -SOS"
blanchet@46449
   343
val spass_new_Red2 = "-RFRew=2 -RBRew=2 -RTaut=2"
blanchet@46449
   344
val spass_new_Sorts0 = "-Sorts=0"
blanchet@46455
   345
val spass_new_H2NuVS0 = "-Heuristic=2 -RNuV=1 -Sorts=0"
blanchet@46455
   346
val spass_new_H2NuVS0Red2 =
blanchet@46455
   347
  "-Heuristic=2 -RNuV=1 -Sorts=0 -RFRew=2 -RBRew=2 -RTaut=2"
blanchet@46449
   348
blanchet@45301
   349
(* Experimental *)
blanchet@45301
   350
val spass_new_config : atp_config =
blanchet@46428
   351
  {exec = ("SPASS_NEW_HOME", "SPASS"),
blanchet@46428
   352
   required_execs = [],
blanchet@46444
   353
   arguments = fn _ => fn _ => fn extra_options => fn timeout => fn _ =>
blanchet@46429
   354
     ("-Isabelle=1 -TimeLimit=" ^ string_of_int (to_secs 1 timeout))
blanchet@46444
   355
     |> extra_options <> "" ? prefix (extra_options ^ " "),
blanchet@45301
   356
   proof_delims = #proof_delims spass_config,
blanchet@45301
   357
   known_failures = #known_failures spass_config,
blanchet@45301
   358
   conj_sym_kind = #conj_sym_kind spass_config,
blanchet@45301
   359
   prem_kind = #prem_kind spass_config,
blanchet@46381
   360
   best_slices = fn _ =>
blanchet@45301
   361
     (* FUDGE *)
blanchet@46455
   362
     [(0.1667, (false, ((150, DFG DFG_Sorted, "mono_native", combsN, true), ""))),
blanchet@46455
   363
      (0.1667, (false, ((500, DFG DFG_Sorted, "mono_native", liftingN, true), spass_new_H2SOS))),
blanchet@46455
   364
      (0.1666, (false, ((50, DFG DFG_Sorted,  "mono_native", liftingN, true), spass_new_H2))),
blanchet@46455
   365
      (0.1000, (false, ((250, DFG DFG_Sorted, "mono_native", combsN, true), spass_new_H2NuVS0))),
blanchet@46455
   366
      (0.1000, (false, ((100, DFG DFG_Sorted, "mono_native", combs_and_liftingN, true), spass_new_H2NuVS0))),
blanchet@46455
   367
      (0.1000, (false, ((300, DFG DFG_Sorted, "mono_native", combsN, true), spass_new_H2SOS))),
blanchet@46455
   368
      (0.1000, (false, ((150, DFG DFG_Sorted, "poly_guards??", liftingN, false), spass_new_H2NuVS0Red2))),
blanchet@46455
   369
      (0.1000, (false, ((400, DFG DFG_Sorted, "mono_native", liftingN, true), spass_new_H2)))]}
blanchet@45301
   370
blanchet@45301
   371
val spass_new = (spass_newN, spass_new_config)
blanchet@45301
   372
blanchet@38454
   373
blanchet@37509
   374
(* Vampire *)
blanchet@37509
   375
blanchet@44507
   376
(* Vampire 1.8 has TFF support, but it's buggy and therefore disabled on
blanchet@44507
   377
   SystemOnTPTP. *)
blanchet@44420
   378
(* True unless the VAMPIRE_VERSION setting compares GREATER than "1.8" under
   string_ord; version "1.8" itself therefore counts as old.
   NOTE(review): this is a string comparison, presumably not a numeric one --
   confirm how versions such as "1.10" are meant to be classified. *)
fun is_old_vampire_version () =
blanchet@44507
   379
  string_ord (getenv "VAMPIRE_VERSION", "1.8") <> GREATER
blanchet@44420
   380
blanchet@44754
   381
val vampire_tff0 = TFF (TPTP_Monomorphic, TPTP_Implicit)
blanchet@44589
   382
blanchet@40059
   383
val vampire_config : atp_config =
blanchet@38092
   384
  {exec = ("VAMPIRE_HOME", "vampire"),
blanchet@38092
   385
   required_execs = [],
blanchet@43569
   386
   arguments = fn _ => fn _ => fn sos => fn timeout => fn _ =>
blanchet@44417
   387
     "--mode casc -t " ^ string_of_int (to_secs 1 timeout) ^
blanchet@45234
   388
     " --proof tptp --output_axiom_names on\
blanchet@45234
   389
     \ --forced_options propositional_to_bdd=off\
blanchet@44417
   390
     \ --thanks \"Andrei and Krystof\" --input_file"
blanchet@43473
   391
     |> sos = sosN ? prefix "--sos on ",
blanchet@37509
   392
   proof_delims =
blanchet@37509
   393
     [("=========== Refutation ==========",
blanchet@37509
   394
       "======= End of refutation ======="),
blanchet@38033
   395
      ("% SZS output start Refutation", "% SZS output end Refutation"),
blanchet@38033
   396
      ("% SZS output start Proof", "% SZS output end Proof")],
blanchet@37509
   397
   known_failures =
blanchet@45203
   398
     known_szs_status_failures @
blanchet@43050
   399
     [(GaveUp, "UNPROVABLE"),
blanchet@43050
   400
      (GaveUp, "CANNOT PROVE"),
blanchet@37509
   401
      (Unprovable, "Satisfiability detected"),
blanchet@38647
   402
      (Unprovable, "Termination reason: Satisfiable"),
blanchet@39263
   403
      (Interrupted, "Aborted by signal SIGINT")],
blanchet@43466
   404
   conj_sym_kind = Conjecture,
blanchet@42709
   405
   prem_kind = Conjecture,
blanchet@42725
   406
   best_slices = fn ctxt =>
blanchet@42723
   407
     (* FUDGE *)
blanchet@44420
   408
     (if is_old_vampire_version () then
blanchet@46449
   409
        [(0.333, (false, ((150, FOF, "poly_guards??", combs_or_liftingN, false), sosN))),
blanchet@46449
   410
         (0.333, (false, ((500, FOF, "mono_tags??", combs_or_liftingN, false), sosN))),
blanchet@46449
   411
         (0.334, (true, ((50, FOF, "mono_guards??", combs_or_liftingN, false), no_sosN)))]
blanchet@44420
   412
      else
blanchet@46449
   413
        [(0.333, (false, ((150, vampire_tff0, "poly_guards??", combs_or_liftingN, false), sosN))),
blanchet@46449
   414
         (0.333, (false, ((500, vampire_tff0, "mono_native", combs_or_liftingN, false), sosN))),
blanchet@46449
   415
         (0.334, (true, ((50, vampire_tff0, "mono_native", combs_or_liftingN, false), no_sosN)))])
blanchet@44099
   416
     |> (if Config.get ctxt force_sos then hd #> apfst (K 1.0) #> single
blanchet@42725
   417
         else I)}
blanchet@38454
   418
blanchet@40059
   419
val vampire = (vampireN, vampire_config)
blanchet@37509
   420
blanchet@38454
   421
blanchet@41740
   422
(* Z3 with TPTP syntax *)
blanchet@41740
   423
blanchet@44754
   424
val z3_tff0 = TFF (TPTP_Monomorphic, TPTP_Implicit)
blanchet@44589
   425
blanchet@44423
   426
val z3_tptp_config : atp_config =
blanchet@41740
   427
  {exec = ("Z3_HOME", "z3"),
blanchet@41740
   428
   required_execs = [],
blanchet@43354
   429
   arguments = fn _ => fn _ => fn _ => fn timeout => fn _ =>
blanchet@44420
   430
     "MBQI=true -tptp -t:" ^ string_of_int (to_secs 1 timeout),
blanchet@41740
   431
   proof_delims = [],
blanchet@45203
   432
   known_failures = known_szs_status_failures,
blanchet@42709
   433
   conj_sym_kind = Hypothesis,
blanchet@42709
   434
   prem_kind = Hypothesis,
blanchet@42723
   435
   best_slices =
blanchet@44423
   436
     (* FUDGE *)
blanchet@46435
   437
     K [(0.5, (false, ((250, z3_tff0, "mono_native", combsN, false), ""))),
blanchet@46435
   438
        (0.25, (false, ((125, z3_tff0, "mono_native", combsN, false), ""))),
blanchet@46435
   439
        (0.125, (false, ((62, z3_tff0, "mono_native", combsN, false), ""))),
blanchet@46435
   440
        (0.125, (false, ((31, z3_tff0, "mono_native", combsN, false), "")))]}
blanchet@41740
   441
blanchet@44423
   442
val z3_tptp = (z3_tptpN, z3_tptp_config)
blanchet@41740
   443
blanchet@44590
   444
blanchet@44754
   445
(* Not really a prover: Experimental Polymorphic TFF and THF output *)
blanchet@44590
   446
blanchet@44754
   447
fun dummy_config format type_enc : atp_config =
blanchet@44596
   448
  {exec = ("ISABELLE_ATP", "scripts/dummy_atp"),
blanchet@44590
   449
   required_execs = [],
blanchet@44590
   450
   arguments = K (K (K (K (K "")))),
blanchet@44590
   451
   proof_delims = [],
blanchet@45203
   452
   known_failures = known_szs_status_failures,
blanchet@44590
   453
   conj_sym_kind = Hypothesis,
blanchet@44590
   454
   prem_kind = Hypothesis,
blanchet@45521
   455
   best_slices =
blanchet@46407
   456
     K [(1.0, (false, ((200, format, type_enc,
blanchet@46407
   457
                        if is_format_higher_order format then keep_lamsN
blanchet@46409
   458
                        else combsN, false), "")))]}
blanchet@44590
   459
blanchet@45365
   460
val dummy_tff1_format = TFF (TPTP_Polymorphic, TPTP_Explicit)
blanchet@46435
   461
val dummy_tff1_config = dummy_config dummy_tff1_format "poly_native"
blanchet@45365
   462
val dummy_tff1 = (dummy_tff1N, dummy_tff1_config)
blanchet@44590
   463
blanchet@45365
   464
val dummy_thf_format = THF (TPTP_Polymorphic, TPTP_Explicit, THF_With_Choice)
blanchet@46435
   465
val dummy_thf_config = dummy_config dummy_thf_format "poly_native_higher"
blanchet@45365
   466
val dummy_thf = (dummy_thfN, dummy_thf_config)
blanchet@44754
   467
blanchet@41740
   468
blanchet@40059
   469
(* Remote ATP invocation via SystemOnTPTP *)
wenzelm@28596
   470
blanchet@38061
   471
val systems = Synchronized.var "atp_systems" ([] : string list)
immler@31835
   472
immler@31835
   473
(* Runs the "remote_atp" script with "-w" (stderr merged into stdout). On
   exit code 0 the output is returned split into lines. On any other exit
   code an error is raised: the message of a matching entry in
   known_perl_failures if there is one, otherwise the script output
   (presumably with one trailing newline stripped) followed by ".". *)
fun get_systems () =
blanchet@44589
   474
  case Isabelle_System.bash_output
blanchet@44589
   475
           "\"$ISABELLE_ATP/scripts/remote_atp\" -w 2>&1" of
blanchet@39491
   476
    (output, 0) => split_lines output
blanchet@39491
   477
  | (output, _) =>
blanchet@39491
   478
    error (case extract_known_failure known_perl_failures output of
blanchet@41744
   479
             SOME failure => string_for_failure failure
blanchet@39491
   480
           | NONE => perhaps (try (unsuffix "\n")) output ^ ".")
immler@31835
   481
blanchet@42537
   482
(* Searches "systems" for an entry of the form "<name>---<version>...". The
   given versions are tried in list order and the first match wins. Once the
   version list is exhausted (or if it was empty), any entry starting with
   "<name>---" is accepted. Returns NONE if nothing matches. *)
fun find_system name [] systems =
blanchet@42537
   483
    find_first (String.isPrefix (name ^ "---")) systems
blanchet@38690
   484
  | find_system name (version :: versions) systems =
blanchet@38690
   485
    case find_first (String.isPrefix (name ^ "---" ^ version)) systems of
blanchet@38690
   486
      NONE => find_system name versions systems
blanchet@38690
   487
    | res => res
blanchet@38690
   488
blanchet@38690
   489
(* Looks up a system in the synchronized "systems" variable. If the stored
   list is empty it is obtained from get_systems (); otherwise the stored list
   is reused. As consumed by the_system, the result pairs the outcome of
   find_system with the list of systems that was searched.
   NOTE(review): the list is presumably written back to the variable by
   Synchronized.change_result, acting as a cache -- confirm. *)
fun get_system name versions =
blanchet@38589
   490
  Synchronized.change_result systems
blanchet@38589
   491
      (fn systems => (if null systems then get_systems () else systems)
blanchet@42955
   492
                     |> `(`(find_system name versions)))
boehmes@32864
   493
blanchet@38690
   494
(* Returns the SystemOnTPTP entry for "name" (preferring the given versions),
   or raises an error when none is found. The error message depends on the
   list returned alongside the failed lookup, after dropping lines that start
   with "%" and empty lines:
   - nothing left: SystemOnTPTP is reported as unavailable;
   - exactly one line left: that line is reported as the reason for
     unavailability;
   - several lines left: they are listed as the available systems. *)
fun the_system name versions =
blanchet@38690
   495
  case get_system name versions of
blanchet@42955
   496
    (SOME sys, _) => sys
blanchet@46480
   497
  | (NONE, []) => error ("SystemOnTPTP is not available.")
blanchet@42955
   498
  | (NONE, syss) =>
blanchet@46480
   499
    case syss |> filter_out (String.isPrefix "%")
blanchet@46480
   500
              |> filter_out (curry (op =) "") of
blanchet@46480
   501
      [] => error ("SystemOnTPTP is not available.")
blanchet@46480
   502
    | [msg] => error ("SystemOnTPTP is not available: " ^ msg ^ ".")
blanchet@46480
   503
    | syss =>
blanchet@46480
   504
      error ("System " ^ quote name ^ " is not available at SystemOnTPTP.\n" ^
blanchet@46480
   505
             "(Available systems: " ^ commas_quote syss ^ ".)")
immler@31835
   506
blanchet@41148
   507
val max_remote_secs = 240 (* give Geoff Sutcliffe's servers a break *)
blanchet@41148
   508
blanchet@38690
   509
fun remote_config system_name system_versions proof_delims known_failures
blanchet@44416
   510
                  conj_sym_kind prem_kind best_slice : atp_config =
blanchet@38092
   511
  {exec = ("ISABELLE_ATP", "scripts/remote_atp"),
blanchet@38092
   512
   required_execs = [],
blanchet@43354
   513
   arguments = fn _ => fn _ => fn _ => fn timeout => fn _ =>
blanchet@46409
   514
     "-t " ^ string_of_int (Int.min (max_remote_secs, to_secs 1 timeout)) ^
blanchet@46409
   515
     " -s " ^ the_system system_name system_versions,
blanchet@42962
   516
   proof_delims = union (op =) tstp_proof_delims proof_delims,
blanchet@45203
   517
   known_failures = known_failures @ known_perl_failures @ known_says_failures,
blanchet@42709
   518
   conj_sym_kind = conj_sym_kind,
blanchet@42709
   519
   prem_kind = prem_kind,
blanchet@46409
   520
   best_slices = fn ctxt => [(1.0, (false, (best_slice ctxt, "")))]}
blanchet@42443
   521
blanchet@43500
   522
fun remotify_config system_name system_versions best_slice
blanchet@44416
   523
        ({proof_delims, known_failures, conj_sym_kind, prem_kind, ...}
blanchet@43500
   524
         : atp_config) : atp_config =
blanchet@38690
   525
  remote_config system_name system_versions proof_delims known_failures
blanchet@44416
   526
                conj_sym_kind prem_kind best_slice
blanchet@38023
   527
blanchet@40059
   528
(* Returns a (name, config) pair for a remote-only prover: the name is
   prefixed with remote_prefix and the config is built by remote_config. *)
fun remote_atp name system_name system_versions proof_delims known_failures
               conj_sym_kind prem_kind best_slice =
  let
    val full_name = remote_prefix ^ name
    val config =
      remote_config system_name system_versions proof_delims known_failures
                    conj_sym_kind prem_kind best_slice
  in
    (full_name, config)
  end
blanchet@43500
   533
(* Turns an existing (name, config) prover entry into its remote variant:
   the name is prefixed with remote_prefix and the config is passed through
   remotify_config. *)
fun remotify_atp (name, config) system_name system_versions best_slice =
  let
    val full_name = remote_prefix ^ name
    val remote_cfg =
      remotify_config system_name system_versions best_slice config
  in
    (full_name, remote_cfg)
  end
wenzelm@28592
   536
blanchet@44754
   537
(* TFF format built from the TPTP_Monomorphic and TPTP_Explicit flavors; used
   below in the slices of remote_snark and remote_e_tofof. *)
val explicit_tff0 = TFF (TPTP_Monomorphic, TPTP_Explicit)
blanchet@44589
   538
blanchet@43500
   539
(* Remote variant of the "e" entry, requested as system "EP". *)
val remote_e =
  let
    (* FUDGE *)
    val slice = (750, FOF, "mono_tags??", combsN, false)
  in
    remotify_atp e "EP" ["1.0", "1.1", "1.2"] (K slice)
  end
blanchet@44099
   542
(* Remote variant of the "leo2" entry, requested as system "LEO-II". *)
val remote_leo2 =
  let
    (* FUDGE *)
    val slice = (100, leo2_thf0, "mono_native_higher", liftingN, false)
  in
    remotify_atp leo2 "LEO-II" ["1.2.8", "1.2.6"] (K slice)
  end
blanchet@44099
   545
(* Remote variant of the "satallax" entry, requested as system "Satallax". *)
val remote_satallax =
  let
    (* FUDGE *)
    val slice = (100, satallax_thf0, "mono_native_higher", keep_lamsN, false)
  in
    remotify_atp satallax "Satallax" ["2.1", "2.0", "2"] (K slice)
  end
blanchet@43500
   549
(* Remote variant of the "vampire" entry, requested as system "Vampire". *)
val remote_vampire =
  let
    (* FUDGE *)
    val slice = (250, FOF, "mono_guards??", combs_or_liftingN, false)
  in
    remotify_atp vampire "Vampire" ["1.8"] (K slice)
  end
blanchet@44423
   552
(* Remote variant of the "z3_tptp" entry, requested as system "Z3". *)
val remote_z3_tptp =
  let
    (* FUDGE *)
    val slice = (250, z3_tff0, "mono_native", combsN, false)
  in
    remotify_atp z3_tptp "Z3" ["3.0"] (K slice)
  end
blanchet@44092
   555
(* Remote-only entry for system "SInE"; reuses the known failures of
   e_config and adds no extra proof delimiters. *)
val remote_e_sine =
  let
    (* FUDGE *)
    val slice = (500, FOF, "mono_guards??", combsN, false)
    val failures = #known_failures e_config
  in
    remote_atp e_sineN "SInE" ["0.4"] [] failures Axiom Conjecture (K slice)
  end
blanchet@45338
   558
(* Remote-only entry for system "iProver"; no version list, no extra proof
   delimiters and no extra known failures are supplied. *)
val remote_iprover =
  let
    (* FUDGE *)
    val slice = (150, FOF, "mono_guards??", liftingN, false)
  in
    remote_atp iproverN "iProver" [] [] [] Axiom Conjecture (K slice)
  end
blanchet@45338
   561
(* Remote-only entry for system "iProver-Eq"; no version list, no extra proof
   delimiters and no extra known failures are supplied. *)
val remote_iprover_eq =
  let
    (* FUDGE *)
    val slice = (150, FOF, "mono_guards??", liftingN, false)
  in
    remote_atp iprover_eqN "iProver-Eq" [] [] [] Axiom Conjecture (K slice)
  end
blanchet@41740
   564
(* Remote-only entry for system "SNARK", with its own proof delimiters and
   no extra known failures. *)
val remote_snark =
  let
    (* FUDGE *)
    val slice = (100, explicit_tff0, "mono_native", liftingN, false)
    val versions = ["20080805r029", "20080805r024"]
    val delims = [("refutation.", "end_refutation.")]
  in
    remote_atp snarkN "SNARK" versions delims [] Hypothesis Hypothesis
               (K slice)
  end
blanchet@44092
   568
(* Remote-only entry for system "ToFoF"; reuses the known failures of
   e_config and adds no extra proof delimiters. *)
val remote_e_tofof =
  let
    (* FUDGE *)
    val slice = (150, explicit_tff0, "mono_native", liftingN, false)
    val failures = #known_failures e_config
  in
    remote_atp e_tofofN "ToFoF" ["0.1"] [] failures Axiom Hypothesis (K slice)
  end
blanchet@42938
   572
(* Remote-only entry for system "Waldmeister", with its own proof delimiters
   and two prover-specific failure messages. *)
val remote_waldmeister =
  let
    (* FUDGE *)
    val slice = (50, CNF_UEQ, "mono_tags??", combsN, false)
    val delims = [("#START OF PROOF", "Proved Goals:")]
    val failures =
      [(OutOfResources, "Too many function symbols"),
       (Crashed, "Unrecoverable Segmentation Fault")]
  in
    remote_atp waldmeisterN "Waldmeister" ["710"] delims failures
               Hypothesis Hypothesis (K slice)
  end
blanchet@38454
   579
blanchet@38454
   580
(* Setup *)
blanchet@38454
   581
blanchet@40059
   582
(* Registers an ATP configuration under the given name in the theory data,
   paired with a fresh stamp. Fails with a "Duplicate ATP" error if the name
   is already registered. *)
fun add_atp (name, config) thy =
  let
    val entry = (name, (config, stamp ()))
  in
    Data.map (Symtab.update_new entry) thy
    handle Symtab.DUP dup => error ("Duplicate ATP: " ^ quote dup ^ ".")
  end
blanchet@40059
   585
blanchet@40059
   586
(* Looks up the configuration registered under the given name in the theory
   data (dropping the stamp stored next to it). Fails with an "Unknown ATP"
   error if there is no such entry. *)
fun get_atp thy name =
  case Symtab.lookup (Data.get thy) name of
    SOME (config, _) => config
  | NONE => error ("Unknown ATP: " ^ name ^ ".")
blanchet@40059
   589
blanchet@41727
   590
(* Names of all ATPs registered in the theory data. *)
fun supported_atps thy = Symtab.keys (Data.get thy)
blanchet@36371
   591
blanchet@40059
   592
(* An ATP counts as installed when the environment variable named by the
   first component of its "exec" entry, and of each "required_execs" entry,
   has a non-empty value. *)
fun is_atp_installed thy name =
  let
    val {exec, required_execs, ...} = get_atp thy name
    fun has_env_var (var, _) = "" <> getenv var
  in
    forall has_env_var (exec :: required_execs)
  end
blanchet@36371
   596
blanchet@40059
   597
(* Replaces the contents of the synchronized "systems" variable with a fresh
   result of get_systems (), discarding the previous value. *)
fun refresh_systems_on_tptp () =
  let
    (* The old value is ignored; get_systems runs inside the change. *)
    fun reload _ = get_systems ()
  in
    Synchronized.change systems reload
  end
blanchet@40059
   599
blanchet@42962
   600
(* All ATP entries registered by "setup": first the entries without a remote
   counterpart prefix, then the remote ones, in registration order. *)
val atps =
  let
    val non_remote =
      [e, leo2, dummy_tff1, dummy_thf, satallax, spass, spass_new, vampire,
       z3_tptp]
    val remote =
      [remote_e, remote_e_sine, remote_e_tofof, remote_iprover,
       remote_iprover_eq, remote_leo2, remote_satallax, remote_vampire,
       remote_z3_tptp, remote_snark, remote_waldmeister]
  in
    non_remote @ remote
  end
blanchet@40059
   605
(* Theory setup: registers every entry of "atps" via add_atp. *)
fun setup thy = fold add_atp atps thy
blanchet@35867
   606
wenzelm@28592
   607
end;