src/HOL/Tools/ATP/atp_systems.ML
author blanchet
Fri Feb 03 18:00:55 2012 +0100 (2012-02-03)
changeset 46407 30e9720cc0b9
parent 46402 ef8d65f64f77
child 46409 d4754183ccce
permissions -rw-r--r--
optimization: slice caching in case two consecutive slices are nearly identical
blanchet@38047
     1
(*  Title:      HOL/Tools/ATP/atp_systems.ML
wenzelm@28592
     2
    Author:     Fabian Immler, TU Muenchen
blanchet@36371
     3
    Author:     Jasmin Blanchette, TU Muenchen
wenzelm@28592
     4
blanchet@36376
     5
Setup for supported ATPs.
wenzelm@28592
     6
*)
wenzelm@28592
     7
blanchet@36376
     8
(* Interface of the ATP setup module: the configuration record describing a
   prover, the E-specific tuning options, the names of the supported provers,
   and the operations that register and look up configurations in a theory. *)
signature ATP_SYSTEMS =
sig
  (* types re-exported from other ATP modules *)
  type atp_format = ATP_Problem.atp_format
  type formula_kind = ATP_Problem.formula_kind
  type failure = ATP_Proof.failure

  (* description of a single prover *)
  type atp_config =
    {exec : string * string,
     required_execs : (string * string) list,
     arguments :
       Proof.context -> bool -> string -> Time.time
       -> (unit -> (string * real) list) -> string,
     proof_delims : (string * string) list,
     known_failures : (failure * string) list,
     conj_sym_kind : formula_kind,
     prem_kind : formula_kind,
     best_slices :
       Proof.context
       -> (real * (bool * ((int * atp_format * string * string) * string)))
            list}

  (* general option *)
  val force_sos : bool Config.T

  (* E weight methods and their tuning options *)
  val e_smartN : string
  val e_autoN : string
  val e_fun_weightN : string
  val e_sym_offset_weightN : string
  val e_weight_method : string Config.T
  val e_default_fun_weight : real Config.T
  val e_fun_weight_base : real Config.T
  val e_fun_weight_span : real Config.T
  val e_default_sym_offs_weight : real Config.T
  val e_sym_offs_weight_base : real Config.T
  val e_sym_offs_weight_span : real Config.T

  (* SPASS slice marker *)
  val spass_incompleteN : string

  (* prover names *)
  val eN : string
  val e_sineN : string
  val e_tofofN : string
  val iproverN : string
  val iprover_eqN : string
  val leo2N : string
  val dummy_tff1N : string
  val dummy_thfN : string
  val satallaxN : string
  val snarkN : string
  val spassN : string
  val spass_newN : string
  val vampireN : string
  val waldmeisterN : string
  val z3_tptpN : string

  (* remote provers *)
  val remote_prefix : string
  val remote_atp :
    string -> string -> string list -> (string * string) list
    -> (failure * string) list -> formula_kind -> formula_kind
    -> (Proof.context -> int * atp_format * string * string)
    -> string * atp_config

  (* registry *)
  val add_atp : string * atp_config -> theory -> theory
  val get_atp : theory -> string -> atp_config
  val supported_atps : theory -> string list
  val is_atp_installed : theory -> string -> bool
  val refresh_systems_on_tptp : unit -> unit
  val setup : theory -> theory
end;
wenzelm@28592
    70
blanchet@36376
    71
structure ATP_Systems : ATP_SYSTEMS =
wenzelm@28592
    72
struct
wenzelm@28596
    73
blanchet@42577
    74
open ATP_Problem
blanchet@39491
    75
open ATP_Proof
blanchet@46320
    76
open ATP_Problem_Generate
boehmes@32864
    77
blanchet@40059
    78
(* ATP configuration *)
boehmes@32864
    79
blanchet@40059
    80
(* Static description of one prover. The layout of the "best_slices" entries
   is explained in the comment right after this type. *)
type atp_config =
  {(* main executable; in the configurations of this file the first component
      is the name of an environment variable (e.g. "E_HOME") and the second a
      path below it -- presumably resolved by the caller *)
   exec : string * string,
   (* further executables, in the same (variable, path) form *)
   required_execs : (string * string) list,
   (* builds the command-line arguments; the "string" argument receives the
      slice's extra information (weight method, SOS flag, ...), the
      "Time.time" argument the time limit *)
   arguments :
     Proof.context -> bool -> string -> Time.time
     -> (unit -> (string * real) list) -> string,
   (* (start, end) marker pairs enclosing the proof in the prover's output *)
   proof_delims : (string * string) list,
   (* failures paired with the output text that identifies them *)
   known_failures : (failure * string) list,
   conj_sym_kind : formula_kind,
   prem_kind : formula_kind,
   best_slices :
     Proof.context
     -> (real * (bool * ((int * atp_format * string * string) * string))) list}
wenzelm@28596
    93
blanchet@42723
    94
(* "best_slices" must be found empirically, taking a holistic approach since
blanchet@46407
    95
   the ATPs are run in parallel. The "real" component gives the fraction of the
blanchet@43569
    96
   time available given to the slice and should add up to 1.0. The "bool"
blanchet@42723
    97
   component indicates whether the slice's strategy is complete; the "int", the
blanchet@43569
    98
   preferred number of facts to pass; the first "string", the preferred type
blanchet@45521
    99
   system (which should be sound or quasi-sound); the second "string", the
blanchet@45521
   100
   preferred lambda translation scheme; the third "string", extra information to
blanchet@45521
   101
   the prover (e.g., SOS or no SOS).
blanchet@42723
   102
blanchet@42723
   103
   The last slice should be the most "normal" one, because it will get all the
blanchet@43569
   104
   time available if the other slices fail early and also because it is used if
blanchet@43569
   105
   slicing is disabled (e.g., by the minimizer). *)
blanchet@42710
   106
blanchet@38061
   107
(* Failures of the Perl-based helper scripts, each paired with the output text
   that identifies it. Used by the configurations that go through such a
   script and by "get_systems". *)
val known_perl_failures =
  [(CantConnect, "HTTP error"),
   (NoPerl, "env: perl"),
   (NoLibwwwPerl, "Can't locate HTTP")]
wenzelm@28596
   111
blanchet@45203
   112
(* Table of failures that are reported through an SZS status word. "wrap"
   turns the bare status word (e.g. "Timeout") into the text that is searched
   for in the prover output; the order of the entries is preserved. *)
fun known_szs_failures wrap =
  map (apsnd wrap)
    [(Unprovable, "CounterSatisfiable"),
     (Unprovable, "Satisfiable"),
     (GaveUp, "GaveUp"),
     (GaveUp, "Unknown"),
     (GaveUp, "Incomplete"),
     (ProofMissing, "Theorem"),
     (ProofMissing, "Unsatisfiable"),
     (TimedOut, "Timeout"),
     (Inappropriate, "Inappropriate"),
     (OutOfResources, "ResourceOut"),
     (OutOfResources, "MemoryOut"),
     (Interrupted, "Forced"),
     (Interrupted, "User")]
blanchet@45203
   126
blanchet@45203
   127
(* SZS failures as they appear after the text "SZS status ". *)
val known_szs_status_failures =
  known_szs_failures (fn status => "SZS status " ^ status)
blanchet@45203
   128
(* SZS failures as they appear after the text " says "; used for the remote
   configurations. *)
val known_says_failures =
  known_szs_failures (fn status => " says " ^ status)
blanchet@45203
   129
blanchet@40059
   130
(* named ATPs *)
blanchet@40059
   131
blanchet@40059
   132
(* Names under which the provers are known. *)
val eN = "e"
val e_sineN = "e_sine"
val e_tofofN = "e_tofof"
val iproverN = "iprover"
val iprover_eqN = "iprover_eq"
val leo2N = "leo2"
val dummy_tff1N = "dummy_tff1" (* experimental *)
val dummy_thfN = "dummy_thf" (* experimental *)
val satallaxN = "satallax"
val snarkN = "snark"
val spassN = "spass"
val spass_newN = "spass_new" (* experimental *)
val vampireN = "vampire"
val waldmeisterN = "waldmeister"
val z3_tptpN = "z3_tptp"

(* Prepended to a prover name to form the name of its remote variant. *)
val remote_prefix = "remote_"
blanchet@38001
   148
blanchet@38023
   149
(* Theory data holding the registered provers: a table from prover name to its
   configuration, paired with a stamp. Merging two tables accepts an entry
   present on both sides only if the stamps coincide; otherwise it fails with
   a "Duplicate ATP" error. *)
structure Data = Theory_Data
(
  type T = (atp_config * stamp) Symtab.table
  val empty = Symtab.empty
  val extend = I
  fun merge (tabs : T * T) : T =
    Symtab.merge (fn ((_, stamp1), (_, stamp2)) => stamp1 = stamp2) tabs
    handle Symtab.DUP name => error ("Duplicate ATP: " ^ quote name ^ ".")
)
blanchet@38017
   158
blanchet@43981
   159
(* Converts "time" to whole seconds, rounding up, and never returns less than
   "min". *)
fun to_secs min time =
  let
    val secs_rounded_up = (Time.toMilliseconds time + 999) div 1000
  in
    Int.max (min, secs_rounded_up)
  end
blanchet@36142
   160
blanchet@43473
   161
(* Slice extra-information value that makes the "arguments" functions of
   LEO-II, SPASS and Vampire prepend their SOS option. *)
val sosN = "sos"
blanchet@43473
   162
(* Slice extra-information value for slices that run without the SOS option. *)
val no_sosN = "no_sos"
blanchet@43473
   163
blanchet@44099
   164
(* Boolean option "atp_force_sos" (default: false). When set, the LEO-II, SPASS
   and Vampire configurations keep only their first slice and give it the
   whole time. *)
val force_sos = Attrib.setup_config_bool @{binding atp_force_sos} (K false)
blanchet@44099
   165
blanchet@39491
   166
blanchet@40059
   167
(* E *)
wenzelm@28596
   168
blanchet@44420
   169
(* True iff the value of the E_VERSION setting compares as LESS than "1.2w"
   under "string_ord". NOTE(review): an unset variable presumably yields the
   empty string and hence counts as old -- confirm against "getenv". *)
fun is_old_e_version () =
  case string_ord (getenv "E_VERSION", "1.2w") of
    LESS => true
  | _ => false
blanchet@44420
   170
blanchet@36369
   171
(* (start, end) markers around a CNF refutation, in the "#" and the "%"
   comment variants. *)
val tstp_proof_delims =
  [("# SZS output start CNFRefutation.", "# SZS output end CNFRefutation"),
   ("% SZS output start CNFRefutation", "% SZS output end CNFRefutation")]
blanchet@36369
   174
blanchet@43473
   175
(* Names of the E weight methods. "smart" makes "best_slices" of E mix the
   "fun_weight" and "sym_offset_weight" methods; "auto" makes
   "e_weight_arguments" pass "-xAutoDev". *)
val e_smartN = "smart"
val e_autoN = "auto"
val e_fun_weightN = "fun_weight"
val e_sym_offset_weightN = "sym_offset_weight"

(* Option "atp_e_weight_method"; defaults to "smart". *)
val e_weight_method =
  Attrib.setup_config_string @{binding atp_e_weight_method} (K e_smartN)

(* FUDGE *)
(* Per-method default weight, and the base and span used by "scaled_e_weight"
   to map a symbol weight w to w * span + base. *)
val e_default_fun_weight =
  Attrib.setup_config_real @{binding atp_e_default_fun_weight} (K 20.0)
val e_fun_weight_base =
  Attrib.setup_config_real @{binding atp_e_fun_weight_base} (K 0.0)
val e_fun_weight_span =
  Attrib.setup_config_real @{binding atp_e_fun_weight_span} (K 40.0)
val e_default_sym_offs_weight =
  Attrib.setup_config_real @{binding atp_e_default_sym_offs_weight} (K 1.0)
val e_sym_offs_weight_base =
  Attrib.setup_config_real @{binding atp_e_sym_offs_weight_base} (K ~20.0)
val e_sym_offs_weight_span =
  Attrib.setup_config_real @{binding atp_e_sym_offs_weight_span} (K 60.0)
blanchet@41725
   195
blanchet@42443
   196
(* Selects "fw" for the "fun_weight" method and "sow" for the
   "sym_offset_weight" method; any other method name raises Fail. *)
fun e_weight_method_case method fw sow =
  case (method = e_fun_weightN, method = e_sym_offset_weightN) of
    (true, _) => fw
  | (false, true) => sow
  | (false, false) => raise Fail ("unexpected " ^ quote method)
blanchet@41725
   200
blanchet@42646
   201
(* Maps the weight "w" to w * span + base, using the span and base options of
   the given method, rounds the result up and renders it as a signed integer
   string. *)
fun scaled_e_weight ctxt method w =
  let
    val span =
      Config.get ctxt
        (e_weight_method_case method e_fun_weight_span e_sym_offs_weight_span)
    val base =
      Config.get ctxt
        (e_weight_method_case method e_fun_weight_base e_sym_offs_weight_base)
  in
    signed_string_of_int (Real.ceil (w * span + base))
  end
blanchet@41313
   207
blanchet@42646
   208
(* Heuristic-related part of E's command line. For the "auto" method this is
   just "-xAutoDev". Otherwise it is a fixed option string whose "-H" heuristic
   embeds the weight function of the method, the method's default weight and
   one ",symbol:weight" entry per pair returned by "weights ()". *)
fun e_weight_arguments ctxt method weights =
  if method = e_autoN then
    "-xAutoDev"
  else
    let
      val weight_fun = e_weight_method_case method "FunWeight" "SymOffsetWeight"
      val default_weight =
        e_weight_method_case method e_default_fun_weight
                             e_default_sym_offs_weight
        |> Config.get ctxt |> Real.ceil |> signed_string_of_int
      val symbol_weights =
        weights ()
        |> map (fn (s, w) => "," ^ s ^ ":" ^ scaled_e_weight ctxt method w)
        |> implode
    in
      (* supplied by Stephan Schulz *)
      "--split-clauses=4 --split-reuse-defs --simul-paramod --forward-context-sr \
      \--destructive-er-aggressive --destructive-er --presat-simplify \
      \--prefer-initial-clauses -tKBO6 -winvfreqrank -c1 -Ginvfreqconjmax -F1 \
      \--delete-bad-limit=150000000 -WSelectMaxLComplexAvoidPosPred \
      \-H'(4*" ^ weight_fun ^
      "(SimulateSOS, " ^
      default_weight ^
      ",20,1.5,1.5,1" ^
      symbol_weights ^
      "),3*ConjectureGeneralSymbolWeight(PreferNonGoals,200,100,200,50,50,1,100,\
      \1.5,1.5,1),1*Clauseweight(PreferProcessed,1,1,1),1*\
      \FIFOWeight(PreferProcessed))'"
    end
blanchet@41313
   228
blanchet@42646
   229
(* The weight method actually used: "auto" for old versions of E, otherwise
   the value of the "atp_e_weight_method" option. *)
fun effective_e_weight_method ctxt =
  case is_old_e_version () of
    true => e_autoN
  | false => Config.get ctxt e_weight_method
blanchet@42443
   231
blanchet@40059
   232
(* Configuration of E. The extra information of a slice is the weight method
   handed to "e_weight_arguments". *)
val e_config : atp_config =
  let
    (* TSTP input and output, the heuristic options, and a CPU limit of at
       least two seconds *)
    fun arguments ctxt _ method timeout weights =
      "--tstp-in --tstp-out -l5 " ^ e_weight_arguments ctxt method weights ^
      " -tAutoDev --silent --cpu-limit=" ^ string_of_int (to_secs 2 timeout)

    (* all E slices are complete, use FOF and the "combsN" lambda scheme *)
    fun slice fraction max_facts type_enc method =
      (fraction, (true, ((max_facts, FOF, type_enc, combsN), method)))

    (* FUDGE *)
    fun best_slices ctxt =
      let val method = effective_e_weight_method ctxt in
        if method = e_smartN then
          [slice 0.333 500 "mono_tags??" e_fun_weightN,
           slice 0.334 50 "mono_guards??" e_fun_weightN,
           slice 0.333 1000 "mono_tags??" e_sym_offset_weightN]
        else
          [slice 1.0 500 "mono_tags??" method]
      end
  in
    {exec = ("E_HOME", "eproof"),
     required_execs = [],
     arguments = arguments,
     proof_delims = tstp_proof_delims,
     known_failures =
       known_szs_status_failures @
       [(TimedOut, "Failure: Resource limit exceeded (time)"),
        (TimedOut, "time limit exceeded"),
        (OutOfResources, "# Cannot determine problem status")],
     conj_sym_kind = Hypothesis,
     prem_kind = Conjecture,
     best_slices = best_slices}
  end
blanchet@38454
   258
blanchet@40059
   259
(* Name/configuration pair for E, in the shape taken by "add_atp". *)
val e = (eN, e_config)
wenzelm@28596
   260
wenzelm@28596
   261
blanchet@44099
   262
(* LEO-II *)
blanchet@44099
   263
blanchet@44754
   264
(* THF format descriptor used by the LEO-II slices and by "remote_leo2". *)
val leo2_thf0 = THF (TPTP_Monomorphic, TPTP_Explicit, THF_Without_Choice)
blanchet@44754
   265
blanchet@44099
   266
(* Configuration of LEO-II. The extra information of a slice says whether
   "--sos" is passed. *)
val leo2_config : atp_config =
  let
    fun arguments _ _ sos timeout _ =
      let
        val base =
          "--proofoutput 1 --timeout " ^ string_of_int (to_secs 1 timeout)
      in
        if sos = sosN then "--sos " ^ base else base
      end

    fun slice fraction complete max_facts extra =
      (fraction,
       (complete,
        ((max_facts, leo2_thf0, "mono_simple_higher", liftingN), extra)))

    fun best_slices ctxt =
      let
        (* FUDGE *)
        val slices =
          [slice 0.667 false 150 sosN,
           slice 0.333 true 50 no_sosN]
      in
        (* with "atp_force_sos", only the first slice runs, for the whole time *)
        if Config.get ctxt force_sos then [(1.0, snd (hd slices))] else slices
      end
  in
    {exec = ("LEO2_HOME", "leo"),
     required_execs = [],
     arguments = arguments,
     proof_delims = tstp_proof_delims,
     known_failures =
       known_szs_status_failures @
       [(TimedOut, "CPU time limit exceeded, terminating")],
     conj_sym_kind = Axiom,
     prem_kind = Hypothesis,
     best_slices = best_slices}
  end
blanchet@39491
   287
blanchet@44099
   288
(* Name/configuration pair for LEO-II, in the shape taken by "add_atp". *)
val leo2 = (leo2N, leo2_config)
blanchet@44099
   289
blanchet@44099
   290
blanchet@44099
   291
(* Satallax *)
blanchet@44099
   292
blanchet@44754
   293
(* THF format descriptor used by the Satallax slice and by "remote_satallax". *)
val satallax_thf0 = THF (TPTP_Monomorphic, TPTP_Explicit, THF_With_Choice)
blanchet@44754
   294
blanchet@44099
   295
(* Configuration of Satallax: a single slice, and the proof is delimited by
   the "Higher-Order Unsat Core" markers. *)
val satallax_config : atp_config =
  let
    fun arguments _ _ _ timeout _ =
      "-p hocore -t " ^ string_of_int (to_secs 1 timeout)

    (* FUDGE *)
    val only_slice =
      (1.0, (true, ((100, satallax_thf0, "mono_simple_higher", keep_lamsN),
                    "")))
  in
    {exec = ("SATALLAX_HOME", "satallax"),
     required_execs = [],
     arguments = arguments,
     proof_delims =
       [("% Higher-Order Unsat Core BEGIN", "% Higher-Order Unsat Core END")],
     known_failures = known_szs_status_failures,
     conj_sym_kind = Axiom,
     prem_kind = Hypothesis,
     best_slices = K [only_slice]}
  end
blanchet@44099
   310
blanchet@44099
   311
(* Name/configuration pair for Satallax, in the shape taken by "add_atp". *)
val satallax = (satallaxN, satallax_config)
blanchet@44099
   312
blanchet@44099
   313
blanchet@44099
   314
(* SPASS *)
blanchet@42725
   315
blanchet@46380
   316
(* Slice extra-information value that makes "spass_new_config" add
   "-Splits=0 -FullRed=0" to the command line. *)
val spass_incompleteN = "incomplete"
blanchet@46380
   317
blanchet@36219
   318
(* The "-VarWeight=3" option helps the higher-order problems, probably by
blanchet@44450
   319
   counteracting the presence of explicit application operators. *)
blanchet@40059
   320
(* Configuration of SPASS, run through the "scripts/spass" wrapper. The extra
   information of a slice says whether "-SOS=1" is passed. *)
val spass_config : atp_config =
  let
    fun arguments _ _ sos timeout _ =
      let
        val base =
          "-Auto -PGiven=0 -PProblem=0 -Splits=0 -FullRed=0 -DocProof \
          \-VarWeight=3 -TimeLimit=" ^ string_of_int (to_secs 1 timeout)
      in
        if sos = sosN then "-SOS=1 " ^ base else base
      end

    (* every slice is marked incomplete and uses unsorted DFG with lifting *)
    fun slice fraction max_facts type_enc extra =
      (fraction,
       (false, ((max_facts, DFG DFG_Unsorted, type_enc, liftingN), extra)))

    fun best_slices ctxt =
      let
        (* FUDGE *)
        val slices =
          [slice 0.333 150 "mono_tags??" sosN,
           slice 0.333 300 "poly_tags??" sosN,
           slice 0.334 50 "mono_tags??" no_sosN]
      in
        (* with "atp_force_sos", only the first slice runs, for the whole time *)
        if Config.get ctxt force_sos then [(1.0, snd (hd slices))] else slices
      end
  in
    {exec = ("ISABELLE_ATP", "scripts/spass"),
     required_execs = [("SPASS_HOME", "SPASS"), ("SPASS_HOME", "tptp2dfg")],
     arguments = arguments,
     proof_delims = [("Here is a proof", "Formulae used in the proof")],
     known_failures =
       known_perl_failures @
       [(GaveUp, "SPASS beiseite: Completion found"),
        (TimedOut, "SPASS beiseite: Ran out of time"),
        (OutOfResources, "SPASS beiseite: Maximal number of loops exceeded"),
        (MalformedInput, "Undefined symbol"),
        (MalformedInput, "Free Variable"),
        (Unprovable, "No formulae and clauses found in input file"),
        (InternalError, "Please report this error")],
     conj_sym_kind = Hypothesis,
     prem_kind = Conjecture,
     best_slices = best_slices}
  end
blanchet@38454
   349
blanchet@40059
   350
(* Name/configuration pair for SPASS, in the shape taken by "add_atp". *)
val spass = (spassN, spass_config)
wenzelm@28596
   351
blanchet@46407
   352
(* The three problem setups (number of facts, format, type encoding, lambda
   scheme) used by the slices of the new SPASS. All use sorted DFG and the
   "mono_simple" encoding. *)
local
  fun sorted_dfg_slice max_facts lam_trans =
    (max_facts, DFG DFG_Sorted, "mono_simple", lam_trans)
in
val spass_new_macro_slice_1 = sorted_dfg_slice 300 combsN
val spass_new_macro_slice_2 = sorted_dfg_slice 50 combsN
val spass_new_macro_slice_3 = sorted_dfg_slice 150 liftingN
end
blanchet@46407
   355
blanchet@45301
   356
(* Experimental *)
blanchet@45301
   357
(* Configuration of the new (experimental) SPASS, run through the
   "scripts/spass_new" wrapper. Proof delimiters, known failures and formula
   kinds are shared with "spass_config". A slice whose extra information is
   "spass_incompleteN" gets "-Splits=0 -FullRed=0" prepended to its command
   line; the slices below all pass "" and therefore do not. *)
val spass_new_config : atp_config =
  {exec = ("ISABELLE_ATP", "scripts/spass_new"),
   required_execs =
     [("SPASS_NEW_HOME", "SPASS"), ("SPASS_NEW_HOME", "tptp2dfg")],
   arguments = fn _ => fn _ => fn incomplete => fn timeout => fn _ =>
     ("-Auto -LR=1 -LT=1 -Isabelle=1 -TimeLimit=" ^
      string_of_int (to_secs 1 timeout))
     |> incomplete = spass_incompleteN ? prefix "-Splits=0 -FullRed=0 ",
   proof_delims = #proof_delims spass_config,
   known_failures = #known_failures spass_config,
   conj_sym_kind = #conj_sym_kind spass_config,
   prem_kind = #prem_kind spass_config,
   best_slices = fn _ =>
     (* FUDGE *)
     (* The time fractions must add up to 1.0; the first one used to be 0.300,
        which left 3.4% of the available time unassigned. *)
     [(0.334, (true, (spass_new_macro_slice_1, ""))),
      (0.333, (true, (spass_new_macro_slice_2, ""))),
      (0.333, (true, (spass_new_macro_slice_3, "")))]}
blanchet@45301
   374
blanchet@45301
   375
(* Name/configuration pair for the new SPASS, in the shape taken by
   "add_atp". *)
val spass_new = (spass_newN, spass_new_config)
blanchet@45301
   376
blanchet@38454
   377
blanchet@37509
   378
(* Vampire *)
blanchet@37509
   379
blanchet@44507
   380
(* Vampire 1.8 has TFF support, but it's buggy and therefore disabled on
blanchet@44507
   381
   SystemOnTPTP. *)
blanchet@44420
   382
(* True iff the value of the VAMPIRE_VERSION setting does not compare as
   GREATER than "1.8" under "string_ord"; version 1.8 itself thus counts as
   old. *)
fun is_old_vampire_version () =
  case string_ord (getenv "VAMPIRE_VERSION", "1.8") of
    GREATER => false
  | _ => true
blanchet@44420
   384
blanchet@44754
   385
(* TFF format descriptor used by the Vampire slices when the installed version
   is not an old one. *)
val vampire_tff0 = TFF (TPTP_Monomorphic, TPTP_Implicit)
blanchet@44589
   386
blanchet@40059
   387
(* Configuration of Vampire. Old versions get FOF problems, newer ones TFF
   problems. The extra information of a slice says whether "--sos on" is
   passed. *)
val vampire_config : atp_config =
  let
    fun arguments _ _ sos timeout _ =
      let
        val base =
          "--mode casc -t " ^ string_of_int (to_secs 1 timeout) ^
          " --proof tptp --output_axiom_names on\
          \ --forced_options propositional_to_bdd=off\
          \ --thanks \"Andrei and Krystof\" --input_file"
      in
        if sos = sosN then "--sos on " ^ base else base
      end

    fun slice fraction complete max_facts format type_enc extra =
      (fraction,
       (complete, ((max_facts, format, type_enc, combs_or_liftingN), extra)))

    fun best_slices ctxt =
      let
        (* FUDGE *)
        val slices =
          if is_old_vampire_version () then
            [slice 0.333 false 150 FOF "poly_guards??" sosN,
             slice 0.333 false 500 FOF "mono_tags??" sosN,
             slice 0.334 true 50 FOF "mono_guards??" no_sosN]
          else
            [slice 0.333 false 150 vampire_tff0 "poly_guards??" sosN,
             slice 0.333 false 500 vampire_tff0 "mono_simple" sosN,
             slice 0.334 true 50 vampire_tff0 "mono_simple" no_sosN]
      in
        (* with "atp_force_sos", only the first slice runs, for the whole time *)
        if Config.get ctxt force_sos then [(1.0, snd (hd slices))] else slices
      end
  in
    {exec = ("VAMPIRE_HOME", "vampire"),
     required_execs = [],
     arguments = arguments,
     proof_delims =
       [("=========== Refutation ==========",
         "======= End of refutation ======="),
        ("% SZS output start Refutation", "% SZS output end Refutation"),
        ("% SZS output start Proof", "% SZS output end Proof")],
     known_failures =
       known_szs_status_failures @
       [(GaveUp, "UNPROVABLE"),
        (GaveUp, "CANNOT PROVE"),
        (Unprovable, "Satisfiability detected"),
        (Unprovable, "Termination reason: Satisfiable"),
        (Interrupted, "Aborted by signal SIGINT")],
     conj_sym_kind = Conjecture,
     prem_kind = Conjecture,
     best_slices = best_slices}
  end
blanchet@38454
   427
blanchet@40059
   428
(* Name/configuration pair for Vampire, in the shape taken by "add_atp". *)
val vampire = (vampireN, vampire_config)
blanchet@37509
   429
blanchet@38454
   430
blanchet@41740
   431
(* Z3 with TPTP syntax *)
blanchet@41740
   432
blanchet@44754
   433
(* TFF format descriptor used by the Z3 slices and by "remote_z3_tptp". *)
val z3_tff0 = TFF (TPTP_Monomorphic, TPTP_Implicit)
blanchet@44589
   434
blanchet@44423
   435
(* Configuration of Z3 reading TPTP syntax. There are no proof delimiters.
   The four slices halve the number of facts each time. *)
val z3_tptp_config : atp_config =
  let
    fun arguments _ _ _ timeout _ =
      "MBQI=true -tptp -t:" ^ string_of_int (to_secs 1 timeout)

    fun slice fraction max_facts =
      (fraction, (false, ((max_facts, z3_tff0, "mono_simple", combsN), "")))
  in
    {exec = ("Z3_HOME", "z3"),
     required_execs = [],
     arguments = arguments,
     proof_delims = [],
     known_failures = known_szs_status_failures,
     conj_sym_kind = Hypothesis,
     prem_kind = Hypothesis,
     best_slices =
       (* FUDGE *)
       K [slice 0.5 250,
          slice 0.25 125,
          slice 0.125 62,
          slice 0.125 31]}
  end
blanchet@41740
   450
blanchet@44423
   451
(* Name/configuration pair for Z3 with TPTP syntax, in the shape taken by
   "add_atp". *)
val z3_tptp = (z3_tptpN, z3_tptp_config)
blanchet@41740
   452
blanchet@44590
   453
blanchet@44754
   454
(* Not really a prover: Experimental Polymorphic TFF and THF output *)
blanchet@44590
   455
blanchet@44754
   456
(* Configuration of a dummy prover for the given format and type encoding. It
   runs "scripts/dummy_atp" without arguments and has a single slice; lambdas
   are kept for higher-order formats and translated with "combsN" otherwise. *)
fun dummy_config format type_enc : atp_config =
  let
    val lam_trans =
      if is_format_higher_order format then keep_lamsN else combsN
  in
    {exec = ("ISABELLE_ATP", "scripts/dummy_atp"),
     required_execs = [],
     arguments = fn _ => fn _ => fn _ => fn _ => fn _ => "",
     proof_delims = [],
     known_failures = known_szs_status_failures,
     conj_sym_kind = Hypothesis,
     prem_kind = Hypothesis,
     best_slices =
       K [(1.0, (false, ((200, format, type_enc, lam_trans), "")))]}
  end
blanchet@44590
   468
blanchet@45365
   469
(* Dummy prover for polymorphic TFF output with the "poly_simple" encoding. *)
val dummy_tff1_format = TFF (TPTP_Polymorphic, TPTP_Explicit)
val dummy_tff1_config = dummy_config dummy_tff1_format "poly_simple"
val dummy_tff1 = (dummy_tff1N, dummy_tff1_config)
blanchet@44590
   472
blanchet@45365
   473
(* Dummy prover for polymorphic THF output with the "poly_simple_higher"
   encoding. *)
val dummy_thf_format = THF (TPTP_Polymorphic, TPTP_Explicit, THF_With_Choice)
val dummy_thf_config = dummy_config dummy_thf_format "poly_simple_higher"
val dummy_thf = (dummy_thfN, dummy_thf_config)
blanchet@44754
   476
blanchet@41740
   477
blanchet@40059
   478
(* Remote ATP invocation via SystemOnTPTP *)
wenzelm@28596
   479
blanchet@38061
   480
(* Synchronized cache of the system names reported by the "remote_atp" script;
   initially empty and filled by "get_system" while it is still empty. *)
val systems = Synchronized.var "atp_systems" ([] : string list)
immler@31835
   481
immler@31835
   482
(* Runs the "remote_atp" script with "-w" and returns its output split into
   lines. A nonzero return code raises an error whose message is either that
   of a recognized Perl-related failure or the script's output, stripped of
   one trailing newline and followed by a period. *)
fun get_systems () =
  let
    val (output, return_code) =
      Isabelle_System.bash_output
        "\"$ISABELLE_ATP/scripts/remote_atp\" -w 2>&1"
  in
    if return_code = 0 then
      split_lines output
    else
      error (case extract_known_failure known_perl_failures output of
               SOME failure => string_for_failure failure
             | NONE => perhaps (try (unsuffix "\n")) output ^ ".")
  end
immler@31835
   490
blanchet@42537
   491
(* Finds the first entry of "systems" that starts with "name---version" for
   the earliest possible version in "versions". Once the versions are
   exhausted, any entry starting with "name---" is accepted. *)
fun find_system name versions systems =
  let
    fun lookup version_prefix =
      find_first (String.isPrefix (name ^ "---" ^ version_prefix)) systems
  in
    case versions of
      [] => lookup ""
    | version :: versions' =>
      (case lookup version of
         NONE => find_system name versions' systems
       | found => found)
  end
blanchet@38690
   497
blanchet@38690
   498
(* Looks up a system in the cached list, fetching the list first if the cache
   is empty. Returns the optional match together with the list that was
   searched; that list also becomes the new content of the cache. *)
fun get_system name versions =
  Synchronized.change_result systems
      (fn cached =>
        let
          val available = if null cached then get_systems () else cached
        in
          ((find_system name versions available, available), available)
        end)
boehmes@32864
   502
blanchet@38690
   503
(* Like "get_system", but returns the match itself and raises an error if
   there is none: one message for an empty system list, another one (listing
   the available systems) otherwise. *)
fun the_system name versions =
  let val (found, available) = get_system name versions in
    case found of
      SOME sys => sys
    | NONE =>
      if null available then
        error ("SystemOnTPTP is currently not available.")
      else
        error ("System " ^ quote name ^ " is not available at SystemOnTPTP.\n" ^
               "(Available systems: " ^ commas_quote available ^ ".)")
  end
immler@31835
   510
blanchet@41148
   511
(* Upper bound, in seconds, on the time limit that "remote_config" passes to
   the remote script. *)
val max_remote_secs = 240 (* give Geoff Sutcliffe's servers a break *)
blanchet@41148
   512
blanchet@38690
   513
(* Configuration of a prover that is run through the "remote_atp" script. The
   time limit is capped at "max_remote_secs". The concrete system is resolved
   by "the_system" each time the arguments are computed. There is a single,
   incomplete slice, whose problem setup is given by "best_slice". *)
fun remote_config system_name system_versions proof_delims known_failures
                  conj_sym_kind prem_kind best_slice : atp_config =
  let
    fun arguments _ _ _ timeout _ =
      let
        val secs = Int.min (max_remote_secs, to_secs 1 timeout)
      in
        "-t " ^ string_of_int secs
        ^ " -s " ^ the_system system_name system_versions
      end

    fun best_slices ctxt = [(1.0, (false, (best_slice ctxt, "")))]
  in
    {exec = ("ISABELLE_ATP", "scripts/remote_atp"),
     required_execs = [],
     arguments = arguments,
     proof_delims = union (op =) tstp_proof_delims proof_delims,
     known_failures =
       known_failures @ known_perl_failures @ known_says_failures,
     conj_sym_kind = conj_sym_kind,
     prem_kind = prem_kind,
     best_slices = best_slices}
  end
blanchet@42443
   528
blanchet@43500
   529
(* Remote counterpart of a local configuration: proof delimiters, known
   failures and formula kinds are taken from "config", everything else is set
   up by "remote_config". *)
fun remotify_config system_name system_versions best_slice
        (config : atp_config) : atp_config =
  remote_config system_name system_versions
                (#proof_delims config) (#known_failures config)
                (#conj_sym_kind config) (#prem_kind config) best_slice
blanchet@38023
   534
blanchet@40059
   535
(* Name/configuration pair for a prover that is only available remotely; the
   name is prefixed with "remote_prefix". *)
fun remote_atp name system_name system_versions proof_delims known_failures
               conj_sym_kind prem_kind best_slice =
  let
    val config =
      remote_config system_name system_versions proof_delims known_failures
                    conj_sym_kind prem_kind best_slice
  in
    (remote_prefix ^ name, config)
  end
blanchet@43500
   540
(* Turns an existing (name, config) prover entry into its remote counterpart:
   the name gets remote_prefix prepended and the configuration is converted
   with remotify_config. *)
fun remotify_atp (name, config) system_name system_versions best_slice =
blanchet@43500
   541
  (remote_prefix ^ name,
blanchet@43500
   542
   remotify_config system_name system_versions best_slice config)
wenzelm@28592
   543
blanchet@44754
   544
(* TFF problem format built from TPTP_Monomorphic and TPTP_Explicit; used as
   the format of the remote_snark and remote_e_tofof slices. *)
val explicit_tff0 = TFF (TPTP_Monomorphic, TPTP_Explicit)
blanchet@44589
   545
blanchet@43500
   546
(* Remote counterpart of the e entry: system name "EP" with the listed version
   strings.  The slice tuple is (max_relevant, format, type_enc, lam_trans) and
   does not depend on the context; its values are hand-tuned (FUDGE). *)
val remote_e =
blanchet@43500
   547
  remotify_atp e "EP" ["1.0", "1.1", "1.2"]
blanchet@46365
   548
      (K (750, FOF, "mono_tags??", combsN) (* FUDGE *))
blanchet@44099
   549
(* Remote counterpart of the leo2 entry: system name "LEO-II" with the listed
   version strings; context-independent, hand-tuned slice (FUDGE). *)
val remote_leo2 =
blanchet@44099
   550
  remotify_atp leo2 "LEO-II" ["1.2.8", "1.2.6"]
blanchet@46365
   551
      (K (100, leo2_thf0, "mono_simple_higher", liftingN) (* FUDGE *))
blanchet@44099
   552
(* Remote counterpart of the satallax entry: system name "Satallax" with the
   listed version strings; context-independent, hand-tuned slice (FUDGE). *)
val remote_satallax =
blanchet@44099
   553
  remotify_atp satallax "Satallax" ["2.1", "2.0", "2"]
blanchet@45521
   554
      (K (100, satallax_thf0, "mono_simple_higher", keep_lamsN) (* FUDGE *))
blanchet@43500
   555
(* Remote counterpart of the vampire entry: system name "Vampire", version
   string "1.8"; context-independent, hand-tuned slice (FUDGE). *)
val remote_vampire =
blanchet@44499
   556
  remotify_atp vampire "Vampire" ["1.8"]
blanchet@46365
   557
      (K (250, FOF, "mono_guards??", combs_or_liftingN) (* FUDGE *))
blanchet@44423
   558
(* Remote counterpart of the z3_tptp entry: system name "Z3", version string
   "3.0"; context-independent, hand-tuned slice (FUDGE). *)
val remote_z3_tptp =
blanchet@44754
   559
  remotify_atp z3_tptp "Z3" ["3.0"]
blanchet@46365
   560
      (K (250, z3_tff0, "mono_simple", combsN) (* FUDGE *))
blanchet@44092
   561
(* Remote-only entry for system "SInE", version string "0.4".  It adds no
   proof delimiters of its own, reuses the known_failures of e_config, and
   passes Axiom as conj_sym_kind and Conjecture as prem_kind.  The slice is
   context-independent and hand-tuned (FUDGE). *)
val remote_e_sine =
blanchet@44092
   562
  remote_atp e_sineN "SInE" ["0.4"] [] (#known_failures e_config) Axiom
blanchet@46365
   563
      Conjecture (K (500, FOF, "mono_guards??", combsN) (* FUDGE *))
blanchet@45338
   564
(* Remote-only entry for system "iProver".  The version list, the extra proof
   delimiters and the extra known failures are all empty; conj_sym_kind is
   Axiom and prem_kind is Conjecture.  Hand-tuned slice (FUDGE). *)
val remote_iprover =
blanchet@45338
   565
  remote_atp iproverN "iProver" [] [] [] Axiom Conjecture
blanchet@46365
   566
      (K (150, FOF, "mono_guards??", liftingN) (* FUDGE *))
blanchet@45338
   567
(* Remote-only entry for system "iProver-Eq"; same arguments as remote_iprover
   apart from the prover name and the system name.  Hand-tuned slice (FUDGE). *)
val remote_iprover_eq =
blanchet@45338
   568
  remote_atp iprover_eqN "iProver-Eq" [] [] [] Axiom Conjecture
blanchet@46365
   569
      (K (150, FOF, "mono_guards??", liftingN) (* FUDGE *))
blanchet@41740
   570
(* Remote-only entry for system "SNARK" with the listed version strings.  It
   adds the proof delimiter pair ("refutation.", "end_refutation."), has no
   extra known failures, and uses Hypothesis for both conj_sym_kind and
   prem_kind.  Hand-tuned slice in the explicit_tff0 format (FUDGE). *)
val remote_snark =
blanchet@42939
   571
  remote_atp snarkN "SNARK" ["20080805r029", "20080805r024"]
blanchet@45521
   572
      [("refutation.", "end_refutation.")] [] Hypothesis Hypothesis
blanchet@46365
   573
      (K (100, explicit_tff0, "mono_simple", liftingN) (* FUDGE *))
blanchet@44092
   574
(* Remote-only entry for system "ToFoF", version string "0.1".  It adds no
   proof delimiters of its own, reuses the known_failures of e_config, and
   passes Axiom as conj_sym_kind and Hypothesis as prem_kind.  Hand-tuned
   slice in the explicit_tff0 format (FUDGE). *)
val remote_e_tofof =
blanchet@44589
   575
  remote_atp e_tofofN "ToFoF" ["0.1"] [] (#known_failures e_config) Axiom
blanchet@45521
   576
      Hypothesis
blanchet@46365
   577
      (K (150, explicit_tff0, "mono_simple", liftingN) (* FUDGE *))
blanchet@42938
   578
(* Remote-only entry for system "Waldmeister", version string "710".  It adds
   its own proof delimiter pair and two output patterns that are classified as
   OutOfResources and Crashed; conj_sym_kind and prem_kind are both
   Hypothesis.  Hand-tuned slice in the CNF_UEQ format (FUDGE). *)
val remote_waldmeister =
blanchet@42938
   579
  remote_atp waldmeisterN "Waldmeister" ["710"]
blanchet@45521
   580
      [("#START OF PROOF", "Proved Goals:")]
blanchet@45521
   581
      [(OutOfResources, "Too many function symbols"),
blanchet@45521
   582
       (Crashed, "Unrecoverable Segmentation Fault")]
blanchet@45521
   583
      Hypothesis Hypothesis
blanchet@46365
   584
      (K (50, CNF_UEQ, "mono_tags??", combsN) (* FUDGE *))
blanchet@38454
   585
blanchet@38454
   586
(* Setup *)
blanchet@38454
   587
blanchet@40059
   588
(* Registers a prover in the theory data table under name, storing the
   configuration together with a fresh stamp.  Symtab.update_new rejects an
   existing key; that Symtab.DUP exception is turned into a user-level error
   naming the duplicate. *)
fun add_atp (name, config) thy =
blanchet@40059
   589
  Data.map (Symtab.update_new (name, (config, stamp ()))) thy
blanchet@40059
   590
  handle Symtab.DUP name => error ("Duplicate ATP: " ^ quote name ^ ".")
blanchet@40059
   591
blanchet@40059
   592
(* Looks up the prover registered under name in the theory data and returns
   the first component of the stored pair (the configuration, see add_atp).
   A missing entry surfaces as Option.Option and is reported as an
   "Unknown ATP" error. *)
fun get_atp thy name =
blanchet@40059
   593
  the (Symtab.lookup (Data.get thy) name) |> fst
blanchet@40059
   594
  handle Option.Option => error ("Unknown ATP: " ^ name ^ ".")
blanchet@40059
   595
blanchet@41727
   596
(* Names of all provers currently registered in the theory data table. *)
fun supported_atps thy = Symtab.keys (Data.get thy)
blanchet@36371
   597
blanchet@40059
   598
(* Checks whether the prover registered under name is usable: true iff, for
   the exec pair and every pair in required_execs, the environment variable
   named by the pair's first component has a non-empty value.  Raises the
   "Unknown ATP" error of get_atp when name is not registered. *)
fun is_atp_installed thy name =
blanchet@40059
   599
  let val {exec, required_execs, ...} = get_atp thy name in
blanchet@40059
   600
    forall (curry (op <>) "" o getenv o fst) (exec :: required_execs)
blanchet@40059
   601
  end
blanchet@36371
   602
blanchet@40059
   603
(* Replaces the contents of the synchronized variable systems with a fresh
   result of get_systems (); the previous contents are discarded.
   NOTE(review): get_systems presumably queries the remote service for its
   available systems -- confirm against its definition. *)
fun refresh_systems_on_tptp () =
blanchet@40059
   604
  Synchronized.change systems (fn _ => get_systems ())
blanchet@40059
   605
blanchet@42962
   606
(* All (name, config) prover entries that setup registers: the local entries
   first, followed by the remote ones. *)
val atps =
blanchet@45365
   607
  [e, leo2, dummy_tff1, dummy_thf, satallax, spass, spass_new, vampire, z3_tptp,
blanchet@45365
   608
   remote_e, remote_e_sine, remote_e_tofof, remote_iprover, remote_iprover_eq,
blanchet@45339
   609
   remote_leo2, remote_satallax, remote_vampire, remote_z3_tptp, remote_snark,
blanchet@45339
   610
   remote_waldmeister]
blanchet@40059
   611
(* Theory setup: registers every entry of atps, in list order, via add_atp. *)
fun setup thy = fold add_atp atps thy
blanchet@35867
   612
wenzelm@28592
   613
end;