src/HOL/Tools/ATP/atp_systems.ML
author blanchet
Thu, 16 Sep 2010 15:16:08 +0200
changeset 39491 2416666e6f94
parent 39375 81894ee79ee8
child 40059 6ad9081665db
permissions -rw-r--r--
refactoring: move ATP proof and error extraction code to "ATP_Proof" module
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
38047
9033c03cc214 consequence of directory renaming
blanchet
parents: 38046
diff changeset
     1
(*  Title:      HOL/Tools/ATP/atp_systems.ML
28592
824f8390aaa2 renamed AtpThread to AtpWrapper;
wenzelm
parents:
diff changeset
     2
    Author:     Fabian Immler, TU Muenchen
36371
8c83ea1a7740 move the Sledgehammer menu options to "sledgehammer_isar.ML"
blanchet
parents: 36370
diff changeset
     3
    Author:     Jasmin Blanchette, TU Muenchen
28592
824f8390aaa2 renamed AtpThread to AtpWrapper;
wenzelm
parents:
diff changeset
     4
36376
e83d52a52449 renamed module "ATP_Wrapper" to "ATP_Systems"
blanchet
parents: 36371
diff changeset
     5
Setup for supported ATPs.
28592
824f8390aaa2 renamed AtpThread to AtpWrapper;
wenzelm
parents:
diff changeset
     6
*)
824f8390aaa2 renamed AtpThread to AtpWrapper;
wenzelm
parents:
diff changeset
     7
36376
e83d52a52449 renamed module "ATP_Wrapper" to "ATP_Systems"
blanchet
parents: 36371
diff changeset
     8
(* Public interface of the ATP registry: the prover configuration record,
   registration and lookup of provers in a theory, and access to the list of
   systems reported by the remote SystemOnTPTP script. *)
signature ATP_SYSTEMS =
sig
  type failure = ATP_Proof.failure

  (* Description of one prover: what to run, which arguments to pass, and
     which strings delimit proofs or indicate failures in its output. *)
  type prover_config =
    {exec: string * string,
     required_execs: (string * string) list,
     arguments: bool -> Time.time -> string,
     has_incomplete_mode: bool,
     proof_delims: (string * string) list,
     known_failures: (failure * string) list,
     default_max_relevant: int,
     explicit_forall: bool,
     use_conjecture_for_hypotheses: bool}

  (* Register a prover under a name; registering a name that is already
     present is reported as a "Duplicate ATP" error. *)
  val add_prover: string * prover_config -> theory -> theory
  (* Look up a registered prover by name; an unregistered name is reported as
     an "Unknown ATP" error. *)
  val get_prover: theory -> string -> prover_config
  (* Print the sorted, comma-separated names of all registered provers. *)
  val available_atps: theory -> unit
  (* Query the remote system list again and replace the cached list. *)
  val refresh_systems_on_tptp : unit -> unit
  val default_atps_param_value : unit -> string
  val setup : theory -> theory
end;
824f8390aaa2 renamed AtpThread to AtpWrapper;
wenzelm
parents:
diff changeset
    30
36376
e83d52a52449 renamed module "ATP_Wrapper" to "ATP_Systems"
blanchet
parents: 36371
diff changeset
    31
structure ATP_Systems : ATP_SYSTEMS =
28592
824f8390aaa2 renamed AtpThread to AtpWrapper;
wenzelm
parents:
diff changeset
    32
struct
28596
fcd463a6b6de tuned interfaces -- plain prover function, without thread;
wenzelm
parents: 28592
diff changeset
    33
39491
2416666e6f94 refactoring: move ATP proof and error extraction code to "ATP_Proof" module
blanchet
parents: 39375
diff changeset
    34
open ATP_Proof
32864
a226f29d4bdc re-organized signature of AtpWrapper structure: records instead of unnamed parameters and return values,
boehmes
parents: 32740
diff changeset
    35
39491
2416666e6f94 refactoring: move ATP proof and error extraction code to "ATP_Proof" module
blanchet
parents: 39375
diff changeset
    36
(* prover configuration *)
32864
a226f29d4bdc re-organized signature of AtpWrapper structure: records instead of unnamed parameters and return values,
boehmes
parents: 32740
diff changeset
    37
32941
72d48e333b77 eliminated extraneous wrapping of public records;
wenzelm
parents: 32936
diff changeset
    38
(* Description of one prover.

   exec: pair of strings naming the program to run.  In the configurations
     defined in this file the first component is an environment variable name
     (e.g. "E_HOME") and the second a program name or relative path;
     presumably the caller joins the two -- confirm at the use site.
   required_execs: further pairs of the same shape (SPASS lists "SPASS" and
     "tptp2dfg" here).
   arguments: builds the command-line argument string from a Boolean (bound
     as "complete" in the SPASS and Vampire configurations) and a timeout.
   has_incomplete_mode: true for the configurations whose "arguments" add an
     SOS option when the Boolean is false.
   proof_delims: pairs of (start marker, end marker) strings.
   known_failures: failures paired with a string; presumably the string is
     searched for in the prover's output -- confirm in ATP_Proof.
   default_max_relevant: an integer default, marked as a fudge factor where
     it is set.
   explicit_forall, use_conjecture_for_hypotheses: flags whose consumers are
     not visible in this part of the file. *)
type prover_config =
  {exec: string * string,
   required_execs: (string * string) list,
   arguments: bool -> Time.time -> string,
   has_incomplete_mode: bool,
   proof_delims: (string * string) list,
   known_failures: (failure * string) list,
   default_max_relevant: int,
   explicit_forall: bool,
   use_conjecture_for_hypotheses: bool}
28596
fcd463a6b6de tuned interfaces -- plain prover function, without thread;
wenzelm
parents: 28592
diff changeset
    48
38061
685d1f0f75b3 handle Perl and "libwww-perl" failures more gracefully, giving the user some clues about what goes on
blanchet
parents: 38049
diff changeset
    49
(* Failures paired with the text that identifies them.  Used for the SPASS
   wrapper script and when the "remote_atp" script exits with a non-zero
   status. *)
val known_perl_failures =
  [(CantConnect, "HTTP error"),
   (NoPerl, "env: perl"),
   (NoLibwwwPerl, "Can't locate HTTP")]
28596
fcd463a6b6de tuned interfaces -- plain prover function, without thread;
wenzelm
parents: 28592
diff changeset
    53
38023
962b0a7f544b more refactoring
blanchet
parents: 38022
diff changeset
    54
(* named provers *)
38001
a9b47b85ca24 reintroduced more preprocessing steps to Sledgehammer, adapted to the new FOF setting
blanchet
parents: 38000
diff changeset
    55
38023
962b0a7f544b more refactoring
blanchet
parents: 38022
diff changeset
    56
(* Theory data holding the registered provers, keyed by name.  Each
   configuration is stored together with a stamp created at registration
   time. *)
structure Data = Theory_Data
(
  type T = (prover_config * stamp) Symtab.table
  val empty = Symtab.empty
  val extend = I
  (* Entries are compared by their stamps only ("eq_snd op ="); presumably
     this is because prover_config contains a function and so cannot be
     compared with "=".  A Symtab.DUP raised by the merge is turned into a
     user-level error. *)
  fun merge data : T = Symtab.merge (eq_snd op =) data
    handle Symtab.DUP name => error ("Duplicate ATP: " ^ quote name ^ ".")
)
38017
3ad3e3ca2451 move Sledgehammer-specific code out of "Sledgehammer_TPTP_Format"
blanchet
parents: 38015
diff changeset
    64
38023
962b0a7f544b more refactoring
blanchet
parents: 38022
diff changeset
    65
(* Register "config" under "name" in the theory, tagging it with a fresh
   stamp.  A name that is already registered yields a "Duplicate ATP"
   error. *)
fun add_prover (name, config) thy =
  let
    val entry = (name, (config, stamp ()))
  in
    thy |> Data.map (Symtab.update_new entry)
    handle Symtab.DUP dup => error ("Duplicate ATP: " ^ quote dup ^ ".")
  end
38017
3ad3e3ca2451 move Sledgehammer-specific code out of "Sledgehammer_TPTP_Format"
blanchet
parents: 38015
diff changeset
    68
38023
962b0a7f544b more refactoring
blanchet
parents: 38022
diff changeset
    69
(* Return the configuration registered under "name" (the stamp stored with it
   is dropped).  An unregistered name yields an "Unknown ATP" error. *)
fun get_prover thy name =
  (case Symtab.lookup (Data.get thy) name of
    SOME (config, _) => config
  | NONE => error ("Unknown ATP: " ^ name ^ "."))
37962
d7dbe01f48d7 keep track of clause numbers for SPASS now that we generate FOF rather than CNF problems;
blanchet
parents: 37926
diff changeset
    72
38023
962b0a7f544b more refactoring
blanchet
parents: 38022
diff changeset
    73
(* Print the names of all provers registered in the theory, sorted and
   separated by commas. *)
fun available_atps thy =
  let
    val names = Data.get thy |> Symtab.keys |> sort_strings
  in
    priority ("Available ATPs: " ^ commas names ^ ".")
  end
32864
a226f29d4bdc re-organized signature of AtpWrapper structure: records instead of unnamed parameters and return values,
boehmes
parents: 32740
diff changeset
    76
38737
bdcb23701448 better workaround for E's off-by-one-second issue
blanchet
parents: 38691
diff changeset
    77
(* Convert "time" to whole seconds after adding "bonus" milliseconds,
   rounding up to the next full second. *)
fun to_secs bonus time =
  let
    val millis = Time.toMilliseconds time + bonus
  in
    (millis + 999) div 1000
  end
36142
f5e15e9aae10 make Sledgehammer "minimize" output less confusing + round up (not down) time limits to nearest second
blanchet
parents: 36064
diff changeset
    78
39491
2416666e6f94 refactoring: move ATP proof and error extraction code to "ATP_Proof" module
blanchet
parents: 39375
diff changeset
    79
28596
fcd463a6b6de tuned interfaces -- plain prover function, without thread;
wenzelm
parents: 28592
diff changeset
    80
(* E prover *)
fcd463a6b6de tuned interfaces -- plain prover function, without thread;
wenzelm
parents: 28592
diff changeset
    81
38737
bdcb23701448 better workaround for E's off-by-one-second issue
blanchet
parents: 38691
diff changeset
    82
(* Give older versions of E an extra second, because the "eproof" script wrongly
bdcb23701448 better workaround for E's off-by-one-second issue
blanchet
parents: 38691
diff changeset
    83
   subtracted an entire second to account for the overhead of the script
bdcb23701448 better workaround for E's off-by-one-second issue
blanchet
parents: 38691
diff changeset
    84
   itself, which is in fact much lower. *)
bdcb23701448 better workaround for E's off-by-one-second issue
blanchet
parents: 38691
diff changeset
    85
fun e_bonus () =
  let
    (* Version prefixes that receive the extra second. *)
    val old_prefixes = ["0.9", "1.0"]
    val version = getenv "E_VERSION"
    fun is_old v = exists (fn p => String.isPrefix p v) old_prefixes
  in
    (* An empty E_VERSION is treated like an old version. *)
    if version = "" orelse is_old version then 1000 else 0
  end
bdcb23701448 better workaround for E's off-by-one-second issue
blanchet
parents: 38691
diff changeset
    91
36369
d2cd0d04b8e6 handle ATP proof delimiters in a cleaner, more extensible fashion
blanchet
parents: 36289
diff changeset
    92
(* Start and end markers used as the proof delimiters of the E configuration.
   Note that the start marker ends with a period and the end marker does
   not. *)
val tstp_proof_delims =
  ("# SZS output start CNFRefutation.", "# SZS output end CNFRefutation")
d2cd0d04b8e6 handle ATP proof delimiters in a cleaner, more extensible fashion
blanchet
parents: 36289
diff changeset
    94
35969
c9565298df9e added support for Sledgehammer parameters;
blanchet
parents: 35869
diff changeset
    95
(* Configuration for the E prover, run through "eproof". *)
val e_config : prover_config =
  let
    (* The Boolean argument is ignored.  The CPU limit is the timeout plus the
       version-dependent bonus, rounded up to whole seconds. *)
    fun arguments _ timeout =
      "--tstp-in --tstp-out -l5 -xAutoDev -tAutoDev --silent \
      \--cpu-limit=" ^ string_of_int (to_secs (e_bonus ()) timeout)

    val known_failures =
      [(Unprovable, "SZS status: CounterSatisfiable"),
       (Unprovable, "SZS status CounterSatisfiable"),
       (TimedOut, "Failure: Resource limit exceeded (time)"),
       (TimedOut, "time limit exceeded"),
       (OutOfResources,
        "# Cannot determine problem status within resource limit"),
       (OutOfResources, "SZS status: ResourceOut"),
       (OutOfResources, "SZS status ResourceOut")]
  in
    {exec = ("E_HOME", "eproof"),
     required_execs = [],
     arguments = arguments,
     has_incomplete_mode = false,
     proof_delims = [tstp_proof_delims],
     known_failures = known_failures,
     default_max_relevant = 500 (* FUDGE *),
     explicit_forall = false,
     use_conjecture_for_hypotheses = true}
  end
38454
9043eefe8d71 detect old Vampire and give a nicer error message
blanchet
parents: 38433
diff changeset
   115
38023
962b0a7f544b more refactoring
blanchet
parents: 38022
diff changeset
   116
(* The E configuration paired with the name "e". *)
val e = ("e", e_config)
28596
fcd463a6b6de tuned interfaces -- plain prover function, without thread;
wenzelm
parents: 28592
diff changeset
   117
fcd463a6b6de tuned interfaces -- plain prover function, without thread;
wenzelm
parents: 28592
diff changeset
   118
39491
2416666e6f94 refactoring: move ATP proof and error extraction code to "ATP_Proof" module
blanchet
parents: 39375
diff changeset
   119
(* SPASS *)
2416666e6f94 refactoring: move ATP proof and error extraction code to "ATP_Proof" module
blanchet
parents: 39375
diff changeset
   120
36219
16670b4f0baa set SPASS option on the command-line, so that it doesn't vanish when moving to TPTP format
blanchet
parents: 36190
diff changeset
   121
(* The "-VarWeight=3" option helps the higher-order problems, probably by
16670b4f0baa set SPASS option on the command-line, so that it doesn't vanish when moving to TPTP format
blanchet
parents: 36190
diff changeset
   122
   counteracting the presence of "hAPP". *)
37498
b426cbdb5a23 removed Sledgehammer's support for the DFG syntax;
blanchet
parents: 37480
diff changeset
   123
val spass_config : prover_config =
  let
    (* When "complete" is false, "-SOS=1 " is put in front of the base
       options. *)
    fun arguments complete timeout =
      let
        val base =
          "-Auto -PGiven=0 -PProblem=0 -Splits=0 -FullRed=0 -DocProof \
          \-VarWeight=3 -TimeLimit=" ^ string_of_int (to_secs 0 timeout)
      in
        if complete then base else "-SOS=1 " ^ base
      end

    val spass_failures =
      [(IncompleteUnprovable, "SPASS beiseite: Completion found"),
       (TimedOut, "SPASS beiseite: Ran out of time"),
       (OutOfResources, "SPASS beiseite: Maximal number of loops exceeded"),
       (MalformedInput, "Undefined symbol"),
       (MalformedInput, "Free Variable"),
       (SpassTooOld, "tptp2dfg"),
       (InternalError, "Please report this error")]
  in
    {exec = ("ISABELLE_ATP", "scripts/spass"),
     required_execs = [("SPASS_HOME", "SPASS"), ("SPASS_HOME", "tptp2dfg")],
     arguments = arguments,
     has_incomplete_mode = true,
     proof_delims = [("Here is a proof", "Formulae used in the proof")],
     (* The Perl-related failures are listed first. *)
     known_failures = known_perl_failures @ spass_failures,
     default_max_relevant = 350 (* FUDGE *),
     explicit_forall = true,
     use_conjecture_for_hypotheses = true}
  end
38454
9043eefe8d71 detect old Vampire and give a nicer error message
blanchet
parents: 38433
diff changeset
   144
38023
962b0a7f544b more refactoring
blanchet
parents: 38022
diff changeset
   145
(* The SPASS configuration paired with the name "spass". *)
val spass = ("spass", spass_config)
28596
fcd463a6b6de tuned interfaces -- plain prover function, without thread;
wenzelm
parents: 28592
diff changeset
   146
38454
9043eefe8d71 detect old Vampire and give a nicer error message
blanchet
parents: 38433
diff changeset
   147
37509
f39464d971c4 factor out TPTP format output into file of its own, to facilitate further changes
blanchet
parents: 37506
diff changeset
   148
(* Vampire *)
f39464d971c4 factor out TPTP format output into file of its own, to facilitate further changes
blanchet
parents: 37506
diff changeset
   149
f39464d971c4 factor out TPTP format output into file of its own, to facilitate further changes
blanchet
parents: 37506
diff changeset
   150
(* Configuration for a locally installed Vampire. *)
val vampire_config : prover_config =
  let
    (* When "complete" is false, "--sos on " is put in front of the base
       options. *)
    fun arguments complete timeout =
      let
        val base =
          "--mode casc -t " ^ string_of_int (to_secs 0 timeout) ^
          " --thanks Andrei --input_file"
      in
        if complete then base else "--sos on " ^ base
      end

    (* Three delimiter pairs are accepted. *)
    val proof_delims =
      [("=========== Refutation ==========",
        "======= End of refutation ======="),
       ("% SZS output start Refutation", "% SZS output end Refutation"),
       ("% SZS output start Proof", "% SZS output end Proof")]

    val known_failures =
      [(Unprovable, "UNPROVABLE"),
       (IncompleteUnprovable, "CANNOT PROVE"),
       (TimedOut, "SZS status Timeout"),
       (Unprovable, "Satisfiability detected"),
       (Unprovable, "Termination reason: Satisfiable"),
       (VampireTooOld, "not a valid option"),
       (Interrupted, "Aborted by signal SIGINT")]
  in
    {exec = ("VAMPIRE_HOME", "vampire"),
     required_execs = [],
     arguments = arguments,
     has_incomplete_mode = true,
     proof_delims = proof_delims,
     known_failures = known_failures,
     default_max_relevant = 400 (* FUDGE *),
     explicit_forall = false,
     use_conjecture_for_hypotheses = true}
  end
38454
9043eefe8d71 detect old Vampire and give a nicer error message
blanchet
parents: 38433
diff changeset
   174
38023
962b0a7f544b more refactoring
blanchet
parents: 38022
diff changeset
   175
(* The Vampire configuration paired with the name "vampire". *)
val vampire = ("vampire", vampire_config)
37509
f39464d971c4 factor out TPTP format output into file of its own, to facilitate further changes
blanchet
parents: 37506
diff changeset
   176
38454
9043eefe8d71 detect old Vampire and give a nicer error message
blanchet
parents: 38433
diff changeset
   177
37509
f39464d971c4 factor out TPTP format output into file of its own, to facilitate further changes
blanchet
parents: 37506
diff changeset
   178
(* Remote prover invocation via SystemOnTPTP *)
28596
fcd463a6b6de tuned interfaces -- plain prover function, without thread;
wenzelm
parents: 28592
diff changeset
   179
38061
685d1f0f75b3 handle Perl and "libwww-perl" failures more gracefully, giving the user some clues about what goes on
blanchet
parents: 38049
diff changeset
   180
(* Cached list of system names as returned by "get_systems".  It starts out
   empty; "get_system" treats an empty list as "not fetched yet" and queries
   the script again. *)
val systems = Synchronized.var "atp_systems" ([] : string list)
31835
b686d4df54c2 check for current versions on server
immler@in.tum.de
parents: 31832
diff changeset
   181
b686d4df54c2 check for current versions on server
immler@in.tum.de
parents: 31832
diff changeset
   182
(* Run the "remote_atp" script with "-w" and return its output split into
   lines.  A non-zero exit status is reported as an error: the message is
   that of a recognized Perl-related failure if one is found, and otherwise
   the raw output (without one trailing newline) followed by a period. *)
fun get_systems () =
  let
    val (output, rc) =
      bash_output "\"$ISABELLE_ATP/scripts/remote_atp\" -w 2>&1"
    fun message () =
      (case extract_known_failure known_perl_failures output of
        SOME failure => string_for_failure failure
      | NONE => perhaps (try (unsuffix "\n")) output ^ ".")
  in
    if rc = 0 then split_lines output else error (message ())
  end
31835
b686d4df54c2 check for current versions on server
immler@in.tum.de
parents: 31832
diff changeset
   189
35867
16279c4c7a33 move all ATP setup code into ATP_Wrapper
blanchet
parents: 35865
diff changeset
   190
(* Replace the cached system list with a freshly fetched one.  The fetch is
   performed inside the update function handed to Synchronized.change. *)
fun refresh_systems_on_tptp () =
  let
    fun refetch _ = get_systems ()
  in
    Synchronized.change systems refetch
  end
31835
b686d4df54c2 check for current versions on server
immler@in.tum.de
parents: 31832
diff changeset
   192
38690
38a926e033ad make remote ATP versions more robust, by starting with "preferred" version numbers and falling back on any version
blanchet
parents: 38685
diff changeset
   193
(* Find the first system whose name starts with "name---version", trying the
   given versions in order.  If no version matches (or none is given), fall
   back on the first system whose name starts with "name". *)
fun find_system name versions systems =
  let
    fun lookup prfx = find_first (String.isPrefix prfx) systems
    fun try_versions [] = lookup name
      | try_versions (v :: vs) =
          (case lookup (name ^ "---" ^ v) of
            NONE => try_versions vs
          | found => found)
  in
    try_versions versions
  end
38a926e033ad make remote ATP versions more robust, by starting with "preferred" version numbers and falling back on any version
blanchet
parents: 38685
diff changeset
   198
38a926e033ad make remote ATP versions more robust, by starting with "preferred" version numbers and falling back on any version
blanchet
parents: 38685
diff changeset
   199
(* Finds the entry for "name" (honouring the preferred "versions") in the
   cached system list. An empty cache is filled via "get_systems" first, and
   the list that was searched is stored back as the new cache contents.
   Returns the optional match. *)
fun get_system name versions =
  let
    fun lookup cached =
      let
        val available = if null cached then get_systems () else cached
      in
        (find_system name versions available, available)
      end
  in
    Synchronized.change_result systems lookup
  end
32864
a226f29d4bdc re-organized signature of AtpWrapper structure: records instead of unnamed parameters and return values,
boehmes
parents: 32740
diff changeset
   203
38690
38a926e033ad make remote ATP versions more robust, by starting with "preferred" version numbers and falling back on any version
blanchet
parents: 38685
diff changeset
   204
(* Like "get_system", but raises an error instead of returning NONE when no
   matching system is found. *)
fun the_system name versions =
  let
    fun unavailable () =
      error ("System " ^ quote name ^ " not available at SystemOnTPTP.")
  in
    (case get_system name versions of
      NONE => unavailable ()
    | SOME sys => sys)
  end
31835
b686d4df54c2 check for current versions on server
immler@in.tum.de
parents: 31832
diff changeset
   208
38690
38a926e033ad make remote ATP versions more robust, by starting with "preferred" version numbers and falling back on any version
blanchet
parents: 38685
diff changeset
   209
(* Builds the configuration of a prover that is run through the
   "scripts/remote_atp" script.

   system_name, system_versions: passed to "the_system" to pick the system
     identifier handed to the script via "-s"; the lookup is only performed
     when the argument string is actually built.
   proof_delims: prover-specific proof delimiters; the TSTP delimiters are
     added unless already present.
   known_failures: prover-specific failure patterns; the Perl failures and the
     remote timeout message are appended.
   default_max_relevant, use_conjecture_for_hypotheses: stored unchanged. *)
fun remote_config system_name system_versions proof_delims known_failures
                  default_max_relevant use_conjecture_for_hypotheses
                  : prover_config =
  let
    fun remote_arguments _ timeout =
      " -t " ^ string_of_int (to_secs 0 timeout) ^ " -s " ^
      the_system system_name system_versions
    val all_proof_delims = insert (op =) tstp_proof_delims proof_delims
    val all_known_failures =
      known_failures @ known_perl_failures @ [(TimedOut, "says Timeout")]
  in
    {exec = ("ISABELLE_ATP", "scripts/remote_atp"),
     required_execs = [],
     arguments = remote_arguments,
     has_incomplete_mode = false,
     proof_delims = all_proof_delims,
     known_failures = all_known_failures,
     default_max_relevant = default_max_relevant,
     explicit_forall = true,
     use_conjecture_for_hypotheses = use_conjecture_for_hypotheses}
  end
28596
fcd463a6b6de tuned interfaces -- plain prover function, without thread;
wenzelm
parents: 28592
diff changeset
   225
38690
38a926e033ad make remote ATP versions more robust, by starting with "preferred" version numbers and falling back on any version
blanchet
parents: 38685
diff changeset
   226
(* Derives a remote configuration from an existing one: the proof delimiters,
   known failures, default relevance limit and conjecture/hypothesis setting
   are taken over from "config"; everything else comes from "remote_config". *)
fun remotify_config system_name system_versions (config : prover_config)
                    : prover_config =
  remote_config system_name system_versions
                (#proof_delims config)
                (#known_failures config)
                (#default_max_relevant config)
                (#use_conjecture_for_hypotheses config)
38023
962b0a7f544b more refactoring
blanchet
parents: 38022
diff changeset
   231
38598
ce117ef51999 added remote SInE and remote SNARK
blanchet
parents: 38596
diff changeset
   232
(* Name under which the remote variant of a prover is registered. *)
fun remotify_name name = "remote_" ^ name
38690
38a926e033ad make remote ATP versions more robust, by starting with "preferred" version numbers and falling back on any version
blanchet
parents: 38685
diff changeset
   233
(* Creates a (name, configuration) pair for a prover that is only available
   remotely. The name gets the "remote_" prefix; the remaining arguments are
   passed on to "remote_config" unchanged. *)
fun remote_prover name system_name system_versions proof_delims known_failures
                  default_max_relevant use_conjecture_for_hypotheses =
  let
    val config =
      remote_config system_name system_versions proof_delims known_failures
                    default_max_relevant use_conjecture_for_hypotheses
  in
    (remotify_name name, config)
  end
38690
38a926e033ad make remote ATP versions more robust, by starting with "preferred" version numbers and falling back on any version
blanchet
parents: 38685
diff changeset
   238
(* Turns a (name, configuration) pair into its remote counterpart: the name is
   prefixed via "remotify_name" and the configuration is converted via
   "remotify_config". *)
fun remotify_prover (name, config) system_name system_versions =
  (name, config)
  |>> remotify_name
  ||> remotify_config system_name system_versions
28592
824f8390aaa2 renamed AtpThread to AtpWrapper;
wenzelm
parents:
diff changeset
   240
38690
38a926e033ad make remote ATP versions more robust, by starting with "preferred" version numbers and falling back on any version
blanchet
parents: 38685
diff changeset
   241
(* Remote counterparts of the local provers. The version lists give the
   preferred versions, tried in the order listed. *)
val remote_e =
  let
    val preferred_versions = ["1.0", "1.1", "1.2"]
  in
    remotify_prover e "EP" preferred_versions
  end
val remote_vampire =
  let
    val preferred_versions = ["0.6", "9.0", "1.0"]
  in
    remotify_prover vampire "Vampire" preferred_versions
  end

(* Provers that are only offered remotely. Neither has preferred versions nor
   extra proof delimiters beyond what is listed here. *)
val remote_sine_e =
  let
    val failures = [(IncompleteUnprovable, "says Unknown")]
    val max_relevant = 800 (* FUDGE *)
  in
    remote_prover "sine_e" "SInE" [] [] failures max_relevant true
  end
val remote_snark =
  let
    (* the system name already carries the "---" separator *)
    val delims = [("refutation.", "end_refutation.")]
    val max_relevant = 250 (* FUDGE *)
  in
    remote_prover "snark" "SNARK---" [] delims [] max_relevant true
  end
38454
9043eefe8d71 detect old Vampire and give a nicer error message
blanchet
parents: 38433
diff changeset
   249
9043eefe8d71 detect old Vampire and give a nicer error message
blanchet
parents: 38433
diff changeset
   250
(* Setup *)
9043eefe8d71 detect old Vampire and give a nicer error message
blanchet
parents: 38433
diff changeset
   251
38092
81a003f7de0d speed up the minimizer by using the time taken for the first iteration as a timeout for the following iterations, and fix a subtle bug in "string_for_failure"
blanchet
parents: 38090
diff changeset
   252
(* A prover counts as installed if the environment variable named by the first
   component of its "exec" entry, and of every "required_execs" entry, has a
   non-empty value. *)
fun is_installed ({exec, required_execs, ...} : prover_config) =
  let
    fun has_setting (var, _) = getenv var <> ""
  in
    forall has_setting (exec :: required_execs)
  end
38041
3b80d6082131 remove "remote_spass" because there's no way to find out which clauses come from which facts + rename scripts
blanchet
parents: 38033
diff changeset
   254
(* Yields the prover's own name if it is installed, and the name of its remote
   variant otherwise. *)
fun maybe_remote (name, config) =
  if is_installed config then name else remotify_name name
36371
8c83ea1a7740 move the Sledgehammer menu options to "sledgehammer_isar.ML"
blanchet
parents: 36370
diff changeset
   256
39319
da4e98cb2005 change order of default ATPs;
blanchet
parents: 39263
diff changeset
   257
(* Computes the default value of the ATP list as a space-separated string.

   The first prover of the list is used by Auto Sledgehammer. Because of the
   low timeout, it makes sense to put SPASS first.

   Order: SPASS (only if installed), then E (local or remote), then Vampire,
   then remote SInE-E. Vampire is taken in its remote variant when both E and
   SPASS are installed; otherwise it is local if installed, else remote. *)
fun default_atps_param_value () =
  let
    val spass_names = if is_installed (snd spass) then [fst spass] else []
    val e_name = maybe_remote e
    val vampire_name =
      if is_installed (snd e) andalso is_installed (snd spass) then
        remotify_name (fst vampire)
      else
        maybe_remote vampire
    val sine_e_name = fst remote_sine_e
  in
    space_implode " " (spass_names @ [e_name, vampire_name, sine_e_name])
  end
36371
8c83ea1a7740 move the Sledgehammer menu options to "sledgehammer_isar.ML"
blanchet
parents: 36370
diff changeset
   267
38598
ce117ef51999 added remote SInE and remote SNARK
blanchet
parents: 38596
diff changeset
   268
(* All provers known to this module: the local ones first, followed by the
   remote ones. *)
val provers =
  [e, spass, vampire] @
  [remote_e, remote_vampire, remote_sine_e, remote_snark]

(* Setup step that adds every entry of "provers" via "add_prover". *)
val setup = fold add_prover provers
35867
16279c4c7a33 move all ATP setup code into ATP_Wrapper
blanchet
parents: 35865
diff changeset
   271
28592
824f8390aaa2 renamed AtpThread to AtpWrapper;
wenzelm
parents:
diff changeset
   272
end;