src/HOL/Tools/ATP/atp_systems.ML
author blanchet
Tue, 17 Aug 2010 18:14:50 +0200
changeset 38495 bb30e2f6fb0e
parent 38492 8a7ff1c25773
child 38519 0dabf05fc86b
permissions -rw-r--r--
tweaking
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
38047
9033c03cc214 consequence of directory renaming
blanchet
parents: 38046
diff changeset
     1
(*  Title:      HOL/Tools/ATP/atp_systems.ML
28592
824f8390aaa2 renamed AtpThread to AtpWrapper;
wenzelm
parents:
diff changeset
     2
    Author:     Fabian Immler, TU Muenchen
36371
8c83ea1a7740 move the Sledgehammer menu options to "sledgehammer_isar.ML"
blanchet
parents: 36370
diff changeset
     3
    Author:     Jasmin Blanchette, TU Muenchen
28592
824f8390aaa2 renamed AtpThread to AtpWrapper;
wenzelm
parents:
diff changeset
     4
36376
e83d52a52449 renamed module "ATP_Wrapper" to "ATP_Systems"
blanchet
parents: 36371
diff changeset
     5
Setup for supported ATPs.
28592
824f8390aaa2 renamed AtpThread to AtpWrapper;
wenzelm
parents:
diff changeset
     6
*)
824f8390aaa2 renamed AtpThread to AtpWrapper;
wenzelm
parents:
diff changeset
     7
36376
e83d52a52449 renamed module "ATP_Wrapper" to "ATP_Systems"
blanchet
parents: 36371
diff changeset
     8
(* Interface for ATP setup: failure classification, per-prover configuration
   records, and the table of named provers kept in the theory. *)
signature ATP_SYSTEMS =
sig
  (* Reasons why an ATP invocation can fail; "string_for_failure" gives the
     user-facing wording of each one. *)
  datatype failure =
    Unprovable
  | IncompleteUnprovable
  | CantConnect
  | TimedOut
  | OutOfResources
  | OldSpass
  | OldVampire
  | NoPerl
  | NoLibwwwPerl
  | MalformedInput
  | MalformedOutput
  | UnknownError

  (* Static description of one prover. *)
  type prover_config =
    {exec: string * string,
     required_execs: (string * string) list,
     arguments: bool -> Time.time -> string,
     proof_delims: (string * string) list,
     known_failures: (failure * string) list,
     max_new_relevant_facts_per_iter: int,
     prefers_theory_relevant: bool,
     explicit_forall: bool}

  (* failure reporting *)
  val string_for_failure: failure -> string
  val known_failure_in_output:
    string -> (failure * string) list -> failure option

  (* named provers *)
  val add_prover: string * prover_config -> theory -> theory
  val get_prover: theory -> string -> prover_config
  val available_atps: theory -> unit

  (* remote systems and theory setup *)
  val refresh_systems_on_tptp: unit -> unit
  val default_atps_param_value: unit -> string
  val setup: theory -> theory
end;
824f8390aaa2 renamed AtpThread to AtpWrapper;
wenzelm
parents:
diff changeset
    35
36376
e83d52a52449 renamed module "ATP_Wrapper" to "ATP_Systems"
blanchet
parents: 36371
diff changeset
    36
structure ATP_Systems : ATP_SYSTEMS =
28592
824f8390aaa2 renamed AtpThread to AtpWrapper;
wenzelm
parents:
diff changeset
    37
struct
28596
fcd463a6b6de tuned interfaces -- plain prover function, without thread;
wenzelm
parents: 28592
diff changeset
    38
38023
962b0a7f544b more refactoring
blanchet
parents: 38022
diff changeset
    39
(* prover configuration *)
32864
a226f29d4bdc re-organized signature of AtpWrapper structure: records instead of unnamed parameters and return values,
boehmes
parents: 32740
diff changeset
    40
38023
962b0a7f544b more refactoring
blanchet
parents: 38022
diff changeset
    41
(* Reasons why an ATP invocation can fail. The user-facing text for each
   constructor is produced by "string_for_failure". *)
datatype failure =
  Unprovable
| IncompleteUnprovable
| CantConnect
| TimedOut
| OutOfResources
| OldSpass
| OldVampire
| NoPerl
| NoLibwwwPerl
| MalformedInput
| MalformedOutput
| UnknownError
32864
a226f29d4bdc re-organized signature of AtpWrapper structure: records instead of unnamed parameters and return values,
boehmes
parents: 32740
diff changeset
    45
32941
72d48e333b77 eliminated extraneous wrapping of public records;
wenzelm
parents: 32936
diff changeset
    46
(* Static description of one prover.
   NOTE(review): judging from the configurations in this file, "exec" and
   "required_execs" look like (environment variable, executable) pairs, and
   the bool passed to "arguments" is named "complete" in the SPASS setup --
   confirm against the code that consumes these records. *)
type prover_config =
  {
    exec: string * string,
    required_execs: (string * string) list,
    arguments: bool -> Time.time -> string,
    (* pairs of (start, end) markers *)
    proof_delims: (string * string) list,
    (* output substrings and the failure each one stands for *)
    known_failures: (failure * string) list,
    max_new_relevant_facts_per_iter: int,
    prefers_theory_relevant: bool,
    explicit_forall: bool
  }
28596
fcd463a6b6de tuned interfaces -- plain prover function, without thread;
wenzelm
parents: 28592
diff changeset
    55
38061
685d1f0f75b3 handle Perl and "libwww-perl" failures more gracefully, giving the user some clues about what goes on
blanchet
parents: 38049
diff changeset
    56
(* Common ending of the "missing Perl / missing libwww-perl" messages; the
   name of the missing component is prepended by the caller. *)
val missing_message_tail =
  " appears to be missing. You will need to install it if you want to run " ^
  "ATPs remotely."
685d1f0f75b3 handle Perl and "libwww-perl" failures more gracefully, giving the user some clues about what goes on
blanchet
parents: 38049
diff changeset
    59
685d1f0f75b3 handle Perl and "libwww-perl" failures more gracefully, giving the user some clues about what goes on
blanchet
parents: 38049
diff changeset
    60
(* Maps a failure to the message shown to the user. *)
fun string_for_failure failure =
  (case failure of
    Unprovable => "The ATP problem is unprovable."
  | IncompleteUnprovable => "The ATP cannot prove the problem."
  | CantConnect => "Can't connect to remote server."
  | TimedOut => "Timed out."
  | OutOfResources => "The ATP ran out of resources."
  | OldSpass =>
      let
        (* The path is computed only when this message is actually needed. *)
        val components_path =
          Path.appends
            (Path.variable "ISABELLE_HOME_USER" ::
             map Path.basic ["etc", "components"])
          |> Path.expand
          |> Path.implode
      in
        "Isabelle requires a more recent version of SPASS with support for \
        \the TPTP syntax. To install it, download and extract the package \
        \\"http://isabelle.in.tum.de/dist/contrib/spass-3.7.tar.gz\" and add \
        \the \"spass-3.7\" directory's absolute path to " ^
        quote components_path ^
        " on a line of its own."
      end
  | OldVampire =>
      "Isabelle requires a more recent version of Vampire. To install it, \
      \follow the instructions from the Sledgehammer manual (\"isabelle doc \
      \sledgehammer\")."
  | NoPerl => "Perl" ^ missing_message_tail
  | NoLibwwwPerl => "The Perl module \"libwww-perl\"" ^ missing_message_tail
  | MalformedInput =>
      "The ATP problem is malformed. Please report this to the Isabelle \
      \developers."
  | MalformedOutput => "The ATP output is malformed."
  | UnknownError => "An unknown ATP error occurred.")
38061
685d1f0f75b3 handle Perl and "libwww-perl" failures more gracefully, giving the user some clues about what goes on
blanchet
parents: 38049
diff changeset
    87
685d1f0f75b3 handle Perl and "libwww-perl" failures more gracefully, giving the user some clues about what goes on
blanchet
parents: 38049
diff changeset
    88
(* Returns the failure of the first (failure, pattern) entry whose pattern
   occurs as a substring of the prover output, or NONE if no entry matches. *)
fun known_failure_in_output output known_failures =
  let
    fun matches (_, pattern) = String.isSubstring pattern output
  in
    (case find_first matches known_failures of
      SOME (failure, _) => SOME failure
    | NONE => NONE)
  end
685d1f0f75b3 handle Perl and "libwww-perl" failures more gracefully, giving the user some clues about what goes on
blanchet
parents: 38049
diff changeset
    91
685d1f0f75b3 handle Perl and "libwww-perl" failures more gracefully, giving the user some clues about what goes on
blanchet
parents: 38049
diff changeset
    92
(* Failure patterns tied to Perl / libwww-perl / HTTP problems; the SPASS
   configuration prepends them to its own patterns. *)
val known_perl_failures : (failure * string) list =
  [
    (CantConnect, "HTTP error"),
    (NoPerl, "env: perl"),
    (NoLibwwwPerl, "Can't locate HTTP")
  ]
28596
fcd463a6b6de tuned interfaces -- plain prover function, without thread;
wenzelm
parents: 28592
diff changeset
    96
38023
962b0a7f544b more refactoring
blanchet
parents: 38022
diff changeset
    97
(* named provers *)
38001
a9b47b85ca24 reintroduced more preprocessing steps to Sledgehammer, adapted to the new FOF setting
blanchet
parents: 38000
diff changeset
    98
38023
962b0a7f544b more refactoring
blanchet
parents: 38022
diff changeset
    99
(* Theory data: table from prover name to its configuration paired with a
   stamp. When two theories are merged, entries under the same name are
   compared by their stamps only ("eq_snd"); a conflicting pair is reported
   as a duplicate ATP. *)
structure Data = Theory_Data
(
  type T = (prover_config * stamp) Symtab.table
  val empty = Symtab.empty
  val extend = I
  fun merge (tab1, tab2) : T =
    Symtab.merge (eq_snd (op =)) (tab1, tab2)
    handle Symtab.DUP dup => error ("Duplicate ATP: " ^ quote dup ^ ".")
)
38017
3ad3e3ca2451 move Sledgehammer-specific code out of "Sledgehammer_TPTP_Format"
blanchet
parents: 38015
diff changeset
   107
38023
962b0a7f544b more refactoring
blanchet
parents: 38022
diff changeset
   108
(* Registers a prover configuration under the given name, tagging it with a
   fresh stamp. Fails with "Duplicate ATP" if the name is already taken. *)
fun add_prover (name, config) thy =
  let
    val entry = (name, (config, stamp ()))
  in
    Data.map (Symtab.update_new entry) thy
  end
  handle Symtab.DUP dup => error ("Duplicate ATP: " ^ quote dup ^ ".")
38017
3ad3e3ca2451 move Sledgehammer-specific code out of "Sledgehammer_TPTP_Format"
blanchet
parents: 38015
diff changeset
   111
38023
962b0a7f544b more refactoring
blanchet
parents: 38022
diff changeset
   112
(* Looks up the configuration registered under "name" in the theory's prover
   table. Fails with an "Unknown ATP" error if no such prover exists; the
   name is quoted in the message, like in the "Duplicate ATP" errors, so that
   empty or odd names remain readable. *)
fun get_prover thy name =
  (case Symtab.lookup (Data.get thy) name of
    SOME (config, _) => config
  | NONE => error ("Unknown ATP: " ^ quote name ^ "."))
37962
d7dbe01f48d7 keep track of clause numbers for SPASS now that we generate FOF rather than CNF problems;
blanchet
parents: 37926
diff changeset
   115
38023
962b0a7f544b more refactoring
blanchet
parents: 38022
diff changeset
   116
(* Prints the alphabetically sorted, comma-separated names of all provers
   registered in the theory. (The verbatim second copy of this definition,
   which merely shadowed the first, has been dropped.) *)
fun available_atps thy =
  priority ("Available ATPs: " ^
            commas (sort_strings (Symtab.keys (Data.get thy))) ^ ".")
28596
fcd463a6b6de tuned interfaces -- plain prover function, without thread;
wenzelm
parents: 28592
diff changeset
   123
36382
b90fc0d75bca cosmetics
blanchet
parents: 36377
diff changeset
   124
(* Converts a time to whole seconds, rounding up any started second. *)
fun to_generous_secs time =
  let
    val millis = Time.toMilliseconds time
  in
    (millis + 999) div 1000
  end
36142
f5e15e9aae10 make Sledgehammer "minimize" output less confusing + round up (not down) time limits to nearest second
blanchet
parents: 36064
diff changeset
   125
28596
fcd463a6b6de tuned interfaces -- plain prover function, without thread;
wenzelm
parents: 28592
diff changeset
   126
(* E prover *)
fcd463a6b6de tuned interfaces -- plain prover function, without thread;
wenzelm
parents: 28592
diff changeset
   127
36369
d2cd0d04b8e6 handle ATP proof delimiters in a cleaner, more extensible fashion
blanchet
parents: 36289
diff changeset
   128
(* Pair of (start, end) markers used as the E configuration's only
   "proof_delims" entry. *)
val tstp_proof_delims =
  let
    val start_marker = "# SZS output start CNFRefutation."
    val end_marker = "# SZS output end CNFRefutation"
  in
    (start_marker, end_marker)
  end
d2cd0d04b8e6 handle ATP proof delimiters in a cleaner, more extensible fashion
blanchet
parents: 36289
diff changeset
   130
35969
c9565298df9e added support for Sledgehammer parameters;
blanchet
parents: 35869
diff changeset
   131
(* Configuration of the E prover. *)
val e_config : prover_config =
  let
    (* The bool argument is ignored; the time limit is handed over in whole
       seconds, rounded up by "to_generous_secs". *)
    fun e_arguments _ timeout =
      "--tstp-in --tstp-out -l5 -xAutoDev -tAutoDev --silent --cpu-limit=" ^
      string_of_int (to_generous_secs timeout)

    (* Output substrings and the failure each one stands for. *)
    val e_known_failures =
      [(Unprovable, "SZS status: CounterSatisfiable"),
       (Unprovable, "SZS status CounterSatisfiable"),
       (TimedOut, "Failure: Resource limit exceeded (time)"),
       (TimedOut, "time limit exceeded"),
       (OutOfResources,
        "# Cannot determine problem status within resource limit"),
       (OutOfResources, "SZS status: ResourceOut"),
       (OutOfResources, "SZS status ResourceOut")]
  in
    {exec = ("E_HOME", "eproof"),
     required_execs = [],
     arguments = e_arguments,
     proof_delims = [tstp_proof_delims],
     known_failures = e_known_failures,
     max_new_relevant_facts_per_iter = 50 (* FIXME *),
     prefers_theory_relevant = false,
     explicit_forall = false}
  end
38454
9043eefe8d71 detect old Vampire and give a nicer error message
blanchet
parents: 38433
diff changeset
   150
38023
962b0a7f544b more refactoring
blanchet
parents: 38022
diff changeset
   151
(* Name/configuration pair for E, in the shape taken by "add_prover". *)
val e : string * prover_config = ("e", e_config)
28596
fcd463a6b6de tuned interfaces -- plain prover function, without thread;
wenzelm
parents: 28592
diff changeset
   152
fcd463a6b6de tuned interfaces -- plain prover function, without thread;
wenzelm
parents: 28592
diff changeset
   153
36219
16670b4f0baa set SPASS option on the command-line, so that it doesn't vanish when moving to TPTP format
blanchet
parents: 36190
diff changeset
   154
(* Configuration of SPASS.
   The "-VarWeight=3" option helps the higher-order problems, probably by
   counteracting the presence of "hAPP". *)
val spass_config : prover_config =
  let
    (* Halving the (rounded-up) time limit accounts for the fact that SPASS
       is often run twice. "-SOS=1" is prepended unless "complete" is set. *)
    fun spass_arguments complete timeout =
      let
        val time_limit = (to_generous_secs timeout + 1) div 2
        val base_arguments =
          "-Auto -PGiven=0 -PProblem=0 -Splits=0 -FullRed=0 -DocProof \
          \-VarWeight=3 -TimeLimit=" ^ string_of_int time_limit
      in
        if complete then base_arguments else "-SOS=1 " ^ base_arguments
      end

    (* SPASS-specific output substrings and the failure each stands for. *)
    val spass_failures =
      [(IncompleteUnprovable, "SPASS beiseite: Completion found"),
       (TimedOut, "SPASS beiseite: Ran out of time"),
       (OutOfResources, "SPASS beiseite: Maximal number of loops exceeded"),
       (MalformedInput, "Undefined symbol"),
       (MalformedInput, "Free Variable"),
       (OldSpass, "tptp2dfg")]
  in
    {exec = ("ISABELLE_ATP", "scripts/spass"),
     required_execs = [("SPASS_HOME", "SPASS")],
     arguments = spass_arguments,
     proof_delims = [("Here is a proof", "Formulae used in the proof")],
     known_failures = known_perl_failures @ spass_failures,
     max_new_relevant_facts_per_iter = 35 (* FIXME *),
     prefers_theory_relevant = true,
     explicit_forall = true}
  end
38454
9043eefe8d71 detect old Vampire and give a nicer error message
blanchet
parents: 38433
diff changeset
   177
38023
962b0a7f544b more refactoring
blanchet
parents: 38022
diff changeset
   178
(* Name/configuration pair for SPASS, in the shape taken by "add_prover". *)
val spass : string * prover_config = ("spass", spass_config)
28596
fcd463a6b6de tuned interfaces -- plain prover function, without thread;
wenzelm
parents: 28592
diff changeset
   179
38454
9043eefe8d71 detect old Vampire and give a nicer error message
blanchet
parents: 38433
diff changeset
   180
37509
f39464d971c4 factor out TPTP format output into file of its own, to facilitate further changes
blanchet
parents: 37506
diff changeset
   181
(* Vampire *)
f39464d971c4 factor out TPTP format output into file of its own, to facilitate further changes
blanchet
parents: 37506
diff changeset
   182
f39464d971c4 factor out TPTP format output into file of its own, to facilitate further changes
blanchet
parents: 37506
diff changeset
   183
(* Configuration of Vampire. *)
val vampire_config : prover_config =
  let
    (* The bool argument is ignored; the time limit is handed over in whole
       seconds, rounded up by "to_generous_secs". *)
    fun vampire_arguments _ timeout =
      "--mode casc -t " ^ string_of_int (to_generous_secs timeout) ^
      " --input_file"

    (* Three alternative pairs of (start, end) markers. *)
    val vampire_proof_delims =
      [("=========== Refutation ==========",
        "======= End of refutation ======="),
       ("% SZS output start Refutation", "% SZS output end Refutation"),
       ("% SZS output start Proof", "% SZS output end Proof")]

    (* Output substrings and the failure each one stands for. *)
    val vampire_failures =
      [(Unprovable, "UNPROVABLE"),
       (IncompleteUnprovable, "CANNOT PROVE"),
       (TimedOut, "SZS status Timeout"),
       (Unprovable, "Satisfiability detected"),
       (OutOfResources, "Refutation not found"),
       (OldVampire, "not a valid option")]
  in
    {exec = ("VAMPIRE_HOME", "vampire"),
     required_execs = [],
     arguments = vampire_arguments,
     proof_delims = vampire_proof_delims,
     known_failures = vampire_failures,
     max_new_relevant_facts_per_iter = 45 (* FIXME *),
     prefers_theory_relevant = false,
     explicit_forall = false}
  end
38454
9043eefe8d71 detect old Vampire and give a nicer error message
blanchet
parents: 38433
diff changeset
   204
38023
962b0a7f544b more refactoring
blanchet
parents: 38022
diff changeset
   205
(* Named prover entry: the prover name "vampire" paired with vampire_config. *)
val vampire = ("vampire", vampire_config)
37509
f39464d971c4 factor out TPTP format output into file of its own, to facilitate further changes
blanchet
parents: 37506
diff changeset
   206
38454
9043eefe8d71 detect old Vampire and give a nicer error message
blanchet
parents: 38433
diff changeset
   207
37509
f39464d971c4 factor out TPTP format output into file of its own, to facilitate further changes
blanchet
parents: 37506
diff changeset
   208
(* Remote prover invocation via SystemOnTPTP *)
28596
fcd463a6b6de tuned interfaces -- plain prover function, without thread;
wenzelm
parents: 28592
diff changeset
   209
38061
685d1f0f75b3 handle Perl and "libwww-perl" failures more gracefully, giving the user some clues about what goes on
blanchet
parents: 38049
diff changeset
   210
(* Synchronized variable holding a list of system names (strings).  It starts
   out empty; get_system fills it on demand via get_systems, and
   refresh_systems_on_tptp overwrites it. *)
val systems = Synchronized.var "atp_systems" ([] : string list)
31835
b686d4df54c2 check for current versions on server
immler@in.tum.de
parents: 31832
diff changeset
   211
b686d4df54c2 check for current versions on server
immler@in.tum.de
parents: 31832
diff changeset
   212
(* Runs the "remote_atp" script with option "-w" (stderr merged into stdout)
   and inspects its exit code:
     - exit code 0: the output is split into lines and returned;
     - any other code: an error is raised.  The message is the description of
       the matching entry of known_perl_failures if the output contains one;
       otherwise it is the raw output with one trailing newline removed (if
       present) and a "." appended. *)
fun get_systems () =
38061
685d1f0f75b3 handle Perl and "libwww-perl" failures more gracefully, giving the user some clues about what goes on
blanchet
parents: 38049
diff changeset
   213
  case bash_output "\"$ISABELLE_ATP/scripts/remote_atp\" -w 2>&1" of
36370
a4f601daa175 centralized ATP-specific error handling in "atp_wrapper.ML"
blanchet
parents: 36369
diff changeset
   214
    (answer, 0) => split_lines answer
a4f601daa175 centralized ATP-specific error handling in "atp_wrapper.ML"
blanchet
parents: 36369
diff changeset
   215
  | (answer, _) =>
38065
9069e1ad1527 improved ATP error handling some more
blanchet
parents: 38064
diff changeset
   216
    error (case known_failure_in_output answer known_perl_failures of
9069e1ad1527 improved ATP error handling some more
blanchet
parents: 38064
diff changeset
   217
             SOME failure => string_for_failure failure
9069e1ad1527 improved ATP error handling some more
blanchet
parents: 38064
diff changeset
   218
           | NONE => perhaps (try (unsuffix "\n")) answer ^ ".")
31835
b686d4df54c2 check for current versions on server
immler@in.tum.de
parents: 31832
diff changeset
   219
35867
16279c4c7a33 move all ATP setup code into ATP_Wrapper
blanchet
parents: 35865
diff changeset
   220
(* Unconditionally replaces the contents of "systems" with a fresh result of
   get_systems; the previous contents are ignored. *)
fun refresh_systems_on_tptp () =
37509
f39464d971c4 factor out TPTP format output into file of its own, to facilitate further changes
blanchet
parents: 37506
diff changeset
   221
  Synchronized.change systems (fn _ => get_systems ())
31835
b686d4df54c2 check for current versions on server
immler@in.tum.de
parents: 31832
diff changeset
   222
b686d4df54c2 check for current versions on server
immler@in.tum.de
parents: 31832
diff changeset
   223
(* Looks up the first system name that starts with "prefix".  The lookup runs
   inside Synchronized.change_result on "systems": if the stored list is empty
   it is first obtained from get_systems, otherwise the stored list is used.
   The backquote combinator pairs the find_first result (an option) with the
   list, so the option is returned to the caller and the list is stored back
   into "systems".  An empty list is never treated as cached, so get_systems
   is called again on the next lookup. *)
fun get_system prefix = Synchronized.change_result systems (fn systems =>
32864
a226f29d4bdc re-organized signature of AtpWrapper structure: records instead of unnamed parameters and return values,
boehmes
parents: 32740
diff changeset
   224
  (if null systems then get_systems () else systems)
32942
b6711ec9de26 misc tuning and recovery of Isabelle coding style;
wenzelm
parents: 32941
diff changeset
   225
  |> `(find_first (String.isPrefix prefix)));
32864
a226f29d4bdc re-organized signature of AtpWrapper structure: records instead of unnamed parameters and return values,
boehmes
parents: 32740
diff changeset
   226
32948
e95a4be101a8 natural argument order for prover;
wenzelm
parents: 32944
diff changeset
   227
(* Like get_system, but total: returns the matching system name itself and
   raises an error naming the (quoted) prefix when get_system finds none. *)
fun the_system prefix =
32864
a226f29d4bdc re-organized signature of AtpWrapper structure: records instead of unnamed parameters and return values,
boehmes
parents: 32740
diff changeset
   228
  (case get_system prefix of
37509
f39464d971c4 factor out TPTP format output into file of its own, to facilitate further changes
blanchet
parents: 37506
diff changeset
   229
    NONE => error ("System " ^ quote prefix ^ " not available at SystemOnTPTP.")
32942
b6711ec9de26 misc tuning and recovery of Isabelle coding style;
wenzelm
parents: 32941
diff changeset
   230
  | SOME sys => sys);
31835
b686d4df54c2 check for current versions on server
immler@in.tum.de
parents: 31832
diff changeset
   231
38041
3b80d6082131 remove "remote_spass" because there's no way to find out which clauses come from which facts + rename scripts
blanchet
parents: 38033
diff changeset
   232
(* Builds the prover_config of a remote prover from the config of an existing
   prover and a system-name prefix "atp_prefix":
     - exec is the "scripts/remote_atp" script under ISABELLE_ATP, and no
       further executables are required;
     - arguments ignores its first parameter and yields
       " -t <secs> -s <system>", where <secs> is to_generous_secs applied to
       the timeout and <system> is the_system atp_prefix.  The system is
       resolved inside the function body, i.e. only when the arguments are
       actually computed, and may raise an error at that point;
     - proof_delims are those of the given config with tstp_proof_delims
       inserted (unless already present);
     - known_failures are those of the given config followed by
       known_perl_failures and a TimedOut entry for "says Timeout";
     - max_new_relevant_facts_per_iter and prefers_theory_relevant are copied
       unchanged;
     - explicit_forall is always true, whatever the given config says. *)
fun remote_config atp_prefix
38009
34e1ac9cb71d shrink the "max_new_relevant_facts_per_iter" fudge factors, now that we count formulas and not clauses
blanchet
parents: 38005
diff changeset
   233
        ({proof_delims, known_failures, max_new_relevant_facts_per_iter,
38433
1e28e2e1c2fb Geoff's formatter now needs closed formulas
blanchet
parents: 38281
diff changeset
   234
          prefers_theory_relevant, ...} : prover_config) : prover_config =
38092
81a003f7de0d speed up the minimizer by using the time taken for the first iteration as a timeout for the following iterations, and fix a subtle bug in "string_for_failure"
blanchet
parents: 38090
diff changeset
   235
  {exec = ("ISABELLE_ATP", "scripts/remote_atp"),
81a003f7de0d speed up the minimizer by using the time taken for the first iteration as a timeout for the following iterations, and fix a subtle bug in "string_for_failure"
blanchet
parents: 38090
diff changeset
   236
   required_execs = [],
37514
b147d01b8ebc if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents: 37509
diff changeset
   237
   arguments = fn _ => fn timeout =>
38041
3b80d6082131 remove "remote_spass" because there's no way to find out which clauses come from which facts + rename scripts
blanchet
parents: 38033
diff changeset
   238
     " -t " ^ string_of_int (to_generous_secs timeout) ^ " -s " ^
36382
b90fc0d75bca cosmetics
blanchet
parents: 36377
diff changeset
   239
     the_system atp_prefix,
36369
d2cd0d04b8e6 handle ATP proof delimiters in a cleaner, more extensible fashion
blanchet
parents: 36289
diff changeset
   240
   proof_delims = insert (op =) tstp_proof_delims proof_delims,
38061
685d1f0f75b3 handle Perl and "libwww-perl" failures more gracefully, giving the user some clues about what goes on
blanchet
parents: 38049
diff changeset
   241
   known_failures =
685d1f0f75b3 handle Perl and "libwww-perl" failures more gracefully, giving the user some clues about what goes on
blanchet
parents: 38049
diff changeset
   242
     known_failures @ known_perl_failures @
38094
d01b8119b2e0 better error and minimizer output
blanchet
parents: 38092
diff changeset
   243
     [(TimedOut, "says Timeout")],
38009
34e1ac9cb71d shrink the "max_new_relevant_facts_per_iter" fudge factors, now that we count formulas and not clauses
blanchet
parents: 38005
diff changeset
   244
   max_new_relevant_facts_per_iter = max_new_relevant_facts_per_iter,
37994
b04307085a09 make TPTP generator accept full first-order formulas
blanchet
parents: 37989
diff changeset
   245
   prefers_theory_relevant = prefers_theory_relevant,
38433
1e28e2e1c2fb Geoff's formatter now needs closed formulas
blanchet
parents: 38281
diff changeset
   246
   explicit_forall = true}
28596
fcd463a6b6de tuned interfaces -- plain prover function, without thread;
wenzelm
parents: 28592
diff changeset
   247
38023
962b0a7f544b more refactoring
blanchet
parents: 38022
diff changeset
   248
(* Maps a prover name to the name of its remote counterpart by prepending
   "remote_", e.g. "e" becomes "remote_e". *)
fun remote_name name = "remote_" ^ name
38041
3b80d6082131 remove "remote_spass" because there's no way to find out which clauses come from which facts + rename scripts
blanchet
parents: 38033
diff changeset
   249
(* Derives a remote prover entry from an existing (name, config) pair: the
   name is passed through remote_name and the config through remote_config
   with the given system-name prefix. *)
fun remote_prover (name, config) atp_prefix =
3b80d6082131 remove "remote_spass" because there's no way to find out which clauses come from which facts + rename scripts
blanchet
parents: 38033
diff changeset
   250
  (remote_name name, remote_config atp_prefix config)
38023
962b0a7f544b more refactoring
blanchet
parents: 38022
diff changeset
   251
38041
3b80d6082131 remove "remote_spass" because there's no way to find out which clauses come from which facts + rename scripts
blanchet
parents: 38033
diff changeset
   252
(* Remote variant of "e"; the remote system is the first known system name
   that starts with "EP---". *)
val remote_e = remote_prover e "EP---"
3b80d6082131 remove "remote_spass" because there's no way to find out which clauses come from which facts + rename scripts
blanchet
parents: 38033
diff changeset
   253
(* Remote variant of "vampire"; the remote system is the first known system
   name that starts with "Vampire---9". *)
val remote_vampire = remote_prover vampire "Vampire---9"
28592
824f8390aaa2 renamed AtpThread to AtpWrapper;
wenzelm
parents:
diff changeset
   254
38454
9043eefe8d71 detect old Vampire and give a nicer error message
blanchet
parents: 38433
diff changeset
   255
9043eefe8d71 detect old Vampire and give a nicer error message
blanchet
parents: 38433
diff changeset
   256
(* Setup *)
9043eefe8d71 detect old Vampire and give a nicer error message
blanchet
parents: 38433
diff changeset
   257
38092
81a003f7de0d speed up the minimizer by using the time taken for the first iteration as a timeout for the following iterations, and fix a subtle bug in "string_for_failure"
blanchet
parents: 38090
diff changeset
   258
(* A prover counts as installed iff, for "exec" and for every entry of
   "required_execs", getenv applied to the first component of the pair
   (the environment variable name) yields a non-empty string.  Only the
   variables are checked here, not the files they point to.
   NOTE(review): presumably getenv returns "" for an unset variable -- confirm. *)
fun is_installed ({exec, required_execs, ...} : prover_config) =
81a003f7de0d speed up the minimizer by using the time taken for the first iteration as a timeout for the following iterations, and fix a subtle bug in "string_for_failure"
blanchet
parents: 38090
diff changeset
   259
  forall (curry (op <>) "" o getenv o fst) (exec :: required_execs)
38041
3b80d6082131 remove "remote_spass" because there's no way to find out which clauses come from which facts + rename scripts
blanchet
parents: 38033
diff changeset
   260
(* Returns the prover's name unchanged if its config passes is_installed,
   and the remote_name of that name otherwise. *)
fun maybe_remote (name, config) =
3b80d6082131 remove "remote_spass" because there's no way to find out which clauses come from which facts + rename scripts
blanchet
parents: 38033
diff changeset
   261
  name |> not (is_installed config) ? remote_name
36371
8c83ea1a7740 move the Sledgehammer menu options to "sledgehammer_isar.ML"
blanchet
parents: 36370
diff changeset
   262
8c83ea1a7740 move the Sledgehammer menu options to "sledgehammer_isar.ML"
blanchet
parents: 36370
diff changeset
   263
(* Computes a space-separated list of prover names, in this order:
     1. "e", or its remote name if "e" is not installed;
     2. the name of "spass", only if it is installed (otherwise omitted);
     3. the remote name of "vampire", regardless of any local installation. *)
fun default_atps_param_value () =
38041
3b80d6082131 remove "remote_spass" because there's no way to find out which clauses come from which facts + rename scripts
blanchet
parents: 38033
diff changeset
   264
  space_implode " " ([maybe_remote e] @
3b80d6082131 remove "remote_spass" because there's no way to find out which clauses come from which facts + rename scripts
blanchet
parents: 38033
diff changeset
   265
                     (if is_installed (snd spass) then [fst spass] else []) @
3b80d6082131 remove "remote_spass" because there's no way to find out which clauses come from which facts + rename scripts
blanchet
parents: 38033
diff changeset
   266
                     [remote_name (fst vampire)])
36371
8c83ea1a7740 move the Sledgehammer menu options to "sledgehammer_isar.ML"
blanchet
parents: 36370
diff changeset
   267
38041
3b80d6082131 remove "remote_spass" because there's no way to find out which clauses come from which facts + rename scripts
blanchet
parents: 38033
diff changeset
   268
(* All prover entries defined in this file: three base provers followed by the
   remote variants of "e" and "vampire". *)
val provers = [e, spass, vampire, remote_e, remote_vampire]
38023
962b0a7f544b more refactoring
blanchet
parents: 38022
diff changeset
   269
(* Setup function: folds add_prover over every entry of "provers". *)
val setup = fold add_prover provers
35867
16279c4c7a33 move all ATP setup code into ATP_Wrapper
blanchet
parents: 35865
diff changeset
   270
28592
824f8390aaa2 renamed AtpThread to AtpWrapper;
wenzelm
parents:
diff changeset
   271
end;