src/HOL/Tools/ATP/atp_proof.ML
author blanchet
Mon, 14 May 2012 15:54:26 +0200
changeset 47919 1be466c58a26
parent 47917 b287682bf917
child 47921 fc26d5538868
permissions -rw-r--r--
repaired snag in debug function
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
39452
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
     1
(*  Title:      HOL/Tools/ATP/atp_proof.ML
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
     2
    Author:     Lawrence C. Paulson, Cambridge University Computer Laboratory
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
     3
    Author:     Claire Quigley, Cambridge University Computer Laboratory
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
     4
    Author:     Jasmin Blanchette, TU Muenchen
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
     5
42876
e336ef6313aa more informative message when Sledgehammer finds an unsound proof
blanchet
parents: 42848
diff changeset
     6
Abstract representation of ATP proofs and TSTP/SPASS syntax.
39452
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
     7
*)
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
     8
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
     9
(* Interface of the ATP proof module: failure classification, extraction of
   proof text and error information from raw prover output, and the abstract
   proof representation. *)
signature ATP_PROOF =
sig
  (* Re-exported abbreviations for the corresponding ATP_Problem types. *)
  type ('a, 'b) ho_term = ('a, 'b) ATP_Problem.ho_term
  type ('a, 'b, 'c) formula = ('a, 'b, 'c) ATP_Problem.formula
  type 'a problem = 'a ATP_Problem.problem

  (* Carries no payload. NOTE(review): judging by the name, raised when prover
     output cannot be recognized as a proof -- confirm at the raise sites. *)
  exception UNRECOGNIZED_ATP_PROOF of unit

  (* Ways in which a prover invocation can fail; "string_for_failure" gives the
     user-facing wording for each constructor. *)
  datatype failure =
    Unprovable |
    GaveUp |
    ProofMissing |
    ProofIncomplete |
    UnsoundProof of bool * string list |
    CantConnect |
    TimedOut |
    Inappropriate |
    OutOfResources |
    NoPerl |
    NoLibwwwPerl |
    MalformedInput |
    MalformedOutput |
    Interrupted |
    Crashed |
    InternalError |
    UnknownError of string

  (* A step name is an identifier string paired with a list of strings;
     "is_same_atp_step" looks at the identifier only. *)
  type step_name = string * string list

  (* A proof step, parameterized over the payload type 'a. *)
  datatype 'a step =
    Definition_Step of step_name * 'a * 'a |
    Inference_Step of step_name * 'a * string * step_name list

  (* A proof is a list of steps whose payloads are formulas over 'a. *)
  type 'a proof = ('a, 'a, ('a, 'a) ho_term) formula step list

  (* "short_output verbose output": "" unless "verbose" is set; otherwise the
     output elided to about 1000 characters, or "No details available" if the
     output is empty. *)
  val short_output : bool -> string -> string
  (* User-facing English message for a failure. *)
  val string_for_failure : failure -> string
  (* Quoted text found between the "% SZS start RequiredInformation" and
     "% SZS end RequiredInformation" markers of the output, or "" if none. *)
  val extract_important_message : string -> string
  (* First failure in the list whose pattern string occurs in the output. *)
  val extract_known_failure :
    (failure * string) list -> string -> failure option
  (* Arguments, in order: verbose flag, completeness flag, proof delimiter
     pairs, known failures, prover output. Returns the extracted proof text
     (possibly "") together with an optional failure. *)
  val extract_tstplike_proof_and_outcome :
    bool -> bool -> (string * string) list -> (failure * string) list -> string
    -> string * failure option
  (* True iff the two step names have equal identifier components. *)
  val is_same_atp_step : step_name -> step_name -> bool
  (* NOTE(review): the implementations of the remaining entries are not part of
     the code documented here; their types suggest token-list scanners
     ("scan_general_id", "parse_formula") and proof construction and
     transformation functions -- confirm against the definitions. *)
  val scan_general_id : string list -> string * string list
  val parse_formula :
    string list -> (string, 'a, (string, 'a) ho_term) formula * string list
  val atp_proof_from_tstplike_proof :
    string problem -> string -> string -> string proof
  val clean_up_atp_proof_dependencies : string proof -> string proof
  val map_term_names_in_atp_proof :
    (string -> string) -> string proof -> string proof
  val nasty_atp_proof : string Symtab.table -> string proof -> string proof
end;
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
    63
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
    64
structure ATP_Proof : ATP_PROOF =
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
    65
struct
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
    66
43085
0a2f5b86bdd7 first step in sharing more code between ATP and Metis translation
blanchet
parents: 43050
diff changeset
    67
open ATP_Util
39491
2416666e6f94 refactoring: move ATP proof and error extraction code to "ATP_Proof" module
blanchet
parents: 39457
diff changeset
    68
open ATP_Problem
2416666e6f94 refactoring: move ATP proof and error extraction code to "ATP_Proof" module
blanchet
parents: 39457
diff changeset
    69
42965
1403595ec38c slightly gracefuller handling of LEO-II and Satallax output
blanchet
parents: 42962
diff changeset
    70
(* Carries no payload. NOTE(review): judging by the name, raised when prover
   output cannot be recognized as a proof -- confirm at the raise sites. *)
exception UNRECOGNIZED_ATP_PROOF of unit
1403595ec38c slightly gracefuller handling of LEO-II and Satallax output
blanchet
parents: 42962
diff changeset
    71
39491
2416666e6f94 refactoring: move ATP proof and error extraction code to "ATP_Proof" module
blanchet
parents: 39457
diff changeset
    72
(* Ways in which a prover invocation can fail. The remarks below paraphrase
   the messages produced by "string_for_failure". *)
datatype failure =
  Unprovable | (* the generated problem is unprovable *)
  GaveUp | (* the prover gave up *)
  ProofMissing | (* theorem claimed, but no proof was provided *)
  ProofIncomplete | (* theorem claimed, but proof incomplete or unparsable *)
  (* A type-unsound proof was found. The flag is true when a supposedly
     type-sound encoding was in use; the strings are quoted in the message. *)
  UnsoundProof of bool * string list |
  CantConnect | (* cannot connect to the remote server *)
  TimedOut | (* timed out *)
  Inappropriate | (* the problem lies outside the prover's scope *)
  OutOfResources | (* the prover ran out of resources *)
  NoPerl | (* Perl appears to be missing *)
  NoLibwwwPerl | (* the Perl module "libwww-perl" appears to be missing *)
  MalformedInput | (* the generated problem is malformed *)
  MalformedOutput | (* the prover output is malformed *)
  Interrupted | (* the prover was interrupted *)
  Crashed | (* the prover crashed *)
  InternalError | (* an internal prover error occurred *)
  UnknownError of string (* any other error; the string holds details or "" *)
39491
2416666e6f94 refactoring: move ATP proof and error extraction code to "ATP_Proof" module
blanchet
parents: 39457
diff changeset
    90
41259
13972ced98d9 more precise error messages in "verbose" (or "debug") mode, following this morning's permission debacle
blanchet
parents: 41222
diff changeset
    91
(* Shortens "s" to roughly "threshold" characters by keeping a prefix and a
   suffix and replacing the middle with " ...... ". Strings no longer than
   "threshold" are returned unchanged.

   The slice bounds are clamped: for thresholds below 11 the unclamped
   arithmetic would ask for a negative prefix length or for a suffix starting
   past the end of "s", and "String.extract" would raise Subscript. With
   clamping such thresholds simply yield empty slices. Results for larger
   thresholds are unaffected. *)
fun elide_string threshold s =
  let val len = size s in
    if len > threshold then
      let
        (* number of leading characters to keep; never negative *)
        val head_len = Int.max (0, threshold div 2 - 5)
        (* index of the first trailing character to keep; never past the end *)
        val tail_start = Int.min (len, len - (threshold + 1) div 2 + 6)
      in
        String.extract (s, 0, SOME head_len) ^ " ...... " ^
        String.extract (s, tail_start, NONE)
      end
    else
      s
  end
13972ced98d9 more precise error messages in "verbose" (or "debug") mode, following this morning's permission debacle
blanchet
parents: 41222
diff changeset
    97
(* Condensed prover output for error messages: nothing unless the verbose flag
   is set, a placeholder for empty output, and otherwise the output elided to
   about 1000 characters. *)
fun short_output false _ = ""
  | short_output true "" = "No details available"
  | short_output true output = elide_string 1000 output
41259
13972ced98d9 more precise error messages in "verbose" (or "debug") mode, following this morning's permission debacle
blanchet
parents: 41222
diff changeset
   102
41744
a18e7bbca258 make minimizer verbose
blanchet
parents: 41738
diff changeset
   103
(* Shared ending of the messages that "string_for_failure" produces for the
   NoPerl and NoLibwwwPerl failures. *)
val missing_message_tail =
  " appears to be missing. You will need to install it if you want to invoke \
  \remote provers."
39491
2416666e6f94 refactoring: move ATP proof and error extraction code to "ATP_Proof" module
blanchet
parents: 39457
diff changeset
   106
42876
e336ef6313aa more informative message when Sledgehammer finds an unsound proof
blanchet
parents: 42848
diff changeset
   107
(* Builds the optional "involving ..." fragment of the unsound-proof messages:
   empty for no names, otherwise the quoted names joined with commas and "and",
   followed by a trailing space. *)
fun involving ss =
  if null ss then
    ""
  else
    let
      val quoted_names = map quote ss
      val enumeration = space_implode " " (Try.serial_commas "and" quoted_names)
    in
      "involving " ^ enumeration ^ " "
    end
42876
e336ef6313aa more informative message when Sledgehammer finds an unsound proof
blanchet
parents: 42848
diff changeset
   111
47506
da72e05849ef more helpful error message
blanchet
parents: 46451
diff changeset
   112
(* Maps each failure to the English message shown to the user. *)
fun string_for_failure failure =
  case failure of
    Unprovable => "The generated problem is unprovable."
  | GaveUp => "The prover gave up."
  | ProofMissing =>
    "The prover claims the conjecture is a theorem but did not provide a proof."
  | ProofIncomplete =>
    "The prover claims the conjecture is a theorem but provided an incomplete \
    \(or unparsable) proof."
  | UnsoundProof (supposedly_sound, ss) =>
    (* Both variants share the same opening; only the advice differs. *)
    "The prover found a type-unsound proof " ^ involving ss ^
    (if supposedly_sound then
       "even though a supposedly type-sound encoding was used (or, less likely, \
       \your axioms are inconsistent). Please report this to the Isabelle \
       \developers."
     else
       "(or, less likely, your axioms are inconsistent). Specify a sound type \
       \encoding or omit the \"type_enc\" option.")
  | CantConnect => "Cannot connect to remote server."
  | TimedOut => "Timed out."
  | Inappropriate => "The generated problem lies outside the prover's scope."
  | OutOfResources => "The prover ran out of resources."
  | NoPerl => "Perl" ^ missing_message_tail
  | NoLibwwwPerl => "The Perl module \"libwww-perl\"" ^ missing_message_tail
  | MalformedInput =>
    "The generated problem is malformed. Please report this to the Isabelle \
    \developers."
  | MalformedOutput => "The prover output is malformed."
  | Interrupted => "The prover was interrupted."
  | Crashed => "The prover crashed."
  | InternalError => "An internal prover error occurred."
  | UnknownError details =>
    (* Without details, point the user at the "verbose" option instead. *)
    "A prover error occurred" ^
    (if details = "" then ". (Pass the \"verbose\" option for details.)"
     else ":\n" ^ details)
39491
2416666e6f94 refactoring: move ATP proof and error extraction code to "ATP_Proof" module
blanchet
parents: 39457
diff changeset
   147
2416666e6f94 refactoring: move ATP proof and error extraction code to "ATP_Proof" module
blanchet
parents: 39457
diff changeset
   148
(* Returns the part of "output" that lies after the first occurrence of
   "begin_delim" and before the following first occurrence of "end_delim",
   minus everything up to and including the first newline of that region (i.e.
   the remainder of the begin-delimiter line). Yields "" whenever one of the
   delimiters or that newline cannot be found. *)
fun extract_delimited (begin_delim, end_delim) output =
  let
    val after_begin = snd (the (first_field begin_delim output))
    val before_end = fst (the (first_field end_delim after_begin))
  in
    snd (the (first_field "\n" before_end))
  end
  handle Option.Option => ""
2416666e6f94 refactoring: move ATP proof and error extraction code to "ATP_Proof" module
blanchet
parents: 39457
diff changeset
   153
2416666e6f94 refactoring: move ATP proof and error extraction code to "ATP_Proof" module
blanchet
parents: 39457
diff changeset
   154
(* Begin and end markers of the "RequiredInformation" section that
   "extract_important_message" looks for in the prover output. *)
val tstp_important_message_delims =
  ("% SZS start RequiredInformation", "% SZS end RequiredInformation")
2416666e6f94 refactoring: move ATP proof and error extraction code to "ATP_Proof" module
blanchet
parents: 39457
diff changeset
   156
2416666e6f94 refactoring: move ATP proof and error extraction code to "ATP_Proof" module
blanchet
parents: 39457
diff changeset
   157
(* Pulls the "RequiredInformation" section out of the prover output. Blank
   lines are dropped, one leading "%" and then one leading " " are removed from
   each remaining line, and the lines are joined with "\n " and quoted. Returns
   "" if no such section is found. *)
fun extract_important_message output =
  let
    val strip_comment_marker =
      perhaps (try (unprefix " ")) o perhaps (try (unprefix "%"))
    val section = extract_delimited tstp_important_message_delims output
  in
    if section = "" then
      ""
    else
      let
        val nonblank_lines =
          filter (fn line => line <> "") (space_explode "\n" section)
      in
        quote (space_implode "\n " (map strip_comment_marker nonblank_lines))
      end
  end
2416666e6f94 refactoring: move ATP proof and error extraction code to "ATP_Proof" module
blanchet
parents: 39457
diff changeset
   164
2416666e6f94 refactoring: move ATP proof and error extraction code to "ATP_Proof" module
blanchet
parents: 39457
diff changeset
   165
(* Extracts the proof text using the first applicable delimiters from "delims".
   The begin and end delimiters are chosen independently of each other: the
   first begin delimiter occurring in the output and the first end delimiter
   occurring in the output, regardless of how they are paired in the list.
   Returns "" if either kind of delimiter is absent. *)
fun extract_tstplike_proof delims output =
  let
    val (begin_delims, end_delims) = ListPair.unzip delims
    fun occurs_in_output delim = String.isSubstring delim output
  in
    case (find_first occurs_in_output begin_delims,
          find_first occurs_in_output end_delims) of
      (SOME begin_delim, SOME end_delim) =>
      extract_delimited (begin_delim, end_delim) output
    | _ => ""
  end
2416666e6f94 refactoring: move ATP proof and error extraction code to "ATP_Proof" module
blanchet
parents: 39457
diff changeset
   172
2416666e6f94 refactoring: move ATP proof and error extraction code to "ATP_Proof" module
blanchet
parents: 39457
diff changeset
   173
(* Returns the failure of the first (failure, pattern) entry whose pattern
   occurs as a substring of the prover output, if there is one. *)
fun extract_known_failure known_failures output =
  let
    fun matches_output (_, pattern) = String.isSubstring pattern output
  in
    case find_first matches_output known_failures of
      SOME (failure, _) => SOME failure
    | NONE => NONE
  end
2416666e6f94 refactoring: move ATP proof and error extraction code to "ATP_Proof" module
blanchet
parents: 39457
diff changeset
   177
43473
fb2713b803e6 deal with ATP time slices in a more flexible/robust fashion
blanchet
parents: 43465
diff changeset
   178
(* Combines proof extraction with failure detection. In order of priority:
   - a detected ProofIncomplete failure always wins and discards the proof;
   - otherwise a nonempty extracted proof counts as success;
   - with no proof, ProofMissing is reported as success with an empty proof,
     GaveUp becomes Unprovable when "complete" is set, any other known failure
     is passed through, and an unknown situation yields UnknownError with the
     (possibly elided) output. *)
fun extract_tstplike_proof_and_outcome verbose complete proof_delims
                                       known_failures output =
  let
    val tstplike_proof = extract_tstplike_proof proof_delims output
    val known_failure = extract_known_failure known_failures output
  in
    if known_failure = SOME ProofIncomplete then
      ("", SOME ProofIncomplete)
    else if tstplike_proof <> "" then
      (tstplike_proof, NONE)
    else
      case known_failure of
        SOME ProofMissing => ("", NONE)
      | SOME GaveUp => ("", SOME (if complete then Unprovable else GaveUp))
      | SOME failure => ("", SOME failure)
      | NONE => ("", SOME (UnknownError (short_output verbose output)))
  end
39452
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   189
45551
a62c7a21f4ab removed needless baggage
blanchet
parents: 45301
diff changeset
   190
(* A step name pairs the identifier of a proof step, as read from the ATP
   output, with a (possibly empty) list of names attached to that step; see
   "parse_tstp_line" for how both components are filled in.
   NOTE(review): the attached names are presumably fact names -- confirm. *)
type step_name = string * string list
39452
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   191
42968
74415622d293 more work on parsing LEO-II proofs and extracting uses of extensionality
blanchet
parents: 42966
diff changeset
   192
(* Two step names denote the same step iff their first components (the step
   identifiers) are equal; the second components are ignored. *)
fun is_same_atp_step (ident1, _) (ident2, _) = (ident1 = ident2)
74415622d293 more work on parsing LEO-II proofs and extracting uses of extensionality
blanchet
parents: 42966
diff changeset
   193
74415622d293 more work on parsing LEO-II proofs and extracting uses of extensionality
blanchet
parents: 42966
diff changeset
   194
(* Prefix that "step_name_ord" strips from step identifiers (when present)
   before trying to read them as integers. *)
val vampire_fact_prefix = "f"
39452
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   195
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   196
(* Ordering on pairs of step names, based on their identifiers only.
   Identifiers that read as integers (after dropping an optional
   "vampire_fact_prefix") are compared numerically and come after all
   non-numeric identifiers, which are compared as strings.

   The "unprefix" part is to cope with remote Vampire's output. The proper
   solution would be to perform a topological sort, e.g. using the nice
   "Graph" functor. *)
fun step_name_ord p =
  let
    val idents as (ident1, ident2) = pairself fst p
    fun numeric_value ident =
      Int.fromString (perhaps (try (unprefix vampire_fact_prefix)) ident)
  in
    case (numeric_value ident1, numeric_value ident2) of
      (SOME i, SOME j) => int_ord (i, j)
    | (SOME _, NONE) => GREATER
    | (NONE, SOME _) => LESS
    | (NONE, NONE) => string_ord idents
  end
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   208
39453
1740a2d6bef9 use the same TSTP/Vampire/SPASS parser for one-liners as for Isar proofs
blanchet
parents: 39452
diff changeset
   209
(* A proof step over formulas of type 'a:
   - "Definition_Step (name, lhs, rhs)": a definition, split into its two
     sides;
   - "Inference_Step (name, formula, rule, dependencies)": a formula together
     with the name of the rule that produced it and the names of the steps it
     depends on. *)
datatype 'a step =
    Definition_Step of step_name * 'a * 'a
  | Inference_Step of step_name * 'a * string * step_name list
39452
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   212
43678
56d352659500 improved translation of lambdas in THF
nik
parents: 43602
diff changeset
   213
(* A proof is a list of steps over formulas whose three type parameters are
   all built from the single name type 'a. *)
type 'a proof = ('a, 'a, ('a, 'a) ho_term) formula step list
39452
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   214
47774
blanchet
parents: 47506
diff changeset
   215
(* Returns the name of a proof step, whichever kind of step it is. *)
fun step_name step =
  case step of
    Definition_Step (name, _, _) => name
  | Inference_Step (name, _, _, _) => name
39452
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   217
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   218
(**** PARSING OF TSTP FORMAT ****)
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   219
42536
a513730db7b0 unprefix evil "fof_" prefix inserted by ToFoF
blanchet
parents: 42531
diff changeset
   220
(* Scans an identifier, which is either
   - a string enclosed in single quotes (e.g., a file name), returned without
     the quotes, or
   - any number of "$" characters followed by at least one character accepted
     by "Symbol.is_letdig". *)
val scan_general_id =
  let
    val scan_quoted = $$ "'" |-- Scan.repeat (~$$ "'") --| $$ "'" >> implode
    val scan_plain =
      Scan.repeat ($$ "$") -- Scan.many1 Symbol.is_letdig
      >> (fn (dollars, letdigs) => implode (dollars @ letdigs))
  in scan_quoted || scan_plain end
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   225
45235
7187bce94e88 more robust parsing of TSTP sources -- Vampire has nonstandard "introduced()" tags and Waldmeister(OnTPTP) has weird "theory(...)" dependencies
blanchet
parents: 45209
diff changeset
   226
(* Consumes symbols up to (but not including) the first ",", ")" or "]" that
   occurs outside any parentheses or square brackets opened during the skip,
   or up to the end of the input. Returns the consumed text as a string,
   together with the remaining symbols. *)
val skip_term =
  let
    fun is_opening s = (s = "(" orelse s = "[")
    fun is_closing s = (s = ")" orelse s = "]")
    (* "depth" counts the brackets currently open; "seen" accumulates the
       consumed symbols in reverse order. *)
    fun skip _ seen [] = (seen, [])
      | skip depth seen (rest as s :: ss) =
        if depth = 0 andalso (s = "," orelse is_closing s) then (seen, rest)
        else if is_opening s then skip (depth + 1) (s :: seen) ss
        else if is_closing s then skip (depth - 1) (s :: seen) ss
        else skip depth (s :: seen) ss
  in skip 0 [] #>> (rev #> implode) end
45208
9a00f9cc8707 marginally cleaner proof parsing, that doesn't stumble upon LEO-II's E-step proofs
blanchet
parents: 45203
diff changeset
   238
9a00f9cc8707 marginally cleaner proof parsing, that doesn't stumble upon LEO-II's E-step proofs
blanchet
parents: 45203
diff changeset
   239
(* Where a formula in a TSTP line comes from:
   - "File_Source (file, name)": a "file(...)" annotation with its first
     argument and optional second argument;
   - "Inference_Source (rule, dependencies)": an "inference(...)" annotation
     with the rule name and the identifiers of the steps it depends on. *)
datatype source =
    File_Source of string * string option
  | Inference_Source of string * string list
45208
9a00f9cc8707 marginally cleaner proof parsing, that doesn't stumble upon LEO-II's E-step proofs
blanchet
parents: 45203
diff changeset
   242
45235
7187bce94e88 more robust parsing of TSTP sources -- Vampire has nonstandard "introduced()" tags and Waldmeister(OnTPTP) has weird "theory(...)" dependencies
blanchet
parents: 45209
diff changeset
   243
(* Placeholder formula (an atom with an empty name and no arguments), used by
   "parse_tstp_line" when a formula cannot be parsed and is skipped instead. *)
val dummy_phi = AAtom (ATerm ("", []))
7187bce94e88 more robust parsing of TSTP sources -- Vampire has nonstandard "introduced()" tags and Waldmeister(OnTPTP) has weird "theory(...)" dependencies
blanchet
parents: 45209
diff changeset
   244
(* Placeholder source (empty rule name, no dependencies), used when a source
   annotation is absent or is neither "file(...)" nor "inference(...)". *)
val dummy_inference = Inference_Source ("", [])
7187bce94e88 more robust parsing of TSTP sources -- Vampire has nonstandard "introduced()" tags and Waldmeister(OnTPTP) has weird "theory(...)" dependencies
blanchet
parents: 45209
diff changeset
   245
47917
b287682bf917 improve parsing of Waldmeister dependencies (and kill obsolete hack)
blanchet
parents: 47787
diff changeset
   246
(* A dependency is an identifier; whatever follows it up to the next
   top-level ",", ")" or "]" is discarded. The "skip_term" is there to cope
   with Waldmeister nonsense such as "theory(equality)". *)
val parse_dependency = scan_general_id --| skip_term

(* A nonempty, comma-separated list of dependencies. *)
val parse_dependencies =
  parse_dependency -- Scan.repeat ($$ "," |-- parse_dependency) >> (op ::)
45208
9a00f9cc8707 marginally cleaner proof parsing, that doesn't stumble upon LEO-II's E-step proofs
blanchet
parents: 45203
diff changeset
   251
9a00f9cc8707 marginally cleaner proof parsing, that doesn't stumble upon LEO-II's E-step proofs
blanchet
parents: 45203
diff changeset
   252
(* Parses the source annotation of a TSTP line:
   - "file(<id>)" or "file(<id>,<id>)" yields a "File_Source";
   - "inference(<rule>..., ..., [<dependencies>])" yields an
     "Inference_Source" with the rule name and the dependency identifiers (the
     rest of the first argument and the whole second argument are skipped);
   - anything else is skipped and yields "dummy_inference". *)
fun parse_source x =
  let
    val parse_file_source =
      Scan.this_string "file" |-- $$ "(" |-- scan_general_id
      -- Scan.option ($$ "," |-- scan_general_id) --| $$ ")"
      >> File_Source
    val parse_inference_source =
      Scan.this_string "inference" |-- $$ "(" |-- scan_general_id
      --| skip_term --| $$ "," --| skip_term --| $$ "," --| $$ "["
      -- parse_dependencies --| $$ "]" --| $$ ")"
      >> Inference_Source
    val parse_other_source = skip_term >> K dummy_inference
  in
    (parse_file_source || parse_inference_source || parse_other_source) x
  end
39452
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   261
42966
4e2d6c1e5392 more work on parsing LEO-II proofs without lambdas
blanchet
parents: 42965
diff changeset
   262
(* Applies "f" to "args" one argument at a time, from left to right, building
   nested binary "tptp_app" terms: app (app (f, arg1), arg2), etc. *)
fun list_app (f, []) = f
  | list_app (f, arg :: args) = list_app (ATerm (tptp_app, [f, arg]), args)
42966
4e2d6c1e5392 more work on parsing LEO-II proofs without lambdas
blanchet
parents: 42965
diff changeset
   264
45881
3be79bdcc702 fixed parsing of TPTP atoms
blanchet
parents: 45551
diff changeset
   265
(* Term parsers. We currently ignore TFF and THF types: "parse_type_stuff"
   parses any type annotations and the parsers below drop its result. *)

(* Any number of arguments, each introduced by "tptp_has_type" or
   "tptp_fun_type". *)
fun parse_type_stuff x =
  let val parse_type_sep = $$ tptp_has_type || $$ tptp_fun_type in
    Scan.repeat (parse_type_sep |-- parse_arg) x
  end
(* Either a parenthesized term or an identifier optionally followed by a
   parenthesized, comma-separated argument list; in both cases trailing type
   annotations are discarded. *)
and parse_arg x =
  let
    val parse_parenthesized =
      $$ "(" |-- parse_term --| $$ ")" --| parse_type_stuff
    val parse_application =
      scan_general_id --| parse_type_stuff
      -- Scan.optional ($$ "(" |-- parse_terms --| $$ ")") []
      >> ATerm
  in (parse_parenthesized || parse_application) x end
(* One argument followed by any number of "tptp_app"-separated arguments,
   combined using "list_app". *)
and parse_term x =
  (parse_arg -- Scan.repeat ($$ tptp_app |-- parse_arg) >> list_app) x
(* A nonempty, comma-separated list of terms. *)
and parse_terms x =
  (parse_term -- Scan.repeat ($$ "," |-- parse_term) >> (op ::)) x
39452
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   277
39598
57413334669d make SML/NJ happier
blanchet
parents: 39491
diff changeset
   278
(* Parses an atom: a term, optionally followed by "tptp_equal" (itself
   optionally preceded by "tptp_not_infix") and a second term. The equational
   forms are represented as an "equal" atom over both terms, negated if
   "tptp_not_infix" was present. *)
fun parse_atom x =
  let
    val parse_equality_rhs =
      Scan.option ($$ tptp_not_infix) --| $$ tptp_equal -- parse_term
    fun mk_atom (lhs, NONE) = AAtom lhs
      | mk_atom (lhs, SOME (neg, rhs)) =
        let val eq = AAtom (ATerm ("equal", [lhs, rhs])) in
          if is_some neg then mk_anot eq else eq
        end
  in (parse_term -- Scan.option parse_equality_rhs >> mk_atom) x end
39452
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   284
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   285
(* Formula parsers. TPTP formulas are fully parenthesized, so we don't need to
   worry about operator precedence. *)

(* Any number of "tptp_not" signs followed by a parenthesized formula, a
   quantified formula, or an atom. Only the parity of the negation count
   matters: the result is negated iff the count is odd. *)
fun parse_literal x =
  let
    val count_negations = Scan.repeat ($$ tptp_not) >> length
    val parse_body =
      $$ "(" |-- parse_formula --| $$ ")"
      || parse_quantified_formula
      || parse_atom
    fun negate_if_odd (n, phi) = if n mod 2 = 1 then mk_anot phi else phi
  in (count_negations -- parse_body >> negate_if_odd) x end
(* A literal, optionally followed by a binary connective and another formula
   (so chains of connectives nest to the right). *)
and parse_formula x =
  let
    (* NOTE(review): the order of the alternatives is kept as is; presumably
       it matters if one connective is a prefix of another -- confirm. *)
    val parse_connective =
      Scan.this_string tptp_implies
      || Scan.this_string tptp_iff
      || Scan.this_string tptp_not_iff
      || Scan.this_string tptp_if
      || $$ tptp_or
      || $$ tptp_and
    fun combine (lhs, NONE) = lhs
      | combine (lhs, SOME (conn, rhs)) =
        if conn = tptp_implies then mk_aconn AImplies lhs rhs
        else if conn = tptp_iff then mk_aconn AIff lhs rhs
        else if conn = tptp_not_iff then mk_anot (mk_aconn AIff lhs rhs)
        (* reverse implication: the operands are swapped *)
        else if conn = tptp_if then mk_aconn AImplies rhs lhs
        else if conn = tptp_or then mk_aconn AOr lhs rhs
        else if conn = tptp_and then mk_aconn AAnd lhs rhs
        else raise Fail ("impossible connective " ^ quote conn)
  in
    (parse_literal -- Scan.option (parse_connective -- parse_formula)
     >> combine) x
  end
(* A quantifier, a bracketed list of bound variables, a colon, and a literal
   as body. *)
and parse_quantified_formula x =
  let
    val parse_quantifier =
      $$ tptp_forall >> K AForall || $$ tptp_exists >> K AExists
    (* We ignore TFF and THF types for now: only the variable names are kept,
       each paired with NONE. *)
    fun mk_quant ((q, vars), body) =
      AQuant (q, map (fn ATerm (s, _) => (s, NONE)) vars, body)
  in
    (parse_quantifier --| $$ "[" -- parse_terms --| $$ "]" --| $$ ":"
     -- parse_literal
     >> mk_quant) x
  end
39452
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   316
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   317
(* Parses the optional annotations that follow the formula in a TSTP line: a
   comma and a source, optionally followed by a comma and one more term, which
   is skipped. Yields "dummy_inference" if there are no annotations. *)
val parse_tstp_extra_arguments =
  let
    val parse_trailing_term = Scan.option ($$ "," |-- skip_term)
    val parse_annotations = $$ "," |-- parse_source --| parse_trailing_term
  in Scan.optional parse_annotations dummy_inference end
39452
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   320
42943
62a14c80d194 fish out axioms in Waldmeister output
blanchet
parents: 42882
diff changeset
   321
(* Name in a "file(...)" source that makes "parse_tstp_line" look up the
   negation of the line's formula in the problem. *)
val waldmeister_conjecture = "conjecture_1"
62a14c80d194 fish out axioms in Waldmeister output
blanchet
parents: 42882
diff changeset
   322
42536
a513730db7b0 unprefix evil "fof_" prefix inserted by ToFoF
blanchet
parents: 42531
diff changeset
   323
(* Prefix that "parse_tstp_line" strips, when present, from the name given in
   a "file(...)" source. *)
val tofof_fact_prefix = "fof_"
41203
1393514094d7 fixed more issues with the Vampire output parser, and added support for Vampire's TSTP output (--proof tptp)
blanchet
parents: 41201
diff changeset
   324
42943
62a14c80d194 fish out axioms in Waldmeister output
blanchet
parents: 42882
diff changeset
   325
(* Checks whether "tm1" and "tm2" are equal up to a one-to-one renaming of
   variables that extends "subst", an association list from variable names of
   "tm1" to variable names of "tm2". A variable only matches a variable, and a
   non-variable only matches a non-variable with the same name and the same
   number of (pairwise matching) arguments. *)
fun is_same_term subst tm1 tm2 =
  let
    (* Threads the renaming through the term pair; NONE means that an earlier
       comparison has already failed. *)
    fun match_pair _ NONE = NONE
      | match_pair (ATerm (s1, args1), ATerm (s2, args2)) (SOME bindings) =
        let
          val var1 = is_tptp_variable s1
          val var2 = is_tptp_variable s2
        in
          if var1 andalso var2 then
            (case AList.lookup (op =) bindings s1 of
               SOME s2' => if s2' = s2 then SOME bindings else NONE
             | NONE =>
               (* "s1" is unbound: bind it to "s2" unless some other variable
                  is already mapped to "s2". *)
               if null (AList.find (op =) bindings s2) then
                 SOME ((s1, s2) :: bindings)
               else
                 NONE)
          else if var1 orelse var2 then
            NONE
          else if s1 = s2 andalso length args1 = length args2 then
            fold match_pair (args1 ~~ args2) (SOME bindings)
          else
            NONE
        end
  in is_some (match_pair (tm1, tm2) (SOME subst)) end
62a14c80d194 fish out axioms in Waldmeister output
blanchet
parents: 42882
diff changeset
   343
62a14c80d194 fish out axioms in Waldmeister output
blanchet
parents: 42882
diff changeset
   344
(* Checks whether two formulas have the same structure, comparing atoms with
   "is_same_term" under the variable renaming "subst":
   - quantified formulas must have the same quantifier and the same number of
     bound variables, which are paired up positionally and added to "subst";
   - connectives must agree and have pairwise matching operands;
   - an "equal" atom with two arguments on the left may match the right atom
     with its arguments in either order;
   - formulas of different kinds never match. *)
fun is_same_formula subst phi1 phi2 =
  case (phi1, phi2) of
    (AQuant (q1, xs1, body1), AQuant (q2, xs2, body2)) =>
    if q1 = q2 andalso length xs1 = length xs2 then
      is_same_formula ((map fst xs1 ~~ map fst xs2) @ subst) body1 body2
    else
      false
  | (AConn (c1, phis1), AConn (c2, phis2)) =>
    if c1 = c2 andalso length phis1 = length phis2 then
      forall (fn (psi1, psi2) => is_same_formula subst psi1 psi2)
             (phis1 ~~ phis2)
    else
      false
  | (AAtom (ATerm ("equal", [tm11, tm12])), AAtom tm2) =>
    exists (fn args => is_same_term subst (ATerm ("equal", args)) tm2)
           [[tm11, tm12], [tm12, tm11]]
  | (AAtom tm1, AAtom tm2) => is_same_term subst tm1 tm2
  | _ => false
62a14c80d194 fish out axioms in Waldmeister output
blanchet
parents: 42882
diff changeset
   355
62a14c80d194 fish out axioms in Waldmeister output
blanchet
parents: 42882
diff changeset
   356
(* Returns the identifier of a problem line if the line is a "Formula" whose
   formula matches "phi" (according to "is_same_formula" with an empty
   renaming), and NONE otherwise. *)
fun matching_formula_line_identifier phi line =
  case line of
    Formula (ident, _, phi', _, _) =>
    if is_same_formula [] phi phi' then SOME ident else NONE
  | _ => NONE
62a14c80d194 fish out axioms in Waldmeister output
blanchet
parents: 42882
diff changeset
   359
62a14c80d194 fish out axioms in Waldmeister output
blanchet
parents: 42882
diff changeset
   360
(* Looks for "phi" among all the lines of "problem" (a list of pairs whose
   second components are lists of lines). Returns a singleton list with the
   identifier of the first matching line, or the empty list if no line
   matches. *)
fun find_formula_in_problem problem phi =
  case map_filter (matching_formula_line_identifier phi) (maps snd problem) of
    [] => []
  | ident :: _ => [ident]
42943
62a14c80d194 fish out axioms in Waldmeister output
blanchet
parents: 42882
diff changeset
   363
42962
3b50fdeb6cfc started adding support for THF output (but no lambdas)
blanchet
parents: 42961
diff changeset
   364
(* Syntax: (cnf|fof|tff|thf)\(<name>, <formula_role>,
            <formula> <extra_arguments>\).
   The <name> is read with "scan_general_id", so it need not be a number. A
   <formula> that cannot be parsed is skipped and replaced by "dummy_phi".

   The result is a "Definition_Step" if the role is "definition" and the
   formula is an equivalence whose left-hand side is an atom; otherwise it is
   an "Inference_Step". "problem" is used to recover the names of formulas
   that the prover refers to only through a "file(...)" source. *)
fun parse_tstp_line problem =
  let
    val parse_language =
      Scan.this_string tptp_cnf || Scan.this_string tptp_fof
      || Scan.this_string tptp_tff || Scan.this_string tptp_thf
    fun mk_line (((num, role), phi), source) =
      let
        val (name, rule, deps) =
          (* Waldmeister isn't exactly helping. *)
          case source of
            File_Source (_, SOME s) =>
            let
              val names =
                if s = waldmeister_conjecture then
                  find_formula_in_problem problem (mk_anot phi)
                else
                  [perhaps (try (unprefix tofof_fact_prefix)) s]
            in ((num, names), "", []) end
          | File_Source _ =>
            ((num, find_formula_in_problem problem phi), "", [])
          | Inference_Source (rule, deps) => ((num, []), rule, deps)
        fun mk_step () =
          Inference_Step (name, phi, rule, map (rpair []) deps)
      in
        case (role, phi) of
          ("definition", AConn (AIff, [phi1 as AAtom _, phi2])) =>
          Definition_Step (name, phi1, phi2)
        | ("definition", AAtom (ATerm ("equal", _))) =>
          (* Vampire's equality proxy axiom *)
          mk_step ()
        | _ => mk_step ()
      end
  in
    (parse_language -- $$ "(")
      |-- scan_general_id --| $$ "," -- Symbol.scan_id --| $$ ","
      -- (parse_formula || skip_term >> K dummy_phi)
      -- parse_tstp_extra_arguments
      --| $$ ")" --| $$ "."
    >> mk_line
  end
39452
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   402
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   403
(**** PARSING OF SPASS OUTPUT ****)
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   404
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   405
(* SPASS refers to clauses by names of the form "x.y". Only the "x" part is
   returned; the "." and the "y" part are consumed and thrown away, since the
   purpose of "y" is not clear. *)
fun parse_dot_name x = (scan_general_id --| $$ "." --| scan_general_id) x
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   408
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   409
(* Parses the part of a SPASS clause header that follows the inference name:
   a ":" and then any number of "x.y" clause references, each optionally
   followed by a comma. Falls back to [] if that ":"-prefixed list does not
   parse. *)
val parse_spass_annotations =
  let
    val parse_ref = parse_dot_name --| Scan.option ($$ ",")
    val parse_refs = $$ ":" |-- Scan.repeat parse_ref
  in Scan.optional parse_refs [] end
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   412
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   413
(* Some literals in SPASS output are followed by runs of stars, pluses and
   blanks. Their meaning is not clear, so they are consumed and ignored; only
   the atom itself is returned. *)
fun parse_decorated_atom x =
  let fun skip_decoration y = Scan.repeat ($$ "*" || $$ "+" || $$ " ") y
  in (parse_atom --| skip_decoration) x end
39452
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   417
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   418
(* Builds a formula from a pair (negative literals, positive literals):
     - both empty:       the atom "c_False";
     - only positive:    their disjunction;
     - only negative:    the negation of their conjunction;
     - both nonempty:    conjunction of negatives implies disjunction of
                         positives. *)
fun mk_horn (neg_lits, pos_lits) =
  let
    fun conj lits = foldr1 (uncurry (mk_aconn AAnd)) lits
    fun disj lits = foldr1 (uncurry (mk_aconn AOr)) lits
  in
    case (neg_lits, pos_lits) of
      ([], []) => AAtom (ATerm ("c_False", []))
    | ([], _) => disj pos_lits
    | (_, []) => mk_anot (conj neg_lits)
    | _ => mk_aconn AImplies (conj neg_lits) (disj pos_lits)
  end
39452
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   424
39645
6eb38a00ae47 make SML/NJ happy
blanchet
parents: 39602
diff changeset
   425
(* Parses "<atoms> || <atoms> -> <atoms>". The two atom lists in front of the
   arrow are concatenated and handed to "mk_horn" as the negative literals;
   the list after the arrow is handed over as the positive literals. *)
fun parse_horn_clause x =
  let
    fun atoms y = Scan.repeat parse_decorated_atom y
    fun horn_of ((lits1, lits2), pos_lits) = mk_horn (lits1 @ lits2, pos_lits)
  in
    (atoms --| $$ "|" --| $$ "|" -- atoms --| $$ "-" --| $$ ">" -- atoms
     >> horn_of) x
  end
39452
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   430
46427
4fd25dadbd94 cleaned up new SPASS parsing
blanchet
parents: 46390
diff changeset
   431
(* Determines the names associated with the SPASS clause number "num".
   If names are supplied explicitly (SOME names), they are returned as is.
   Otherwise "num" is read as a 1-based index into the vector "spass_names";
   a non-numeric or out-of-range "num" yields []. *)
fun resolve_spass_num (SOME names) _ _ = names
  | resolve_spass_num NONE spass_names num =
    (case Int.fromString num of
       NONE => []
     | SOME j =>
       if j < 1 orelse j > Vector.length spass_names then []
       else Vector.sub (spass_names, j - 1))
43481
51857e7fa64b clean up SPASS FLOTTER hack
blanchet
parents: 43473
diff changeset
   439
46390
6467c99c4872 don't stumble on SPASS debug output
blanchet
parents: 45881
diff changeset
   440
(* Optionally parses a parenthesized list of identifiers, each optionally
   followed by a comma. It is used to skip over such a prefix in front of a
   SPASS proof line. *)
val parse_spass_debug =
  let
    val parse_item = scan_general_id --| Scan.option ($$ ",")
    val parse_items = $$ "(" |-- Scan.repeat parse_item --| $$ ")"
  in Scan.option parse_items end
6467c99c4872 don't stumble on SPASS debug output
blanchet
parents: 45881
diff changeset
   443
46427
4fd25dadbd94 cleaned up new SPASS parsing
blanchet
parents: 46390
diff changeset
   444
(* Syntax: <num>[0:<inference><annotations>] <atoms> || <atoms> -> <atoms>.
           derived from formulae <ident>*

   The result is an "Inference_Step" whose name pairs the clause number with
   the names resolved for it (those listed after "derived from formulae" if
   present, otherwise those looked up in "spass_names"). Each dependency is
   paired with the names looked up for it in "spass_names". *)
fun parse_spass_line spass_names =
  let
    val lookup = resolve_spass_num NONE spass_names
    fun parse_origin x =
      Scan.option (Scan.this_string "derived from formulae "
                   |-- Scan.repeat (scan_general_id --| Scan.option ($$ " "))) x
    fun mk_step ((((num, rule), deps), u), names) =
      Inference_Step ((num, resolve_spass_num names spass_names num), u, rule,
                      map (fn dep => (dep, lookup dep)) deps)
  in
    parse_spass_debug |-- scan_general_id --| $$ "[" --| $$ "0" --| $$ ":"
      -- Symbol.scan_id -- parse_spass_annotations --| $$ "]"
      -- parse_horn_clause --| $$ "."
      -- parse_origin
    >> mk_step
  end
45162
170dffc6df75 parse Satallax unsat cores
blanchet
parents: 44915
diff changeset
   455
170dffc6df75 parse Satallax unsat cores
blanchet
parents: 44915
diff changeset
   456
(* Syntax: <name>

   A line consists of a single identifier, optionally followed by a blank. It
   becomes an "Inference_Step" named after the identifier, with "dummy_phi" as
   its formula, an empty rule name and no dependencies. *)
fun parse_satallax_line x =
  let fun mk_name_step s = Inference_Step ((s, [s]), dummy_phi, "", [])
  in (scan_general_id --| Scan.option ($$ " ") >> mk_name_step) x end
43481
51857e7fa64b clean up SPASS FLOTTER hack
blanchet
parents: 43473
diff changeset
   460
51857e7fa64b clean up SPASS FLOTTER hack
blanchet
parents: 43473
diff changeset
   461
(* Parses one proof line, trying the TSTP format first, then the SPASS format,
   and finally the Satallax format. *)
fun parse_line problem spass_names =
  let
    val tstp_line = parse_tstp_line problem
    val spass_line = parse_spass_line spass_names
  in tstp_line || spass_line || parse_satallax_line end
43481
51857e7fa64b clean up SPASS FLOTTER hack
blanchet
parents: 43473
diff changeset
   463
(* Parses the proof text "tstp" into a list of steps. Spaces are stripped
   (except between identifiers), the text is exploded into symbols, and one or
   more lines are parsed with "parse_line". A parse failure is reported by
   raising UNRECOGNIZED_ATP_PROOF. *)
fun parse_proof problem spass_names tstp =
  let
    val symbols = raw_explode (strip_spaces_except_between_idents tstp)
    val parse_lines = Scan.repeat1 (parse_line problem spass_names)
    val parse_all =
      Scan.error (!! (fn _ => raise UNRECOGNIZED_ATP_PROOF ()) parse_lines)
    val (steps, _) = Scan.finite Symbol.stopper parse_all symbols
  in steps end
51857e7fa64b clean up SPASS FLOTTER hack
blanchet
parents: 43473
diff changeset
   470
51857e7fa64b clean up SPASS FLOTTER hack
blanchet
parents: 43473
diff changeset
   471
(** SPASS's FLOTTER hack **)
51857e7fa64b clean up SPASS FLOTTER hack
blanchet
parents: 43473
diff changeset
   472
51857e7fa64b clean up SPASS FLOTTER hack
blanchet
parents: 43473
diff changeset
   473
(* This is a hack required for keeping track of facts after they have been
51857e7fa64b clean up SPASS FLOTTER hack
blanchet
parents: 43473
diff changeset
   474
   clausified by SPASS's FLOTTER preprocessor. The "ATP/scripts/spass" script is
51857e7fa64b clean up SPASS FLOTTER hack
blanchet
parents: 43473
diff changeset
   475
   also part of this hack. *)
51857e7fa64b clean up SPASS FLOTTER hack
blanchet
parents: 43473
diff changeset
   476
51857e7fa64b clean up SPASS FLOTTER hack
blanchet
parents: 43473
diff changeset
   477
(* Keyword that introduces the clause/formula relation in the prover output.
   It is used both to detect whether the relation is present and to locate and
   parse it. *)
val set_ClauseFormulaRelationN = "set_ClauseFormulaRelation"
51857e7fa64b clean up SPASS FLOTTER hack
blanchet
parents: 43473
diff changeset
   478
51857e7fa64b clean up SPASS FLOTTER hack
blanchet
parents: 43473
diff changeset
   479
(* Collects clause numbers from "output", line by line. Each line is split
   into maximal alphanumeric tokens; if the first token is "clause" and at
   least one more token follows, the last token is read as an integer. Lines
   that do not match, or whose last token is not a number, contribute
   nothing. *)
fun extract_clause_sequence output =
  let
    fun is_separator c = not (Char.isAlphaNum c)
    fun clause_num line =
      case String.tokens is_separator line of
        "clause" :: (rest as _ :: _) => Int.fromString (List.last rest)
      | _ => NONE
  in map_filter clause_num (split_lines output) end
39452
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   485
43481
51857e7fa64b clean up SPASS FLOTTER hack
blanchet
parents: 43473
diff changeset
   486
(* Tests whether the first character of "s" is a decimal digit. Raises
   Subscript if "s" is empty. *)
fun is_head_digit s =
  let val first = String.sub (s, 0)
  in Char.isDigit first end
51857e7fa64b clean up SPASS FLOTTER hack
blanchet
parents: 43473
diff changeset
   487
(* Scans one or more symbols that start with a digit and converts their
   concatenation to an integer. *)
val scan_integer =
  Scan.many1 is_head_digit
  >> (fn digits => the (Int.fromString (implode digits)))
51857e7fa64b clean up SPASS FLOTTER hack
blanchet
parents: 43473
diff changeset
   488
51857e7fa64b clean up SPASS FLOTTER hack
blanchet
parents: 43473
diff changeset
   489
(* Parses one entry "(<integer>,<id>,...,<id>)" of the clause/formula relation,
   optionally followed by a comma, into a pair of the integer and the nonempty
   list of identifiers. *)
val parse_clause_formula_pair =
  let
    val parse_names =
      Symbol.scan_id ::: Scan.repeat ($$ "," |-- Symbol.scan_id)
  in
    $$ "(" |-- scan_integer --| $$ "," -- parse_names --| $$ ")"
    --| Scan.option ($$ ",")
  end
51857e7fa64b clean up SPASS FLOTTER hack
blanchet
parents: 43473
diff changeset
   493
(* Parses the relation keyword, an opening parenthesis and then any number of
   clause/formula pairs; only the list of pairs is returned. *)
val parse_clause_formula_relation =
  let val parse_header = Scan.this_string set_ClauseFormulaRelationN |-- $$ "("
  in parse_header |-- Scan.repeat parse_clause_formula_pair end
51857e7fa64b clean up SPASS FLOTTER hack
blanchet
parents: 43473
diff changeset
   496
(* Extracts the clause/formula relation from the prover output: the text from
   the first occurrence of the relation keyword up to (but excluding) the next
   "." is exploded into symbols, blanks are removed, and the remainder is
   parsed with "parse_clause_formula_relation". *)
fun extract_clause_formula_relation output =
  let
    val (_, from_keyword) =
      Substring.position set_ClauseFormulaRelationN (Substring.full output)
    val (relation_text, _) = Substring.position "." from_keyword
    val symbols =
      filter_out Symbol.is_blank (raw_explode (Substring.string relation_text))
    val (name_map, _) = parse_clause_formula_relation symbols
  in name_map end
39452
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   501
43481
51857e7fa64b clean up SPASS FLOTTER hack
blanchet
parents: 43473
diff changeset
   502
(* Builds the vector of name lists used to resolve SPASS clause numbers. If the
   output does not contain the relation keyword, the vector is empty.
   Otherwise each clause number found by "extract_clause_sequence" is looked
   up in the parsed clause/formula relation; numbers without an entry map
   to []. *)
fun extract_spass_name_vector output =
  if not (String.isSubstring set_ClauseFormulaRelationN output) then
    Vector.fromList []
  else
    let
      val clause_nums = extract_clause_sequence output
      val name_map = extract_clause_formula_relation output
      fun names_of num = these (AList.lookup (op =) name_map num)
    in Vector.fromList (map names_of clause_nums) end
51857e7fa64b clean up SPASS FLOTTER hack
blanchet
parents: 43473
diff changeset
   512
51857e7fa64b clean up SPASS FLOTTER hack
blanchet
parents: 43473
diff changeset
   513
(* Turns the textual proof "tstp" into a list of proof steps sorted by step
   name. An empty proof text yields the empty proof. "output" is only used to
   recover the SPASS name vector. *)
fun atp_proof_from_tstplike_proof problem output tstp =
  if tstp = "" then
    []
  else
    let
      (* the $ sign acts as a sentinel (FIXME: needed?) *)
      val padded = tstp ^ "$"
      val spass_names = extract_spass_name_vector output
      val steps = parse_proof problem spass_names padded
    in sort (step_name_ord o pairself step_name) steps end
42968
74415622d293 more work on parsing LEO-II proofs and extracting uses of extensionality
blanchet
parents: 42966
diff changeset
   518
74415622d293 more work on parsing LEO-II proofs and extracting uses of extensionality
blanchet
parents: 42966
diff changeset
   519
(* Walks through the proof steps in order, keeping in "seen" the names of the
   steps already visited. Definition steps are kept unchanged. For inference
   steps, every dependency is replaced by the matching name from "seen"
   (according to "is_same_atp_step"); dependencies with no match are
   dropped. *)
fun clean_up_dependencies _ [] = []
  | clean_up_dependencies seen (step :: steps) =
    let
      fun known dep = find_first (is_same_atp_step dep) seen
      val (name, step') =
        case step of
          Definition_Step (name, _, _) => (name, step)
        | Inference_Step (name, u, rule, deps) =>
          (name, Inference_Step (name, u, rule, map_filter known deps))
    in step' :: clean_up_dependencies (name :: seen) steps end
74415622d293 more work on parsing LEO-II proofs and extracting uses of extensionality
blanchet
parents: 42966
diff changeset
   527
42975
284f9a7af1c9 eta-expand to make SML/NJ happy
blanchet
parents: 42973
diff changeset
   528
(* Cleans up the dependencies of all steps in "proof", starting with no step
   seen so far. The explicit "proof" argument (eta-expansion) is deliberate: it
   keeps SML/NJ happy. *)
fun clean_up_atp_proof_dependencies proof = clean_up_dependencies [] proof
39452
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   529
39454
acb25e9cf6fb factor out the inverse of "nice_atp_problem"
blanchet
parents: 39453
diff changeset
   530
(* Applies "f" to the head name of an "ATerm" and, recursively, to the names
   in all of its arguments. *)
fun map_term_names_in_term f =
  let fun rename (ATerm (s, ts)) = ATerm (f s, map rename ts)
  in rename end
acb25e9cf6fb factor out the inverse of "nice_atp_problem"
blanchet
parents: 39453
diff changeset
   532
(* Applies "f" to every term name occurring in a formula. Quantifiers and
   connectives are traversed structurally and left unchanged; only the terms
   inside atoms are rewritten. *)
fun map_term_names_in_formula f phi =
  case phi of
    AAtom t => AAtom (map_term_names_in_term f t)
  | AConn (c, phis) => AConn (c, map (map_term_names_in_formula f) phis)
  | AQuant (q, xs, phi') => AQuant (q, xs, map_term_names_in_formula f phi')
47774
blanchet
parents: 47506
diff changeset
   537
(* Applies "f" to every term name in the formulas of a proof step. The step
   name, the rule and the dependencies are left untouched. *)
fun map_term_names_in_step f step =
  let fun rename phi = map_term_names_in_formula f phi in
    case step of
      Definition_Step (name, phi1, phi2) =>
      Definition_Step (name, rename phi1, rename phi2)
    | Inference_Step (name, phi, rule, deps) =>
      Inference_Step (name, rename phi, rule, deps)
  end
39454
acb25e9cf6fb factor out the inverse of "nice_atp_problem"
blanchet
parents: 39453
diff changeset
   542
(* Applies "f" to every term name in every step of a proof. *)
fun map_term_names_in_atp_proof f proof =
  map (map_term_names_in_step f) proof
acb25e9cf6fb factor out the inverse of "nice_atp_problem"
blanchet
parents: 39453
diff changeset
   543
acb25e9cf6fb factor out the inverse of "nice_atp_problem"
blanchet
parents: 39453
diff changeset
   544
(* Looks up "s" in the symbol table "pool"; returns the associated name if
   there is one and "s" itself otherwise. *)
fun nasty_name pool s =
  case Symtab.lookup pool s of
    SOME s' => s'
  | NONE => s
acb25e9cf6fb factor out the inverse of "nice_atp_problem"
blanchet
parents: 39453
diff changeset
   545
(* Renames all term names in a proof according to "pool" (see "nasty_name").
   With an empty pool the proof is returned unchanged without being
   traversed. *)
fun nasty_atp_proof pool proof =
  if Symtab.is_empty pool then proof
  else map_term_names_in_atp_proof (nasty_name pool) proof
acb25e9cf6fb factor out the inverse of "nice_atp_problem"
blanchet
parents: 39453
diff changeset
   548
39452
70a57e40f795 factored out TSTP/SPASS/Vampire proof parsing;
blanchet
parents:
diff changeset
   549
end;