#
# $Id$
# Author: David von Oheimb, TU Muenchen
# License: GPL (GNU GENERAL PUBLIC LICENSE)
#
# convert.pl - convert legacy tactic scripts to Isabelle/Isar tactic
# emulation using heuristics - leaves unrecognized patterns unchanged
# produces from each input file (on the command line) a new file with
# ".thy" appended and renames the original input file by appending "~0~"
# thmlist(LIST) - turn an ML theorem list into a blank-separated one.
# A pair of square brackets enclosing the whole argument is dropped and
# every comma (together with the blanks following it) becomes one blank.
sub thmlist {
    my ($list) = @_;
    $list =~ s/^\[(.*)\]$/$1/sg;    # strip the enclosing [ ... ]
    $list =~ s/, +/ /g;             # comma followed by blanks -> one blank
    $list =~ tr/,/ /;               # any remaining bare comma -> blank
    return $list;
}
# subst_RS() - rewrite ML "thm RS thm" compositions found in $_ into
# "[THEN thm]" attribute notation.  Works in place on the global $_;
# takes no arguments.
sub subst_RS {
    # RS followed by a plain theorem name
    s{ RS ([\w\'\.]+)}{ [THEN $1]}g;
    # RS followed by a parenthesised expression
    s{ RS \((.+?)\)}{ [THEN $1]}g;
    # drop parentheses around a single "name [THEN name]"
    s{\(([\w\'\.]+ \[THEN [\w\'\.]+\])\)}{$1}g;
    # merge adjacent attribute lists: "] [THEN " becomes ", THEN "
    s{\] \[THEN }{, THEN }g;
    # "THEN sym" is written as the attribute "symmetric"
    s{THEN sym\b}{symmetric}g;
}
# subst_RS_standard(EXPR) - normalise the whitespace of EXPR, convert its
# RS compositions via subst_RS() and append ", standard" inside a closing
# square bracket at the end of the text.  Returns the converted text.
# Note: the global $_ is used as the work buffer and is left modified.
sub subst_RS_standard {
    ($_) = @_;
    s/\s+/ /sg;                 # remove multiple whitespace
    s/\s/ /sg;                  # substitute all remaining tabs and newlines by space
    subst_RS();
    s/\]\s*$/, standard]/g;     # extend the trailing attribute list
    return $_;
}
# decl(THMS, ATTR) - build a "declare" command that attaches attribute
# ATTR to every theorem of the comma-separated list THMS.  RS compositions
# are converted by subst_RS() first.  Returns the command text.
# Note: the global $_ is used as the work buffer and is left modified.
sub decl {
    my ($thms, $attr) = @_;
    $_ = $thms;
    subst_RS();
    s/, */ [$attr] /g;      # attribute after every theorem but the last
    s/$/ [$attr]/;          # ... and after the last one
    s/\] *\[/, /g;          # merge with attribute lists produced by subst_RS
    return "declare " . $_;
}
# process_tac(LEAD, TAC) - translate one legacy ML tactic expression into
# an Isar "apply" command.
#
#   LEAD  the text that followed "by" in the input (whitespace and possibly
#         an opening parenthesis); it is re-emitted right after "apply"
#   TAC   the tactic expression itself
#
# Returns  $prefer . "apply" . LEAD . <converted tactic>
#
# Side effects: uses the global $_ as work buffer, resets the global
# $prefer and sets it to "prefer N " when a leading tactic addresses
# subgoal N, and sets the global $goal while expanding EVERY'.
# Patterns that are not recognised are left unchanged.
#
# The order of the substitutions matters: the whitespace normalisation at
# the top puts a blank before every "(" and after every ")", so all later
# patterns have to expect "claset ()" / "simpset ()" with that blank.
sub process_tac {
  $prefer = "";
  my $lead = shift;
  my $t = shift;
  # auto/force/clarsimp take simplifier modifiers as "simp add:"/"simp del:"
  my $simpmodmod = ($t =~ m/auto_tac|force_tac|clarsimp_tac/) ? "simp " : "";
  $_ = $t;

  # --- whitespace normalisation ---
  s/\s+/ /sg;              # remove multiple whitespace
  s/\s/ /sg;               # substitute all remaining tabs and newlines by space
  s/\( /\(/g; s/ \)/\)/g;  # remove leading and trailing space inside parentheses
  s/\[ /\[/g; s/ \]/\]/g;  # remove leading and trailing space inside sq brackets
  s/ ?\( ?\)/\(\)/g;       # remove space before and inside empty tuples
  s/([^ ])\(/$1 \(/g;      # possibly add space before opening parentheses
  s/\)([^ ])/\) $1/g;      # possibly add space after closing parentheses

  # --- tacticals over lists ---
  s/EVERY *\[(.*?)\]/$1/;
  if(s/EVERY\' ?\[(.*?)\] *(\d+)/$1 $2/) {
    $goal = $2;
    s/,/ $goal,/g;         # give every list member the common goal number
  }

  # --- classical reasoner, implicit claset ---
  s/Blast_tac 1/blast/g;
  s/^Blast_tac (\d+)/{$prefer="prefer $1 "; "blast"}/e;
  s/Fast_tac 1/fast/g;
  s/^Fast_tac (\d+)/{$prefer="prefer $1 "; "fast"}/e;
  s/Slow_tac 1/slow/g;
  s/^Slow_tac (\d+)/{$prefer="prefer $1 "; "slow"}/e;
  s/Best_tac 1/best/g;
  s/^Best_tac (\d+)/{$prefer="prefer $1 "; "best"}/e;
  s/Safe_tac/safe/g;
  s/Clarify_tac 1/clarify/g;

  # --- classical reasoner, explicit claset ---
  # The patterns expect "claset ()" with a blank, because the
  # normalisation above has inserted one before every "(".
  s/blast_tac \(claset \(\) (.*?)\) 1/blast $1/g;
  s/^blast_tac \(claset \(\) (.*?)\) (\d+)/{$prefer="prefer $2 "; "blast $1"}/e;
  s/fast_tac \(claset \(\) (.*?)\) 1/fast $1/g;
  s/^fast_tac \(claset \(\) (.*?)\) (\d+)/{$prefer="prefer $2 "; "fast $1"}/e;
  s/slow_tac \(claset \(\) (.*?)\) 1/slow $1/g;
  s/^slow_tac \(claset \(\) (.*?)\) (\d+)/{$prefer="prefer $2 "; "slow $1"}/e;
  s/best_tac \(claset \(\) (.*?)\) 1/best $1/g;
  s/^best_tac \(claset \(\) (.*?)\) (\d+)/{$prefer="prefer $2 "; "best $1"}/e;
  s/safe_tac \(claset \(\) (.*?)\)/safe $1/g;
  s/clarify_tac \(claset \(\) (.*?)\) 1/clarify $1/g;

  # --- combined classical/simplifier tactics ---
  s/Auto_tac/auto/g;
  s/Force_tac 1/force/g;
  s/^Force_tac (\d+)/{$prefer="prefer $1 "; "force"}/e;
  s/Clarsimp_tac 1/clarsimp/g;
  s/auto_tac \(claset \(\) (.*?), *simpset \(\) (.*?)\)/auto $1 $2/g;
  s/force_tac \(claset \(\) (.*?), *simpset \(\) (.*?)\) 1/force $1 $2/g;
  s/^force_tac \(claset \(\) (.*?), *simpset \(\) (.*?)\) (\d+)/{$prefer="prefer $3 "; "force $1 $2"}/e;
  s/clarsimp_tac \(claset \(\) (.*?), *simpset \(\) (.*?)\) 1/clarsimp $1 $2/g;

  # --- simplifier, implicit simpset ---
  s/Asm_full_simp_tac 1/simp/g;
  s/Full_simp_tac 1/simp (no_asm_use)/g;
  s/Asm_simp_tac 1/simp (no_asm_simp)/g;
  s/Simp_tac 1/simp (no_asm)/g;
  s/ALLGOALS Asm_full_simp_tac/simp_all/g;
  s/ALLGOALS Full_simp_tac/simp_all (no_asm_use)/g;
  s/ALLGOALS Asm_simp_tac/simp_all (no_asm_simp)/g;
  s/ALLGOALS Simp_tac/simp_all (no_asm)/g;

  # --- simplifier, explicit simpset ---
  s/asm_full_simp_tac \(simpset \(\) (.*?)\) 1/simp $1/g;
  s/full_simp_tac \(simpset \(\) (.*?)\) 1/simp (no_asm_use) $1/g;
  s/asm_simp_tac \(simpset \(\) (.*?)\) 1/simp (no_asm_simp) $1/g;
  s/simp_tac \(simpset \(\) (.*?)\) 1/simp (no_asm) $1/g;
  s/ALLGOALS \(asm_full_simp_tac \(simpset \(\) (.*?)\) \)/simp_all $1/g;
  s/ALLGOALS \(full_simp_tac \(simpset \(\) (.*?)\) \)/simp_all (no_asm_use) $1/g;
  s/ALLGOALS \(asm_simp_tac \(simpset \(\) (.*?)\) \)/simp_all (no_asm_simp) $1/g;
  s/ALLGOALS \(simp_tac \(simpset \(\) (.*?)\) \)/simp_all (no_asm) $1/g;

  # --- miscellaneous basic tactics ---
  s/a(ssume_)?tac 1/assumption/g;
  s/^a(ssume_)?tac (\d+)/{$prefer="prefer $2 "; "assumption"}/e;
  s/\bmp_tac 1/erule (1) notE impE/g;
  s/\bmp_tac (\d+)/erule_tac [$1] notE impE, tactic \"assume_tac $1\"/g;
  s/hypsubst_tac 1/hypsubst/g;
  s/arith_tac 1/arith/g;
  s/strip_tac 1/intro strip/g;
  s/split_all_tac 1/simp (no_asm_simp) only: split_tupled_all/g;
  s/smp_tac (\d+) (\d+)/tactic "smp_tac $1 $2"/g;
  s/rotate_tac (\d+) (\d+)/rotate_tac [$2] $1/g;
  s/rotate_tac ~ *(\d+) (\d+)/rotate_tac [$2] -$1/g;
  s/rename_tac (\".*?\") (\d+)/rename_tac [$2] $1/g;
  s/case_tac (\".*?\") (\d+)/case_tac [$2] $1/g;
  s/induct_tac (\".*?\") (\d+)/induct_tac [$2] $1/g;
  s/induct_thm_tac ([\w\'\. \[,\]]+?) (\".*?\") (\d+)/induct_tac [$3] $2 rule: $1/g;
  s/subgoal_tac (\".*?\") (\d+)/subgoal_tac [$2] $1/g;
  s/thin_tac (\".*?\") *(\d+)/erule_tac [$2] V = $1 in thin_rl/g;

  # --- tacticals and theorem composition ---
  s/THEN /, /g;
  s/ORELSE/|/g;
  subst_RS();
  s/\(\"(.*?)\" *, *(\".*?\")\) , */$1 = $2 and /g; # instantiations
  s/\(\"(.*?)\" *, *(\".*?\")\)/$1 = $2/g;          # last instantiation

  # --- resolution tactics ---
  s/rewtac ([\w\'\. \[,\]]+)/unfold $1/g;
  s/stac ([\w\'\. \[,\]]+?) 1/subst $1/g;
  s/rtac ([\w\'\. \[,\]]+?) 1/rule $1/g;
  s/rtac ([\w\'\. \[,\]]+?) (\d+)/rule_tac [$2] $1/g;
  s/res_inst_tac \[(.*?)\] ([\w\'\. \[,\]]+?) (\d+)/rule_tac [$3] $1 in $2/g;
  s/dtac ([\w\'\. \[,\]]+?) 1/drule $1/g;
  s/dtac ([\w\'\. \[,\]]+?) (\d+)/drule_tac [$2] $1/g;
  s/dres_inst_tac \[(.*?)\] ([\w\'\. \[,\]]+?) (\d+)/drule_tac [$3] $1 in $2/g;
  s/datac ([\w\'\. \[,\]]+?) (\d+) 1/drule ($2) $1/g;
  s/etac ([\w\'\. \[,\]]+?) 1/erule $1/g;
  s/etac ([\w\'\. \[,\]]+?) (\d+)/erule_tac [$2] $1/g;
  s/eres_inst_tac \[(.*?)\] ([\w\'\. \[,\]]+?) (\d+)/erule_tac [$3] $1 in $2/g;
  s/eatac ([\w\'\. \[,\]]+?) (\d+) 1/erule ($2) $1/g;
  s/forward_tac \[([\w\'\. \[,\]]+)\] 1/frule $1/g;
  s/forward_tac \[([\w\'\. \[,\]]+)\] (\d+)/frule_tac [$2] $1/g;
  s/ftac ([\w\'\. \[,\]]+?) 1/frule $1/g;
  s/ftac ([\w\'\. \[,\]]+?) (\d+)/frule_tac [$2] $1/g;
  s/forw_inst_tac \[(.*?)\] ([\w\'\. \[,\]]+?) (\d+)/frule_tac [$3] $1 in $2/g;
  s/fatac ([\w\'\. \[,\]]+?) (\d+) 1/frule ($2) $1/g;

  # --- tactics and modifiers taking theorem lists (flattened by thmlist) ---
  s/fold_goals_tac *(\[[\w\'\. ,]*\]|[\w\'\. \[,\]]+)/"fold ".thmlist($1)/eg;
  s/rewrite_goals_tac *(\[[\w\'\. ,]*\]|[\w\'\. \[,\]]+)/"unfold ".thmlist($1)/eg;
  s/cut_inst_tac \[(.*?)\] ([\w\'\. \[,\]]+?) (\d+)/cut_tac [$3] $1 in $2/g;
  s/cut_facts_tac *(\[[\w\'\. ,]*\]|[\w\'\. \[,\]]+) (\d+)/"cut_tac [$2] ".thmlist($1)/eg;
  s/resolve_tac *(\[[\w\'\. ,]*\]|[\w\'\. \[,\]]+) 1/"rule ".thmlist($1)/eg;
  s/addIs *(\[[\w\'\. ,]*\]|[\w\'\. \[,\]]+)/"intro: ".thmlist($1)/eg;
  s/addSIs *(\[[\w\'\. ,]*\]|[\w\'\. \[,\]]+)/"intro!: ".thmlist($1)/eg;
  s/addEs *(\[[\w\'\. ,]*\]|[\w\'\. \[,\]]+)/"elim: ".thmlist($1)/eg;
  s/addSEs *(\[[\w\'\. ,]*\]|[\w\'\. \[,\]]+)/"elim!: ".thmlist($1)/eg;
  s/addDs *(\[[\w\'\. ,]*\]|[\w\'\. \[,\]]+)/"dest: ".thmlist($1)/eg;
  s/addSDs *(\[[\w\'\. ,]*\]|[\w\'\. \[,\]]+)/"dest!: ".thmlist($1)/eg;
  s/delrules *(\[[\w\'\. ,]*\]|[\w\'\. \[,\]]+)/"del: ".thmlist($1)/eg;
  s/addsimps *(\[[\w\'\. ,]*\]|[\w\'\. \[,\]]+)/"$simpmodmod"."add: ".thmlist($1)/eg;
  s/delsimps *(\[[\w\'\. ,]*\]|[\w\'\. \[,\]]+)/"$simpmodmod"."del: ".thmlist($1)/eg;
  s/addcongs *(\[[\w\'\. ,]*\]|[\w\'\. \[,\]]+)/"cong add: ".thmlist($1)/eg;
  s/delcongs *(\[[\w\'\. ,]*\]|[\w\'\. \[,\]]+)/"cong del: ".thmlist($1)/eg;
  s/addsplits *(\[[\w\'\. ,]*\]|[\w\'\. \[,\]]+)/"split add: ".thmlist($1)/eg;
  s/delsplits *(\[[\w\'\. ,]*\]|[\w\'\. \[,\]]+)/"split del: ".thmlist($1)/eg;

  # --- final clean-up ---
  s/_tac \[1\]/_tac/g;      # goal number 1 is the default, drop it
  s/ +/ /g;                 # remove multiple whitespace
  s/\( /\(/g; s/ \)/\)/g;   # remove leading and trailing space inside parentheses
  s/^ *(.*?) *$/$1/s;       # remove enclosing whitespace
  s/^([a-zA-Z])/ $1/ if (!($lead =~ m/[\s\(]$/)); # add space if required
  $prefer."apply".$lead.$_;
}
# lemmaname() - reserve the next slot of the global @lemmanames table
# (advancing the global $lemmacount), pre-fill it with "??unknown??" and
# return the placeholder "@@N@@" that stands for slot N in the output.
sub lemmaname {
    $lemmacount++;
    $lemmanames[$lemmacount] = "??unknown??";
    return join("", "@@", $lemmacount, "@@");
}
# backpatch_lemmanames() - finish the conversion of the current input file.
#
# Does nothing while no file is being processed ($currfile is "").
# Otherwise it closes the temporary output (ARGVOUT), copies $tmpfile to
# $finalfile while replacing every "@@N@@" placeholder by $lemmanames[N],
# renames the original input to "$currfile~0~" (unless the input was the
# stdin stand-in $default) and removes $tmpfile.
#
# Reads the globals $currfile, $default, $finalfile, $tmpfile and
# @lemmanames.  Dies if the final or the temporary file cannot be
# opened or the final file cannot be written completely; problems with
# renaming or removing files only produce a warning.
sub backpatch_lemmanames {
  return if $currfile eq "";

  select(STDOUT);
  close(ARGVOUT);

  open(TMPW, '>', $finalfile)
    or die "Can't write final file $finalfile: $!\n";
  open(TMPR, '<', $tmpfile)
    or die "Can't find tmp file $tmpfile: $!\n";
  # a lexical line buffer keeps the caller's $_ intact
  while (defined(my $line = <TMPR>)) {
    $line =~ s/@@(\d+)@@/$lemmanames[$1]/eg;
    print TMPW $line;
  }
  close(TMPR);
  # buffered write errors only show up when the handle is closed
  close(TMPW) or die "Can't finish writing $finalfile: $!\n";

  # use the built-ins instead of "mv"/"rm" via the shell, so that file
  # names containing blanks or shell metacharacters are handled correctly
  if ($currfile ne $default) {
    rename($currfile, "$currfile~0~")
      or warn "Can't rename $currfile to $currfile~0~: $!\n";
  }
  unlink($tmpfile) or warn "Can't remove tmp file $tmpfile: $!\n";
}
# done(NAME, ATTR) - record NAME followed by ATTR as the name of the lemma
# that was opened last (slot $lemmacount of the global @lemmanames) and
# return the Isar command "done" that closes its proof.
sub done {
    my ($name, $attr) = @_;
    $lemmanames[$lemmacount] = $name . $attr;
    return "done";
}
# ---- main program ----
# Reads the input files (or stdin) one ML command at a time, converts the
# command and writes it to a temporary file; backpatch_lemmanames() turns
# that into the final ".thy" file once the input file is exhausted.
#
# $currfile  input file being converted ("" before the first line is read)
# $default   file name used in place of "-" when reading from stdin
$currfile = "";
$default = "convert_default_stdout";
while (<>) { # main loop
  # <> reports stdin as "-".  Map it to $default *before* comparing with
  # $currfile; otherwise stdin would look like a new file on every
  # iteration and the output would be restarted for each command.
  my $infile = ($ARGV eq "-" ? $default : $ARGV);
  if ($infile ne $currfile) {   # first line of a new input file
    $x=$_; backpatch_lemmanames(); $_=$x;   # finish the previous file, keep $_
    $currfile = $infile;
    $lemmacount=0;
    $finalfile = "$currfile.thy";
    $tmpfile = "$finalfile.~0~";
    open(ARGVOUT, '>', $tmpfile)
      or die "Can't write tmp file $tmpfile: $!\n";
    select(ARGVOUT);            # plain "print" now goes to the tmp file
  }
 nl:
  # collect input lines until one ends with ";" (optionally followed by
  # whitespace or the start of a comment); the ";" itself is removed
  if(!s/;(\s*?(\n?$|\(\*))/$1/s && !eof()) {# no end_of_ML_command marker
    $_ = $_ . <>;
    goto nl;
  }
  s/\\(\s*\n\s*)\\/ $1 /g; # remove backslashes escaping newlines
 nlc:
  # split into leading whitespace, the command text and trailing whitespace
  m/^(\s*)(.*?)(\s*)$/s;
  $head=$1; $line=$2; $tail=$3;
  $tail =~ s/\s+\n/\n/sg; # remove trailing whitespace at end of lines
  print $head; $_=$line.$tail;
  if ($line =~ m/^\(\*/) { # start comment
    # copy the comment through unchanged, reading on until "*)" is found
    while (($i = index $_,"*)") == -1 && !eof()) { # no end comment
      print;
      $_ = <>;
    }
    if ($i == -1) { print; last; }   # unterminated comment at end of input
    print substr $_,0,$i+2;
    $_ = substr $_,$i+2;
    goto nlc;                        # process whatever follows the comment
  }
  $_=$line;
  if(!($head =~ m/^\n/)) { $head = "\n$head"; }

  # goal statements: each gets a placeholder name that is patched later
  s/^Goalw *(\[[\w\'\.\s,]*\]|[\w\'\. \[,\]]+) *(.+)/
    "lemma ".lemmaname().": $2$head"."apply (unfold ".thmlist($1).")"/se;
  s/^Goal *(.+)/"lemma ".lemmaname().": $1"/se;
  s/\bgoal/"(*".lemmaname()."*)goal"/se; # ugly old-style goals

  # end of proof: done() records the real lemma name for the placeholder
  s/^qed_spec_mp *\"(.*?)\"/done($1," [rule_format (no_asm)]")/se;
  s/^qed *\"(.*?)\"/done($1,"")/se;
  s/^val *(\w+) *= *result *\( *\) *$/done($1,"")/se;
  s/^bind_thm *\( *\"(.*?)\" *, *(result *\( *\) *?) *\) *$/done($1,"")/se;
  s/^bind_thm *\( *\"(.*?)\" *, *(.*?result *\( *\).*?) *\) *$/done($1,"[?? $2 ??] ")/se;
  s/^bind_thm *\( *\"(.*?)\" *, *(.*?) *\) *$/"lemmas $1 = ".subst_RS_standard($2)/se;

  # proof steps
  s/^by(\s*\(?\s*)(.*?)\s*(\)?)\s*$/process_tac($1,$2).$3/se;
  s/^b\s+y(\s*)(.*?)(\s*)$/process_tac($1,"(".$2.")").$3/se;
  s/^(apply +)\( *([\w\'\.]+)\s*\)\s*$/$1$2/;
			 # remove outermost parentheses if around atoms

  # global declarations
  s/^Addsimps\s*\[?\s*([\w\'\. ,]*)\s*\]?/decl($1,"simp")/seg;
  s/^Delsimps\s*\[?\s*([\w\'\. ,]*)\s*\]?/decl($1,"simp del")/seg;
  s/^Addsplits\s*\[?\s*([\w\'\. ,]*)\s*\]?/decl($1,"split")/seg;
  s/^Delsplits\s*\[?\s*([\w\'\. ,]*)\s*\]?/decl($1,"split del")/seg;
  s/^AddIs\s*\[?\s*([\w\'\. ,]*)\s*\]?/decl($1,"intro")/seg;
  s/^AddSIs\s*\[?\s*([\w\'\. ,]*)\s*\]?/decl($1,"intro!")/seg;
  s/^AddXIs\s*\[?\s*([\w\'\. ,]*)\s*\]?/decl($1,"intro?")/seg;
  s/^AddEs\s*\[?\s*([\w\'\. ,]*)\s*\]?/decl($1,"elim")/seg;
  s/^AddSEs\s*\[?\s*([\w\'\. ,]*)\s*\]?/decl($1,"elim!")/seg;
  s/^AddXEs\s*\[?\s*([\w\'\. ,]*)\s*\]?/decl($1,"elim?")/seg;
  s/^AddDs\s*\[?\s*([\w\'\. ,]*)\s*\]?/decl($1,"dest")/seg;
  s/^AddSDs\s*\[?\s*([\w\'\. ,]*)\s*\]?/decl($1,"dest!")/seg;
  s/^AddXDs\s*\[?\s*([\w\'\. ,]*)\s*\]?/decl($1,"dest?")/seg;
  s/^AddIffs\s*\[?\s*([\w\'\. ,]*)\s*\]?/decl($1,"iff")/seg;
  print "$_$tail";
  if(eof()) { last; } # prevents reading finally from stdin (thru <>)!
}
backpatch_lemmanames();   # finish the last input file
select(STDOUT);