author | bulwahn |
Fri, 03 Dec 2010 08:40:47 +0100 | |
changeset 40910 | 508c83827364 |
parent 40909 | e006d1e06920 |
child 40911 | 7febf76e0a69 |
permissions | -rw-r--r-- |
30824 | 1 |
(* Title: Tools/quickcheck.ML |
40246
c03fc7d3fa97
changed global fixed timeout to a configurable timeout for quickcheck; test parameters in quickcheck are now fully passed around with the context
bulwahn
parents:
40225
diff
changeset
|
2 |
Author: Stefan Berghofer, Florian Haftmann, Lukas Bulwahn, TU Muenchen |
28256 | 3 |
|
4 |
Generic counterexample search engine. |
|
5 |
*) |
|
6 |
||
7 |
(* Public interface of the generic counterexample search engine. *)
signature QUICKCHECK =
sig
  (* theory setup *)
  val setup: theory -> theory

  (* configuration *)
  (* global flags held in unsynchronized references *)
  val auto: bool Unsynchronized.ref
  val timing : bool Unsynchronized.ref
  (* context-dependent configuration options *)
  val tester : string Config.T
  val size : int Config.T
  val iterations : int Config.T
  val no_assms : bool Config.T
  val report : bool Config.T
  val quiet : bool Config.T
  val timeout : real Config.T
  val finite_types : bool Config.T
  val finite_type_size : int Config.T

  (* statistics accumulated over the test runs of one size *)
  datatype report = Report of
    { iterations : int,
      raised_match_errors : int,
      satisfied_assms : int list,
      positive_concl_tests : int }

  (* expected outcome of a quickcheck invocation *)
  datatype expectation = No_Expectation | No_Counterexample | Counterexample;

  (* test parameters stored in the context data *)
  datatype test_params = Test_Params of {default_type: typ list, expect : expectation};
  val test_params_of : Proof.context -> test_params
  val map_test_params :
    (typ list * expectation -> typ list * expectation)
      -> Context.generic -> Context.generic

  (* registration of a named tester *)
  val add_generator:
    string * (Proof.context -> term -> int -> term list option * (bool list * bool))
      -> Context.generic -> Context.generic

  (* testing terms and proof states *)
  val test_term: Proof.context -> bool -> term ->
    (string * term) list option * ((string * int) list * ((int * report) list) option)
  val test_goal_terms:
    Proof.context -> bool -> (string * typ) list -> term list
      -> (string * term) list option * ((string * int) list * ((int * report) list) option) list
  val quickcheck: (string * string list) list -> int -> Proof.state -> (string * term) list option
end;
41 |
||
42 |
structure Quickcheck : QUICKCHECK = |
|
43 |
struct |
|
44 |
||
30980 | 45 |
(* preferences *) |
46 |
||
32740 | 47 |
(* global flag: run Quickcheck automatically *)
val auto : bool Unsynchronized.ref = Unsynchronized.ref false;

(* global flag exported as "timing"; its consumers are not visible in this part of the file *)
val timing : bool Unsynchronized.ref = Unsynchronized.ref false;

(* Register "auto-quickcheck" as a Proof General preference in the tracing category.
   The preference is built while auto is temporarily set to true
   (presumably so that true is recorded as its default -- confirm against Preferences.bool_pref). *)
val _ =
  let
    fun auto_quickcheck_pref () =
      Preferences.bool_pref auto
        "auto-quickcheck"
        "Run Quickcheck automatically.";
  in
    ProofGeneralPgip.add_preference Preferences.category_tracing
      (Unsynchronized.setmp auto true auto_quickcheck_pref ())
  end;
30980 | 57 |
|
35378
95d0e3adf38e
added basic reporting of test cases to quickcheck
bulwahn
parents:
35324
diff
changeset
|
58 |
(* quickcheck report *) |
95d0e3adf38e
added basic reporting of test cases to quickcheck
bulwahn
parents:
35324
diff
changeset
|
59 |
|
95d0e3adf38e
added basic reporting of test cases to quickcheck
bulwahn
parents:
35324
diff
changeset
|
60 |
(* outcome of a single test run:
   Run (assms, concl) carries one flag per assumption plus one flag for the conclusion;
   MatchExc marks a run in which exception Match was raised *)
datatype single_report =
    Run of bool list * bool
  | MatchExc

(* counters accumulated from single_report values by collect_single_report *)
datatype report = Report of
  { iterations : int,             (* number of runs collected *)
    raised_match_errors : int,    (* number of MatchExc runs *)
    satisfied_assms : int list,   (* per assumption: runs whose flag was true *)
    positive_concl_tests : int }  (* runs whose conclusion flag was true *)
95d0e3adf38e
added basic reporting of test cases to quickcheck
bulwahn
parents:
35324
diff
changeset
|
65 |
|
95d0e3adf38e
added basic reporting of test cases to quickcheck
bulwahn
parents:
35324
diff
changeset
|
66 |
(* Fold the outcome of one test run into an accumulated report.
   Every run increments iterations.  MatchExc additionally increments
   raised_match_errors.  Run (assms, concl) increments the counter of each
   assumption whose flag is true and, if concl is true, positive_concl_tests.
   An empty satisfied_assms list is treated as all-zero counters of the
   right length. *)
fun collect_single_report single_report
    (Report {iterations, raised_match_errors, satisfied_assms, positive_concl_tests}) =
  let
    val iterations' = iterations + 1
  in
    (case single_report of
      MatchExc =>
        Report {iterations = iterations', raised_match_errors = raised_match_errors + 1,
          satisfied_assms = satisfied_assms, positive_concl_tests = positive_concl_tests}
    | Run (assms, concl) =>
        let
          (* counters start out as [] before the first Run has been collected *)
          val counters =
            if null satisfied_assms then replicate (length assms) 0 else satisfied_assms
          fun bump holds count = if holds then count + 1 else count
        in
          Report {iterations = iterations', raised_match_errors = raised_match_errors,
            satisfied_assms = map2 bump assms counters,
            positive_concl_tests = positive_concl_tests + (if concl then 1 else 0)}
        end)
  end
30973
304ab57afa6e
observe distinction between Pure/Tools and Tools more closely
haftmann
parents:
30824
diff
changeset
|
79 |
|
37929
22e0797857e6
adding checking of expected result for the tool quickcheck; annotated a few quickcheck examples
bulwahn
parents:
37913
diff
changeset
|
80 |
(* expectation *) |
22e0797857e6
adding checking of expected result for the tool quickcheck; annotated a few quickcheck examples
bulwahn
parents:
37913
diff
changeset
|
81 |
|
22e0797857e6
adding checking of expected result for the tool quickcheck; annotated a few quickcheck examples
bulwahn
parents:
37913
diff
changeset
|
82 |
(* expected outcome of a quickcheck invocation *)
datatype expectation = No_Expectation | No_Counterexample | Counterexample;

(* Merge two expectations: identical expectations are kept,
   differing ones collapse to No_Expectation. *)
fun merge_expectation (expect1, expect2) =
  (case (expect1, expect2) of
    (No_Counterexample, No_Counterexample) => No_Counterexample
  | (Counterexample, Counterexample) => Counterexample
  | _ => No_Expectation)
22e0797857e6
adding checking of expected result for the tool quickcheck; annotated a few quickcheck examples
bulwahn
parents:
37913
diff
changeset
|
86 |
|
28315 | 87 |
(* quickcheck configuration -- default parameters, test generators *) |
40908 | 88 |
(* Each configuration option is declared together with the setup function
   that installs it; the last argument yields the default value. *)

(* name of the tester to use; empty by default *)
val (tester, setup_tester) =
  Attrib.config_string "quickcheck_tester" (K "")

(* upper bound for the test data size *)
val (size, setup_size) =
  Attrib.config_int "quickcheck_size" (K 10)

(* number of test runs per size for iteratable testers *)
val (iterations, setup_iterations) =
  Attrib.config_int "quickcheck_iterations" (K 100)

val (no_assms, setup_no_assms) =
  Attrib.config_bool "quickcheck_no_assms" (K false)

(* whether test_term returns the collected reports *)
val (report, setup_report) =
  Attrib.config_bool "quickcheck_report" (K true)

(* suppresses progress messages and warnings *)
val (quiet, setup_quiet) =
  Attrib.config_bool "quickcheck_quiet" (K false)

(* time limit in seconds for executing the tests *)
val (timeout, setup_timeout) =
  Attrib.config_real "quickcheck_timeout" (K 30.0)

val (finite_types, setup_finite_types) =
  Attrib.config_bool "quickcheck_finite_types" (K true)

(* how many of the Enum.finite_N types get_finite_types returns *)
val (finite_type_size, setup_finite_type_size) =
  Attrib.config_int "quickcheck_finite_type_size" (K 3)

(* install all configuration options, in declaration order *)
fun setup_config thy =
  thy
  |> setup_tester
  |> setup_size
  |> setup_iterations
  |> setup_no_assms
  |> setup_report
  |> setup_quiet
  |> setup_timeout
  |> setup_finite_types
  |> setup_finite_type_size
|
40646 | 101 |
|
40644
0850a2a16dce
changed old-style quickcheck configurations to new Config.T configurations
bulwahn
parents:
40643
diff
changeset
|
102 |
(* test parameters kept in the context data: default types and expected outcome *)
datatype test_params = Test_Params of
  {default_type: typ list, expect : expectation};

(* view test parameters as the pair (default_type, expect) *)
fun dest_test_params (Test_Params params) = (#default_type params, #expect params);

(* inverse of dest_test_params *)
fun make_test_params (tys, expectation) =
  Test_Params {default_type = tys, expect = expectation};

(* apply f to the pair view of the test parameters *)
fun map_test_params' f params = make_test_params (f (dest_test_params params));
38759
37a9092de102
simplification/standardization of some theory data;
wenzelm
parents:
38390
diff
changeset
|
110 |
|
37a9092de102
simplification/standardization of some theory data;
wenzelm
parents:
38390
diff
changeset
|
111 |
(* Merge two sets of test parameters: the default type lists are combined
   with merge (op =), the expectations with merge_expectation. *)
fun merge_test_params (params1, params2) =
  let
    val (default_type1, expect1) = dest_test_params params1;
    val (default_type2, expect2) = dest_test_params params2;
  in
    make_test_params
      (merge (op =) (default_type1, default_type2), merge_expectation (expect1, expect2))
  end;
28309 | 115 |
|
39252
8f176e575a49
changing the container for the quickcheck options to a generic data
bulwahn
parents:
39138
diff
changeset
|
116 |
(* Generic context data: the registered testers (association list keyed by
   name) paired with the current test parameters. *)
structure Data = Generic_Data
(
  type T =
    (string * (Proof.context -> term -> int -> term list option * (bool list * bool))) list
      * test_params;
  (* no testers, no default types, no expectation *)
  val empty = ([], Test_Params {default_type = [], expect = No_Expectation});
  val extend = I;
  (* testers are merged by name (K true accepts same-named entries from both sides);
     parameters are merged with merge_test_params *)
  fun merge ((testers1, test_params1), (testers2, test_params2)) : T =
    (AList.merge (op =) (K true) (testers1, testers2),
      merge_test_params (test_params1, test_params2));
);
28256 | 127 |
|
39252
8f176e575a49
changing the container for the quickcheck options to a generic data
bulwahn
parents:
39138
diff
changeset
|
128 |
(* test parameters stored in a proof context *)
fun test_params_of ctxt = snd (Data.get (Context.Proof ctxt));

(* default types stored in a proof context *)
fun default_type ctxt = fst (dest_test_params (test_params_of ctxt));

(* expectation stored in a proof context *)
fun expect ctxt = snd (dest_test_params (test_params_of ctxt));

(* update the test parameters of a generic context via their pair view *)
fun map_test_params f = Data.map (apsnd (map_test_params' f));

(* register a named tester, replacing any entry with the same name *)
fun add_generator named_tester = Data.map (apfst (AList.update (op =) named_tester));
137 |
||
28315 | 138 |
(* generating tests *) |
139 |
||
40909
e006d1e06920
renamed parameter from generator to tester; quickcheck only applies one tester on invocation
bulwahn
parents:
40908
diff
changeset
|
140 |
(* Build the test function for term t with the tester selected by the
   "quickcheck_tester" option.
   Fails with error if no tester of that name is registered.
   In quiet mode the application of the tester to t is wrapped in try,
   yielding NONE on failure; otherwise any exception raised by it is
   re-raised and the result is always SOME. *)
fun mk_tester ctxt t =
  let
    val name = Config.get ctxt tester
    val registered = fst (Data.get (Context.Proof ctxt))
    val compile =
      (case AList.lookup (op =) registered name of
        SOME mk => mk ctxt
      | NONE => error ("No such quickcheck tester: " ^ name))
  in
    if Config.get ctxt quiet then try compile t
    else
      let
        val outcome = Exn.interruptible_capture compile t
      in
        (case Exn.get_result outcome of
          SOME test_fun => SOME test_fun
        | NONE => SOME (Exn.release outcome))  (* releasing re-raises the captured exception *)
      end
  end
28315 | 157 |
|
158 |
(* testing propositions *) |
|
159 |
||
28309 | 160 |
(* Prepare a term for testing: reject terms with type variables (schematic
   or free) or schematic term variables, then abstract over all free
   variables.  Returns the names of the free variables together with the
   abstracted term. *)
fun prep_test_term t =
  let
    val _ =
      if null (Term.add_tvars t []) andalso null (Term.add_tfrees t []) then ()
      else error "Term to be tested contains type variables";
    val _ =
      if null (Term.add_vars t []) then ()
      else error "Term to be tested contains schematic variables";
    val frees = Term.add_frees t [];
  in (map fst frees, list_abs_free (frees, t)) end
28256 | 168 |
|
35324
c9f428269b38
adopting mutabelle and quickcheck to return timing information; exporting make_case_combs in datatype package for predicate compiler; adding Spec_Rules declaration for tail recursive functions; improving the predicate compiler and function flattening
bulwahn
parents:
35077
diff
changeset
|
169 |
(* Run f () and measure its CPU time in milliseconds.
   Returns (result, (description, time)).  An exception raised by f is
   captured while the time is taken and re-raised afterwards. *)
fun cpu_time description f =
  let
    val timer = start_timing ()
    val outcome = Exn.capture f ()
    val millis = Time.toMilliseconds (#cpu (end_timing timer))
  in (Exn.release outcome, (description, millis)) end
c9f428269b38
adopting mutabelle and quickcheck to return timing information; exporting make_case_combs in datatype package for predicate compiler; adding Spec_Rules declaration for tail recursive functions; improving the predicate compiler and function flattening
bulwahn
parents:
35077
diff
changeset
|
175 |
|
40648
1598ec648b0d
splitting test_goal function in two functions; exporting new configurations in quickcheck; iterations depend on generator_name in quickcheck
bulwahn
parents:
40647
diff
changeset
|
176 |
(* we actually assume we know the generators and their behaviour:
   only the testers named "SML" and "random" are treated as iteratable *)
fun is_iteratable name = name = "SML" orelse name = "random"
40648
1598ec648b0d
splitting test_goal function in two functions; exporting new configurations in quickcheck; iterations depend on generator_name in quickcheck
bulwahn
parents:
40647
diff
changeset
|
180 |
|
40909
e006d1e06920
renamed parameter from generator to tester; quickcheck only applies one tester on invocation
bulwahn
parents:
40908
diff
changeset
|
181 |
(* Test term t with the tester configured in ctxt.

   Result: (counterexample, (timings, reports)) where
   - counterexample is SOME of the free variable names of t zipped with the
     terms returned by the tester, or NONE if none was found;
   - timings lists the CPU times (in milliseconds) of test execution and of
     compilation, or only of compilation if no test function could be built;
   - reports is SOME list of (size, report) pairs, most recent size first,
     if the "quickcheck_report" option is set, otherwise NONE.

   Testing proceeds through sizes 1 .. "quickcheck_size"; for each size k the
   test function is applied to k - 1, "quickcheck_iterations" times for
   iteratable testers and once otherwise.  The whole execution is subject to
   "quickcheck_timeout" (seconds): on timeout an error is raised if
   is_interactive, otherwise TimeLimit.TimeOut is propagated. *)
fun test_term ctxt is_interactive t =
  let
    val (names, t') = prep_test_term t;
    (* size currently under test, only used for the timeout message *)
    val current_size = Unsynchronized.ref 0
    fun excipit s =
      "Quickcheck " ^ s ^ " while testing at size " ^ string_of_int (!current_size)
    val (test_fun, comp_time) = cpu_time "quickcheck compilation" (fn () => mk_tester ctxt t');
    (* run f up to j times, stopping at the first counterexample;
       a non-positive j performs no run at all, so that a negative
       "quickcheck_iterations" cannot recurse without bound *)
    fun iterate f j acc =
      if j <= 0 then (NONE, acc)
      else
        let
          (* a Match exception raised by the test counts as a run without result *)
          val (test_result, single_report) = apsnd Run (f ()) handle Match =>
            (if Config.get ctxt quiet then ()
             else warning "Exception Match raised during quickcheck"; (NONE, MatchExc))
          val acc' = collect_single_report single_report acc
        in
          case test_result of NONE => iterate f (j - 1) acc' | SOME q => (SOME q, acc')
        end
    val empty_report = Report { iterations = 0, raised_match_errors = 0,
      satisfied_assms = [], positive_concl_tests = 0 }
    (* test with sizes k, k + 1, ... up to the configured maximum *)
    fun with_size test_fun k reports =
      if k > Config.get ctxt size then (NONE, reports)
      else
       (if Config.get ctxt quiet then () else Output.urgent_message ("Test data size: " ^ string_of_int k);
        let
          val _ = current_size := k
          val niterations =
            if is_iteratable (Config.get ctxt tester) then Config.get ctxt iterations else 1
          (* the per-size timing is measured but not reported *)
          val ((result, new_report), _) = cpu_time ("size " ^ string_of_int k)
            (fn () => iterate (fn () => test_fun (k - 1)) niterations empty_report)
          val reports = ((k, new_report) :: reports)
        in case result of NONE => with_size test_fun (k + 1) reports | SOME q => (SOME q, reports) end);
  in
    case test_fun of NONE => (NONE, ([comp_time], NONE))
      | SOME test_fun =>
        TimeLimit.timeLimit (seconds (Config.get ctxt timeout)) (fn () =>
          let
            val ((result, reports), exec_time) =
              cpu_time "quickcheck execution" (fn () => with_size test_fun 1 [])
          in
            ((case result of NONE => NONE | SOME ts => SOME (names ~~ ts)),
              ([exec_time, comp_time], if Config.get ctxt report then SOME reports else NONE))
          end) ()
        handle TimeLimit.TimeOut =>
          if is_interactive then error (excipit "ran out of time") else raise TimeLimit.TimeOut
  end;
226 |
||
40647 | 227 |
(*The leading finite_type_size many types among Enum.finite_1 ... Enum.finite_5,
  each built as a type constructor without arguments.*)
fun get_finite_types ctxt =
  let
    val limit = Config.get ctxt finite_type_size
    val candidates =
      map (fn name => Type (name, []))
        ["Enum.finite_1", "Enum.finite_2", "Enum.finite_3", "Enum.finite_4", "Enum.finite_5"]
    val (selected, _) = chop limit candidates
  in selected end
|
231 |
||
37913
e85f5ad02a8f
correcting wellsortedness check and improving error message
bulwahn
parents:
37912
diff
changeset
|
232 |
(*Raised by monomorphic_term when a chosen type does not have the sort of the
  type variable it is meant to replace; carries the explanation text.*)
exception WELLSORTED of string

(*Replace every free type variable of a term: a variable listed in insts gets
  its associated type, any other variable gets default_T.  The replacement must
  be of the variable's sort, otherwise WELLSORTED is raised.*)
fun monomorphic_term thy insts default_T =
  let
    fun show_typ T = Syntax.string_of_typ_global thy T
    fun instantiate (tvar as TFree (name, sort)) =
          let
            val replacement = the_default default_T (AList.lookup (op =) insts name)
          in
            if Sign.of_sort thy (replacement, sort) then replacement
            else
              raise WELLSORTED
                ("For instantiation with default_type " ^ show_typ default_T ^
                  ":\n" ^ show_typ replacement ^
                  " to be substituted for variable " ^
                  show_typ tvar ^ " does not have sort " ^
                  Syntax.string_of_sort_global thy sort)
          end
      | instantiate other = other
  in map_types (map_atyps instantiate) end;
|
249 |
||
37913
e85f5ad02a8f
correcting wellsortedness check and improving error message
bulwahn
parents:
37912
diff
changeset
|
250 |
(*Outcome of instantiating one goal with one candidate type: either the
  instantiated term or the text of the wellsortedness failure.*)
datatype wellsorted_error = Wellsorted_Error of string | Term of term

(*Instantiate each goal in check_goals with each candidate type (the finite
  enumeration types if the finite_types option is set, otherwise the configured
  default types), then test the well-sorted instances one after another with
  test_term until a counterexample is found.

  Returns the first counterexample (or NONE) together with the reports of all
  instances tested so far, in testing order.  Fails with the collected
  wellsortedness messages if no instance is well-sorted.*)
fun test_goal_terms lthy is_interactive insts check_goals =
  let
    val thy = ProofContext.theory_of lthy
    val candidate_types =
      if Config.get lthy finite_types then get_finite_types lthy else default_type lthy
    fun instantiate check_goal T =
      Term ((Object_Logic.atomize_term thy o monomorphic_term thy insts T) check_goal)
        handle WELLSORTED s => Wellsorted_Error s
    val inst_goals =
      maps (fn check_goal => map (instantiate check_goal) candidate_types) check_goals
    val error_msg =
      cat_lines (map_filter (fn Term _ => NONE | Wellsorted_Error s => SOME s) inst_goals)
    val correct_inst_goals =
      (case map_filter (fn Term t => SOME t | Wellsorted_Error _ => NONE) inst_goals of
        [] => error error_msg
      | xs => xs)
    (*only warn when some instantiation actually failed: an empty message would
      otherwise show up as a blank warning on every non-quiet invocation*)
    val _ =
      if Config.get lthy quiet orelse error_msg = "" then () else warning error_msg
    fun collect_results _ reports [] = (NONE, rev reports)
      | collect_results f reports (t :: ts) =
          (case f t of
            (SOME res, report) => (SOME res, rev (report :: reports))
          | (NONE, report) => collect_results f (report :: reports) ts)
  in collect_results (test_term lthy is_interactive) [] correct_inst_goals end;
37912 | 276 |
|
40909
e006d1e06920
renamed parameter from generator to tester; quickcheck only applies one tester on invocation
bulwahn
parents:
40908
diff
changeset
|
277 |
(*Test subgoal i of the given proof state.

  The subgoal is stripped of its outermost "all" quantifiers and its parameters
  are substituted in; unless the no_assms option is set, the assumptions of the
  context are added as premises.  Inside a named locale target only the local
  assumptions are used, and the goal is tested once per registration of that
  locale, transported along the registration's morphism.*)
fun test_goal insts i state =
  let
    val lthy = Proof.context_of state;
    val thy = Proof.theory_of state;
    fun strip_all (Const ("all", _) $ Abs (_, _, body)) = strip_all body
      | strip_all other = other;
    val st = #goal (Proof.raw_goal state);
    val (subgoal, params) = Logic.goal_params (prop_of st) i;
    (*an empty target name counts as "no locale"*)
    val some_locale =
      (case Option.map #target (Named_Target.peek lthy) of
        SOME name => if name = "" then NONE else SOME name
      | NONE => NONE);
    val assms =
      if Config.get lthy no_assms then []
      else
        (case some_locale of
          SOME locale => Assumption.local_assms_of lthy (Locale.init locale thy)
        | NONE => Assumption.all_assms_of lthy);
    val proto_goal =
      Logic.list_implies (map Thm.term_of assms, subst_bounds (params, strip_all subgoal));
    val check_goals =
      (case some_locale of
        SOME locale =>
          map (fn (_, phi) => Morphism.term phi proto_goal)
            (Locale.registrations_of (Context.Theory thy) (*FIXME*) locale)
      | NONE => [proto_goal]);
  in
    test_goal_terms lthy true insts check_goals
  end
1598ec648b0d
splitting test_goal function in two functions; exporting new configurations in quickcheck; iterations depend on generator_name in quickcheck
bulwahn
parents:
40647
diff
changeset
|
300 |
|
37912 | 301 |
(* pretty printing *) |
28315 | 302 |
|
40225 | 303 |
(*Display name of the tool: "Auto Quickcheck" for automatic runs, otherwise "Quickcheck".*)
fun tool_name auto =
  let val prefix = if auto then "Auto " else ""
  in prefix ^ "Quickcheck" end
304 |
||
305 |
(*Pretty-print the outcome of a run: a fixed sentence if there is no
  counterexample, otherwise a heading followed by one "name = term" line per
  binding of the counterexample.*)
fun pretty_counterex ctxt auto outcome =
  let
    fun pretty_binding (name, value) =
      Pretty.block [Pretty.str (name ^ " ="), Pretty.brk 1, Syntax.pretty_term ctxt value]
  in
    (case outcome of
      NONE => Pretty.str (tool_name auto ^ " found no counterexample.")
    | SOME bindings =>
        Pretty.chunks
          (Pretty.str (tool_name auto ^ " found a counterexample:\n") ::
            map pretty_binding bindings))
  end;
|
310 |
||
35378
95d0e3adf38e
added basic reporting of test cases to quickcheck
bulwahn
parents:
35324
diff
changeset
|
311 |
(*Render one report as a list of "label: count" entries: iterations, match
  exceptions, one entry per assumption (numbered from 1) and the positive
  conclusion tests.*)
fun pretty_report
    (Report {iterations, raised_match_errors, satisfied_assms, positive_concl_tests}) =
  let
    fun stat label count = Pretty.block [Pretty.str (label ^ ": " ^ string_of_int count)]
    fun assm_stat (idx, count) =
      stat ("satisfied " ^ string_of_int (idx + 1) ^ ". assumption") count
    val leading = [stat "iterations" iterations, stat "match exceptions" raised_match_errors]
    val per_assumption = map_index assm_stat satisfied_assms
    val trailing = [stat "positive conclusion tests" positive_concl_tests]
  in
    leading @ per_assumption @ trailing
  end
95d0e3adf38e
added basic reporting of test cases to quickcheck
bulwahn
parents:
35324
diff
changeset
|
322 |
|
35380
6ac5b81a763d
adopting Mutabelle to quickcheck reporting; improving quickcheck reporting
bulwahn
parents:
35379
diff
changeset
|
323 |
(*Pretty-print optional per-size reports: nothing (an empty string) if there
  are none, otherwise a heading followed by one section per size, with the
  stored list traversed in reverse.*)
fun pretty_reports ctxt reports_opt =
  (case reports_opt of
    NONE => Pretty.str ""
  | SOME reports =>
      let
        fun section (size, report) =
          Pretty.str ("size " ^ string_of_int size ^ ":") :: pretty_report report @ [Pretty.brk 1]
      in
        Pretty.chunks (Pretty.str "Quickcheck report:" :: maps section (rev reports))
      end)
35378
95d0e3adf38e
added basic reporting of test cases to quickcheck
bulwahn
parents:
35324
diff
changeset
|
329 |
|
40225 | 330 |
(*Pretty-print the counterexample followed by the reports found in the second
  component of each entry of timing_and_reports.*)
fun pretty_counterex_and_reports ctxt auto (cex, timing_and_reports) =
  let
    val counterex_part = pretty_counterex ctxt auto cex
    val report_parts =
      map (fn (_, reports) => pretty_reports ctxt reports) timing_and_reports
  in
    Pretty.chunks (counterex_part :: report_parts)
  end
|
28315 | 333 |
|
334 |
(* automatic testing *) |
|
28309 | 335 |
|
33561
ab01b72715ef
introduced Auto Nitpick in addition to Auto Quickcheck;
blanchet
parents:
33560
diff
changeset
|
336 |
(*Automatic invocation on a proof state.  Does nothing unless the auto flag is
  set.  Otherwise the first subgoal is tested with reporting switched off and
  quiet mode switched on; any failure of the test is treated like "nothing
  found".  On success the highlighted counterexample is attached to the
  original state as goal message.  The boolean tells whether a counterexample
  was found.*)
fun auto_quickcheck state =
  if ! auto then
    let
      val ctxt = Proof.context_of state;
      val silent_state =
        Proof.map_context (Config.put quiet true o Config.put report false) state;
    in
      (case try (test_goal [] 1) silent_state of
        SOME (cex as SOME _, _) =>
          (true,
            Proof.goal_message
              (K (Pretty.chunks [Pretty.str "",
                Pretty.mark Markup.hilite (pretty_counterex ctxt true cex)])) state)
      | _ => (false, state))
    end
  else (false, state)
ab01b72715ef
introduced Auto Nitpick in addition to Auto Quickcheck;
blanchet
parents:
33560
diff
changeset
|
353 |
|
39324
05452dd66b2b
finished renaming "Auto_Counterexample" to "Auto_Tools"
blanchet
parents:
39253
diff
changeset
|
354 |
(*Theory setup: first register auto_quickcheck under the name "quickcheck",
  then apply setup_config.*)
val setup =
  setup_config o Auto_Tools.register_tool ("quickcheck", auto_quickcheck)
28315 | 356 |
|
30980 | 357 |
(* Isar commands *) |
28315 | 358 |
|
28336 | 359 |
(*Read a natural number; the whole string must be consumed and the value must
  not be negative, otherwise an error is raised.*)
fun read_nat s =
  let
    fun bad () = error ("Not a natural number: " ^ s)
  in
    (case Library.read_int (Symbol.explode s) of
      (k, []) => if k < 0 then bad () else k
    | _ => bad ())
  end;
|
37909
583543ad6ad1
changed default types to a list of types; extended quickcheck parameters to be a list of values to parse a list of default types
bulwahn
parents:
36960
diff
changeset
|
363 |
|
34128
8650a073dd9b
made Quickcheck take structured proof assumptions into account (like Refute and Nitpick) by default;
blanchet
parents:
33583
diff
changeset
|
364 |
(*Read "true" or "false"; any other text is an error.*)
fun read_bool s =
  (case s of
    "true" => true
  | "false" => false
  | _ => error ("Not a Boolean value: " ^ s))
28315 | 367 |
|
40366
a2866dbfbe6b
changing timeout to real value; handling Interrupt and Timeout more like nitpick does
bulwahn
parents:
40253
diff
changeset
|
368 |
(*Read a real number via Real.fromString; fails with an error if that yields nothing.*)
fun read_real s =
  (case Real.fromString s of
    NONE => error ("Not a real number: " ^ s)
  | SOME r => r)
a2866dbfbe6b
changing timeout to real value; handling Interrupt and Timeout more like nitpick does
bulwahn
parents:
40253
diff
changeset
|
372 |
|
37929
22e0797857e6
adding checking of expected result for the tool quickcheck; annotated a few quickcheck examples
bulwahn
parents:
37913
diff
changeset
|
373 |
(*Read the value of the "expect" parameter; unknown names are an error.*)
fun read_expectation s =
  (case s of
    "no_expectation" => No_Expectation
  | "no_counterexample" => No_Counterexample
  | "counterexample" => Counterexample
  | _ => error ("Not an expectation value: " ^ s))
22e0797857e6
adding checking of expected result for the tool quickcheck; annotated a few quickcheck examples
bulwahn
parents:
37913
diff
changeset
|
377 |
|
40909
e006d1e06920
renamed parameter from generator to tester; quickcheck only applies one tester on invocation
bulwahn
parents:
40908
diff
changeset
|
378 |
(*Turn one (name, values) test parameter into an update of the generic context.
  Every parameter except "default_type" takes exactly one value; any other
  combination of name and number of values is reported as an unknown test
  parameter.*)
fun parse_test_param (name, args) =
  let
    (*setters for single-valued options; the text is read before the update is built*)
    fun put_nat cfg text = Config.put_generic cfg (read_nat text)
    fun put_bool cfg text = Config.put_generic cfg (read_bool text)
  in
    (case (name, args) of
      ("tester", [text]) => Config.put_generic tester text
    | ("size", [text]) => put_nat size text
    | ("iterations", [text]) => put_nat iterations text
    | ("default_type", types) =>
        (*types are read in the proof context of the generic context being updated*)
        (fn gen_ctxt =>
          map_test_params
            (apfst (K (map (ProofContext.read_typ (Context.proof_of gen_ctxt)) types)))
            gen_ctxt)
    | ("no_assms", [text]) => put_bool no_assms text
    | ("expect", [text]) => map_test_params (apsnd (K (read_expectation text)))
    | ("report", [text]) => put_bool report text
    | ("quiet", [text]) => put_bool quiet text
    | ("timeout", [text]) => Config.put_generic timeout (read_real text)
    | ("finite_types", [text]) => put_bool finite_types text
    | ("finite_type_size", [text]) => put_nat finite_type_size text
    | _ => error ("Unknown test parameter: " ^ name))
  end;
28315 | 391 |
|
40909
e006d1e06920
renamed parameter from generator to tester; quickcheck only applies one tester on invocation
bulwahn
parents:
40908
diff
changeset
|
392 |
(*Process one argument of the quickcheck command.  If the name reads as a free
  type variable, the argument is a type instantiation and is recorded in insts;
  otherwise it is an ordinary test parameter and is applied to the context.

  An instantiation needs exactly one type; anything else is reported as a
  proper error instead of escaping as a bare list exception.*)
fun parse_test_param_inst (name, arg) (insts, ctxt) =
  (case try (ProofContext.read_typ ctxt) name of
    SOME (TFree (v, _)) =>
      (case arg of
        [typ_text] =>
          (AList.update (op =) (v, ProofContext.read_typ ctxt typ_text) insts, ctxt)
      | _ => error ("Expected exactly one type to instantiate " ^ name))
  | _ => (apsnd o Context.proof_map o parse_test_param) (name, arg) (insts, ctxt));
28309 | 397 |
|
40644
0850a2a16dce
changed old-style quickcheck configurations to new Config.T configurations
bulwahn
parents:
40643
diff
changeset
|
398 |
(*Apply all given test parameters, in order, to a theory.*)
fun quickcheck_params_cmd args =
  let val apply_params = fold parse_test_param args
  in Context.theory_map apply_params end;
0850a2a16dce
changed old-style quickcheck configurations to new Config.T configurations
bulwahn
parents:
40643
diff
changeset
|
399 |
|
35378
95d0e3adf38e
added basic reporting of test cases to quickcheck
bulwahn
parents:
35324
diff
changeset
|
400 |
(*Run quickcheck on subgoal i with the given command arguments: the arguments
  update the proof context and yield the type instantiations, then the goal is
  tested.  The result is checked against the "expect" setting of the updated
  context and an error is raised on a mismatch; otherwise the test result is
  returned unchanged.*)
fun gen_quickcheck args i state =
  let
    val (insts, state') =
      Proof.map_context_result (fn ctxt => fold parse_test_param_inst args ([], ctxt)) state
    val outcome as (counterex, _) = test_goal insts i state'
    val expected = expect (Proof.context_of state')
    val _ =
      (case counterex of
        SOME _ =>
          if expected = No_Counterexample then
            error ("quickcheck expected to find no counterexample but found one")
          else ()
      | NONE =>
          if expected = Counterexample then
            error ("quickcheck expected to find a counterexample but did not find one")
          else ())
  in outcome end
32297 | 408 |
|
36960
01594f816e3a
prefer structure Keyword, Parse, Parse_Spec, Outer_Syntax;
wenzelm
parents:
36610
diff
changeset
|
409 |
(*Like gen_quickcheck, but returns only the first component of its result.*)
fun quickcheck args i state =
  let val (counterex, _) = gen_quickcheck args i state
  in counterex end;
35378
95d0e3adf38e
added basic reporting of test cases to quickcheck
bulwahn
parents:
35324
diff
changeset
|
410 |
|
32297 | 411 |
(*Toplevel command: test subgoal i of the current proof and print the
  counterexample and reports, formatted in the context of the toplevel state.*)
fun quickcheck_cmd args i state =
  let
    val outcome = gen_quickcheck args i (Toplevel.proof_of state)
    val ctxt = Toplevel.context_of state
  in
    Pretty.writeln (pretty_counterex_and_reports ctxt false outcome)
  end;
28309 | 414 |
|
37909
583543ad6ad1
changed default types to a list of types; extended quickcheck parameters to be a list of values to parse a list of default types
bulwahn
parents:
36960
diff
changeset
|
415 |
(*Parser for one argument "name", "name = value" or "name = [v1, ..., vn]".
  A value is a name or a float number; a missing value stands for ["true"].*)
val parse_arg =
  let
    val single_value = (Parse.name || Parse.float_number) >> single
    val value_list = Parse.$$$ "[" |-- Parse.list1 Parse.name --| Parse.$$$ "]"
  in
    Parse.name -- Scan.optional (Parse.$$$ "=" |-- (single_value || value_list)) ["true"]
  end;
28309 | 417 |
|
36960
01594f816e3a
prefer structure Keyword, Parse, Parse_Spec, Outer_Syntax;
wenzelm
parents:
36610
diff
changeset
|
418 |
(*Parser for an optional bracketed, non-empty list of arguments; yields [] if absent.*)
val parse_args =
  let val bracketed = Parse.$$$ "[" |-- Parse.list1 parse_arg --| Parse.$$$ "]"
  in bracketed || Scan.succeed [] end;
420 |
||
36960
01594f816e3a
prefer structure Keyword, Parse, Parse_Spec, Outer_Syntax;
wenzelm
parents:
36610
diff
changeset
|
421 |
(*Theory-level command "quickcheck_params": applies the parsed parameters to the theory.*)
val _ =
  let
    val syntax = parse_args >> (Toplevel.theory o quickcheck_params_cmd)
  in
    Outer_Syntax.command "quickcheck_params" "set parameters for random testing"
      Keyword.thy_decl syntax
  end;
28309 | 424 |
|
36960
01594f816e3a
prefer structure Keyword, Parse, Parse_Spec, Outer_Syntax;
wenzelm
parents:
36610
diff
changeset
|
425 |
(*Diagnostic command "quickcheck": optional arguments followed by an optional
  subgoal number (default 1); runs quickcheck_cmd without changing the state.*)
val _ =
  let
    fun run (args, i) = Toplevel.no_timing o Toplevel.keep (quickcheck_cmd args i)
    val syntax = parse_args -- Scan.optional Parse.nat 1 >> run
  in
    Outer_Syntax.improper_command "quickcheck" "try to find counterexample for subgoal"
      Keyword.diag syntax
  end;
28309 | 429 |
|
28315 | 430 |
end; |
28309 | 431 |
|
432 |
||
28315 | 433 |
(*Top-level alias for the flag Quickcheck.auto.*)
val auto_quickcheck : bool Unsynchronized.ref = Quickcheck.auto;