src/Pure/General/ord_list.ML
author wenzelm
Wed, 11 Sep 2024 22:28:42 +0200
changeset 80863 af34fcf7215d
parent 44334 605381e7c7c5
permissions -rw-r--r--
tuned signature: more operations;
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
16464
db2711d07cd8 Ordered lists without duplicates.
wenzelm
parents:
diff changeset
     1
(*  Title:      Pure/General/ord_list.ML
    Author:     Makarius

Ordered lists without duplicates -- a light-weight representation of
finite sets, all operations take linear time and economize heap usage.
*)
db2711d07cd8 Ordered lists without duplicates.
wenzelm
parents:
diff changeset
     7
db2711d07cd8 Ordered lists without duplicates.
wenzelm
parents:
diff changeset
     8
signature ORD_LIST =
sig
  (*an ordered list is a plain list; every operation below takes the order
    as its first argument and expects its list arguments to be ordered
    accordingly and free of duplicates*)
  type 'a T = 'a list

  (*turn an arbitrary list into an ordered list*)
  val make: ('a * 'a -> order) -> 'a list -> 'a T

  (*single elements: the order may compare a key of type 'b against
    elements of type 'a*)
  val member: ('b * 'a -> order) -> 'a T -> 'b -> bool
  val insert: ('a * 'a -> order) -> 'a -> 'a T -> 'a T
  val remove: ('b * 'a -> order) -> 'b -> 'a T -> 'a T

  (*lists as sets: is the first list contained in the second one?*)
  val subset: ('b * 'a -> order) -> 'b T * 'a T -> bool

  (*union: insert elements of the first list into the second list;
    merge is the same operation on a pair, with the roles swapped*)
  val union: ('a * 'a -> order) -> 'a T -> 'a T -> 'a T
  val unions: ('a * 'a -> order) -> 'a T list -> 'a T
  val merge: ('a * 'a -> order) -> 'a T * 'a T -> 'a T

  (*inter / subtract: filter the second list for elements that are
    present / NOT present in the first list*)
  val inter: ('b * 'a -> order) -> 'b T -> 'a T -> 'a T
  val subtract: ('b * 'a -> order) -> 'b T -> 'a T -> 'a T
end;
db2711d07cd8 Ordered lists without duplicates.
wenzelm
parents:
diff changeset
    22
39687
4e9b6ada3a21 modernized structure Ord_List;
wenzelm
parents: 33037
diff changeset
    23
structure Ord_List: ORD_LIST =
struct

type 'a T = 'a list;

(*delegates to sort_distinct, which is defined outside this file*)
fun make ord = sort_distinct ord;


(* single elements *)

(*Scan the list from the front, counting positions from 1.
  Result p > 0: an element EQUAL to x sits at position p.
  Result ~p < 0: x is absent; the scan stopped at position p, either at the
  first element that x is LESS than, or one past the end of the list.*)
fun find_index ord list x =
  let
    fun scan pos [] = ~ pos
      | scan pos (y :: rest) =
          (case ord (x, y) of
            GREATER => scan (pos + 1) rest
          | EQUAL => pos
          | LESS => ~ pos);
  in scan 1 list end;

fun member ord list x = 0 < find_index ord list x;

(*the original list is returned as-is if x is already present*)
fun insert ord x list =
  let
    val idx = find_index ord list x;
    (*put x in front of the element at the given 1-based position*)
    fun place 1 rest = x :: rest
      | place n (y :: rest) = y :: place (n - 1) rest;
  in if 0 < idx then list else place (~ idx) list end;

(*the original list is returned as-is if x is absent*)
fun remove ord x list =
  let
    val idx = find_index ord list x;
    (*drop the element at the given 1-based position*)
    fun drop_at 1 (_ :: rest) = rest
      | drop_at n (y :: rest) = y :: drop_at (n - 1) rest;
  in if 0 < idx then drop_at idx list else list end;


(* lists as sets *)

(*simultaneous walk over both lists: an element of list1 that is LESS than
  the current element of list2 cannot occur later in list2*)
fun subset ord (list1, list2) =
  let
    fun within [] _ = true
      | within _ [] = false
      | within (left as x :: xs) (y :: ys) =
          (case ord (x, y) of
            GREATER => within left ys
          | EQUAL => within xs ys
          | LESS => false);
  in within list1 list2 end;


(* algebraic operations *)

(*SAME signals that the result coincides with the argument list held by the
  nearest enclosing handle_same, which is then returned unchanged instead
  of being rebuilt*)
exception SAME;
fun handle_same f x = (f x) handle SAME => x;

(*union: insert elements of first list into second list*)
fun union ord list1 list2 =
  let
    fun join [] _ = raise SAME
      | join xs [] = xs
      | join (left as x :: xs) (right as y :: ys) =
          (case ord (x, y) of
            GREATER => y :: join left ys
          | EQUAL => y :: join xs ys
            (*a new element goes in front: the remainder gets its own handler*)
          | LESS => x :: handle_same (join xs) right);
  in
    (*shortcut for the special case where both arguments are the same object*)
    if pointer_eq (list1, list2) then list1
    else handle_same (join list1) list2
  end;

(*union of many lists: neighbours are joined pairwise, and the partial
  results are joined again in further rounds until a single list remains*)
fun unions ord lists =
  let
    fun rounds pending merged =
      (case (pending, merged) of
        (xs :: ys :: rest, _) => rounds rest (union ord xs ys :: merged)
      | ([xs], []) => xs
      | ([xs], ys :: more) => rounds (union ord xs ys :: more) []
      | ([], []) => []
      | ([], _) => rounds merged []);
  in rounds lists [] end;

(*pair version of union: elements of list2 are inserted into list1*)
fun merge ord (list1, list2) = union ord list2 list1;

(*intersection: filter second list for elements present in first list*)
fun inter ord list1 list2 =
  let
    fun keep _ [] = raise SAME
      | keep [] _ = []
      | keep (left as x :: xs) (right as y :: ys) =
          (case ord (x, y) of
            (*y is dropped: the remainder gets its own handler*)
            GREATER => handle_same (keep left) ys
          | EQUAL => y :: keep xs ys
          | LESS => keep xs right);
  in handle_same (keep list1) list2 end;

(*subtraction: filter second list for elements NOT present in first list*)
fun subtract ord list1 list2 =
  let
    fun drop [] _ = raise SAME
      | drop _ [] = raise SAME
      | drop (left as x :: xs) (right as y :: ys) =
          (case ord (x, y) of
            GREATER => y :: drop left ys
            (*y is dropped: the remainder gets its own handler*)
          | EQUAL => handle_same (drop xs) ys
          | LESS => drop xs right);
  in handle_same (drop list1) list2 end;

end;