src/HOL/Library/Inner_Product.thy
author huffman
Fri Jun 12 16:23:07 2009 -0700 (2009-06-12)
changeset 31590 776d6a4c1327
parent 31492 5400beeddb55
child 39198 f967a16dfcdd
permissions -rw-r--r--
declare inner_add, inner_diff [algebra_simps]; declare inner_scaleR [simp]
huffman@29993
     1
(* Title:      HOL/Library/Inner_Product.thy
huffman@29993
     2
   Author:     Brian Huffman
huffman@29993
     3
*)
huffman@29993
     4
huffman@29993
     5
header {* Inner Product Spaces and the Gradient Derivative *}
huffman@29993
     6
huffman@29993
     7
theory Inner_Product
haftmann@30663
     8
imports Complex_Main FrechetDeriv
huffman@29993
     9
begin
huffman@29993
    10
huffman@29993
    11
subsection {* Real inner product spaces *}
huffman@29993
    12
huffman@31492
    13
text {*
huffman@31492
    14
  Temporarily relax type constraints for @{term "open"},
huffman@31492
    15
  @{term dist}, and @{term norm}.
huffman@31492
    16
*}
huffman@31492
    17
huffman@31492
    18
(* Replace the registered type constraints of the constants open, dist and
   norm by the sorts open, dist and norm respectively (see the text block
   above).  The matching setup commands after the real_inner class context
   put the topological_space / metric_space / real_normed_vector
   constraints back. *)
setup {* Sign.add_const_constraint
huffman@31492
    19
  (@{const_name "open"}, SOME @{typ "'a::open set \<Rightarrow> bool"}) *}
huffman@31446
    20
huffman@31446
    21
setup {* Sign.add_const_constraint
huffman@31446
    22
  (@{const_name dist}, SOME @{typ "'a::dist \<Rightarrow> 'a \<Rightarrow> real"}) *}
huffman@31446
    23
huffman@31446
    24
setup {* Sign.add_const_constraint
huffman@31446
    25
  (@{const_name norm}, SOME @{typ "'a::norm \<Rightarrow> real"}) *}
huffman@31446
    26
huffman@31492
    27
(* Type class of real inner product spaces.  It extends real_vector,
   sgn_div_norm, dist_norm and open_dist with an operation inner that is
   assumed to be symmetric (inner_commute), additive and homogeneous in its
   first argument (inner_add_left, inner_scaleR_left), non-negative on the
   diagonal and zero there only for the zero vector (inner_ge_zero,
   inner_eq_zero_iff).  The last axiom fixes norm x = sqrt (inner x x).
   The trailing begin opens the class context in which the lemmas below
   are stated. *)
class real_inner = real_vector + sgn_div_norm + dist_norm + open_dist +
huffman@29993
    28
  fixes inner :: "'a \<Rightarrow> 'a \<Rightarrow> real"
huffman@29993
    29
  assumes inner_commute: "inner x y = inner y x"
huffman@31590
    30
  and inner_add_left: "inner (x + y) z = inner x z + inner y z"
huffman@31590
    31
  and inner_scaleR_left [simp]: "inner (scaleR r x) y = r * (inner x y)"
huffman@29993
    32
  and inner_ge_zero [simp]: "0 \<le> inner x x"
huffman@29993
    33
  and inner_eq_zero_iff [simp]: "inner x x = 0 \<longleftrightarrow> x = 0"
huffman@29993
    34
  and norm_eq_sqrt_inner: "norm x = sqrt (inner x x)"
huffman@29993
    35
begin
huffman@29993
    36
huffman@29993
    37
(* inner with 0 as first argument is 0; derived from inner_add_left
   instantiated with x = 0 and y = 0.  Declared as a simp rule. *)
lemma inner_zero_left [simp]: "inner 0 x = 0"
huffman@31590
    38
  using inner_add_left [of 0 0 x] by simp
huffman@29993
    39
huffman@29993
    40
(* Negation can be pulled out of the first argument of inner; derived from
   inner_add_left applied to x + (- x).  Declared as a simp rule. *)
lemma inner_minus_left [simp]: "inner (- x) y = - inner x y"
huffman@31590
    41
  using inner_add_left [of x "- x" y] by simp
huffman@29993
    42
huffman@29993
    43
(* inner distributes over subtraction in its first argument; proved by
   rewriting x - y with diff_minus and then using inner_add_left.
   Not a simp rule on its own (it is bundled into inner_diff below). *)
lemma inner_diff_left: "inner (x - y) z = inner x z - inner y z"
huffman@31590
    44
  by (simp add: diff_minus inner_add_left)
huffman@29993
    45
huffman@29993
    46
text {* Transfer distributivity rules to right argument. *}
huffman@29993
    47
huffman@31590
    48
(* Additivity of inner in its second argument, obtained from inner_add_left
   by swapping arguments with inner_commute.  simp only is used so that
   inner_commute is the sole rewrite rule applied. *)
lemma inner_add_right: "inner x (y + z) = inner x y + inner x z"
huffman@31590
    49
  using inner_add_left [of y z x] by (simp only: inner_commute)
huffman@29993
    50
huffman@31590
    51
(* Homogeneity of inner in its second argument, transferred from
   inner_scaleR_left via inner_commute.  Declared as a simp rule. *)
lemma inner_scaleR_right [simp]: "inner x (scaleR r y) = r * (inner x y)"
huffman@29993
    52
  using inner_scaleR_left [of r y x] by (simp only: inner_commute)
huffman@29993
    53
huffman@29993
    54
(* inner with 0 as second argument is 0, transferred from inner_zero_left
   via inner_commute.  Declared as a simp rule. *)
lemma inner_zero_right [simp]: "inner x 0 = 0"
huffman@29993
    55
  using inner_zero_left [of x] by (simp only: inner_commute)
huffman@29993
    56
huffman@29993
    57
(* Negation can be pulled out of the second argument of inner, transferred
   from inner_minus_left via inner_commute.  Declared as a simp rule. *)
lemma inner_minus_right [simp]: "inner x (- y) = - inner x y"
huffman@29993
    58
  using inner_minus_left [of y x] by (simp only: inner_commute)
huffman@29993
    59
huffman@29993
    60
(* inner distributes over subtraction in its second argument, transferred
   from inner_diff_left via inner_commute. *)
lemma inner_diff_right: "inner x (y - z) = inner x y - inner x z"
huffman@29993
    61
  using inner_diff_left [of y z x] by (simp only: inner_commute)
huffman@29993
    62
huffman@31590
    63
(* Bundles of the left/right variants.  inner_add and inner_diff are added
   to the algebra_simps collection; inner_scaleR only names the pair (its
   two members already carry the simp attribute individually). *)
lemmas inner_add [algebra_simps] = inner_add_left inner_add_right
huffman@31590
    64
lemmas inner_diff [algebra_simps]  = inner_diff_left inner_diff_right
huffman@31590
    65
lemmas inner_scaleR = inner_scaleR_left inner_scaleR_right
huffman@31590
    66
huffman@31590
    67
text {* Legacy theorem names *}
huffman@31590
    68
(* Aliases that keep the older *_distrib names available: they denote
   exactly inner_add_left, inner_add_right and the pair of both. *)
lemmas inner_left_distrib = inner_add_left
huffman@31590
    69
lemmas inner_right_distrib = inner_add_right
huffman@29993
    70
lemmas inner_distrib = inner_left_distrib inner_right_distrib
huffman@29993
    71
huffman@29993
    72
(* inner x x is strictly positive exactly when x is non-zero.  Proved by
   unfolding < with order_less_le; the remaining goals are closed by simp
   (inner_ge_zero and inner_eq_zero_iff are simp rules of the class). *)
lemma inner_gt_zero_iff [simp]: "0 < inner x x \<longleftrightarrow> x \<noteq> 0"
huffman@29993
    73
  by (simp add: order_less_le)
huffman@29993
    74
huffman@29993
    75
(* The squared norm equals inner x x; follows from the class axiom
   norm_eq_sqrt_inner by simplification. *)
lemma power2_norm_eq_inner: "(norm x)\<twosuperior> = inner x x"
huffman@29993
    76
  by (simp add: norm_eq_sqrt_inner)
huffman@29993
    77
huffman@30046
    78
(* Cauchy-Schwarz inequality in squared form.
   Proof by case distinction on y = 0.  The zero case is closed by simp.
   Otherwise set ?r = inner x y / inner y y, start from
   0 <= inner (x - ?r *R y) (x - ?r *R y), expand the right-hand side to
   inner x x - (inner x y)^2 / inner y y, and finally multiply through by
   inner y y, which is positive because y is non-zero. *)
lemma Cauchy_Schwarz_ineq:
huffman@29993
    79
  "(inner x y)\<twosuperior> \<le> inner x x * inner y y"
huffman@29993
    80
proof (cases)
huffman@29993
    81
  assume "y = 0"
huffman@29993
    82
  thus ?thesis by simp
huffman@29993
    83
next
huffman@29993
    84
  assume y: "y \<noteq> 0"
huffman@29993
    85
  let ?r = "inner x y / inner y y"
huffman@29993
    86
  have "0 \<le> inner (x - scaleR ?r y) (x - scaleR ?r y)"
huffman@29993
    87
    by (rule inner_ge_zero)
huffman@29993
    88
  also have "\<dots> = inner x x - inner y x * ?r"
huffman@31590
    89
    by (simp add: inner_diff)
huffman@29993
    90
  also have "\<dots> = inner x x - (inner x y)\<twosuperior> / inner y y"
huffman@29993
    91
    by (simp add: power2_eq_square inner_commute)
huffman@29993
    92
  finally have "0 \<le> inner x x - (inner x y)\<twosuperior> / inner y y" .
huffman@29993
    93
  hence "(inner x y)\<twosuperior> / inner y y \<le> inner x x"
huffman@29993
    94
    by (simp add: le_diff_eq)
huffman@29993
    95
  (* the assumption y is passed to simp so that the division by
     inner y y can be cleared via pos_divide_le_eq *)
  thus "(inner x y)\<twosuperior> \<le> inner x x * inner y y"
huffman@29993
    96
    by (simp add: pos_divide_le_eq y)
huffman@29993
    97
qed
huffman@29993
    98
huffman@30046
    99
(* Cauchy-Schwarz inequality in norm form.
   Proved with power2_le_imp_le, which leaves two goals: the inequality
   between the squares (taken from Cauchy_Schwarz_ineq after rewriting the
   squared norms with power2_norm_eq_inner) and non-negativity of
   norm x * norm y (shown after unfolding norm to a square root). *)
lemma Cauchy_Schwarz_ineq2:
huffman@29993
   100
  "\<bar>inner x y\<bar> \<le> norm x * norm y"
huffman@29993
   101
proof (rule power2_le_imp_le)
huffman@29993
   102
  have "(inner x y)\<twosuperior> \<le> inner x x * inner y y"
huffman@30046
   103
    using Cauchy_Schwarz_ineq .
huffman@29993
   104
  thus "\<bar>inner x y\<bar>\<twosuperior> \<le> (norm x * norm y)\<twosuperior>"
huffman@29993
   105
    by (simp add: power_mult_distrib power2_norm_eq_inner)
huffman@29993
   106
  show "0 \<le> norm x * norm y"
huffman@29993
   107
    unfolding norm_eq_sqrt_inner
huffman@29993
   108
    by (intro mult_nonneg_nonneg real_sqrt_ge_zero inner_ge_zero)
huffman@29993
   109
qed
huffman@29993
   110
huffman@29993
   111
(* Every real_inner type is a real_normed_vector.  The four goals shown
   below are: norm is non-negative, norm x = 0 iff x = 0, the triangle
   inequality, and norm (a *R x) = |a| * norm x.  All of them are reduced
   to facts about inner via norm_eq_sqrt_inner / power2_norm_eq_inner. *)
subclass real_normed_vector
huffman@29993
   112
proof
huffman@29993
   113
  fix a :: real and x y :: 'a
huffman@29993
   114
  show "0 \<le> norm x"
huffman@29993
   115
    unfolding norm_eq_sqrt_inner by simp
huffman@29993
   116
  show "norm x = 0 \<longleftrightarrow> x = 0"
huffman@29993
   117
    unfolding norm_eq_sqrt_inner by simp
huffman@29993
   118
  (* triangle inequality: compare squares, using
     inner x y <= norm x * norm y from Cauchy_Schwarz_ineq2 *)
  show "norm (x + y) \<le> norm x + norm y"
huffman@29993
   119
    proof (rule power2_le_imp_le)
huffman@29993
   120
      have "inner x y \<le> norm x * norm y"
huffman@30046
   121
        by (rule order_trans [OF abs_ge_self Cauchy_Schwarz_ineq2])
huffman@29993
   122
      thus "(norm (x + y))\<twosuperior> \<le> (norm x + norm y)\<twosuperior>"
huffman@29993
   123
        unfolding power2_sum power2_norm_eq_inner
huffman@31590
   124
        by (simp add: inner_add inner_commute)
huffman@29993
   125
      show "0 \<le> norm x + norm y"
huffman@29993
   126
        unfolding norm_eq_sqrt_inner
huffman@29993
   127
        by (simp add: add_nonneg_nonneg)
huffman@29993
   128
    qed
huffman@29993
   129
  (* auxiliary square-root identity used for the scaling law below *)
  have "sqrt (a\<twosuperior> * inner x x) = \<bar>a\<bar> * sqrt (inner x x)"
huffman@29993
   130
    by (simp add: real_sqrt_mult_distrib)
huffman@29993
   131
  then show "norm (a *\<^sub>R x) = \<bar>a\<bar> * norm x"
huffman@29993
   132
    unfolding norm_eq_sqrt_inner
huffman@31590
   133
    by (simp add: power2_eq_square mult_assoc)
huffman@29993
   134
qed
huffman@29993
   135
huffman@29993
   136
end
huffman@29993
   137
huffman@31492
   138
text {*
huffman@31492
   139
  Re-enable constraints for @{term "open"},
huffman@31492
   140
  @{term dist}, and @{term norm}.
huffman@31492
   141
*}
huffman@31492
   142
huffman@31492
   143
(* Counterpart of the three setup commands placed before class real_inner:
   set the type constraints of open, dist and norm to the sorts
   topological_space, metric_space and real_normed_vector respectively. *)
setup {* Sign.add_const_constraint
huffman@31492
   144
  (@{const_name "open"}, SOME @{typ "'a::topological_space set \<Rightarrow> bool"}) *}
huffman@31446
   145
huffman@31446
   146
setup {* Sign.add_const_constraint
huffman@31446
   147
  (@{const_name dist}, SOME @{typ "'a::metric_space \<Rightarrow> 'a \<Rightarrow> real"}) *}
huffman@31446
   148
huffman@31446
   149
setup {* Sign.add_const_constraint
huffman@31446
   150
  (@{const_name norm}, SOME @{typ "'a::real_normed_vector \<Rightarrow> real"}) *}
huffman@31446
   151
wenzelm@30729
   152
(* Interpret the bounded_bilinear locale for inner, under the prefix
   inner.  Additivity and homogeneity in each argument come from the
   corresponding inner_* lemmas (scaleR on real is unfolded with
   real_scaleR_def); the bound is witnessed by K = 1 using
   Cauchy_Schwarz_ineq2. *)
interpretation inner:
huffman@29993
   153
  bounded_bilinear "inner::'a::real_inner \<Rightarrow> 'a \<Rightarrow> real"
huffman@29993
   154
proof
huffman@29993
   155
  fix x y z :: 'a and r :: real
huffman@29993
   156
  show "inner (x + y) z = inner x z + inner y z"
huffman@31590
   157
    by (rule inner_add_left)
huffman@29993
   158
  show "inner x (y + z) = inner x y + inner x z"
huffman@31590
   159
    by (rule inner_add_right)
huffman@29993
   160
  show "inner (scaleR r x) y = scaleR r (inner x y)"
huffman@29993
   161
    unfolding real_scaleR_def by (rule inner_scaleR_left)
huffman@29993
   162
  show "inner x (scaleR r y) = scaleR r (inner x y)"
huffman@29993
   163
    unfolding real_scaleR_def by (rule inner_scaleR_right)
huffman@29993
   164
  show "\<exists>K. \<forall>x y::'a. norm (inner x y) \<le> norm x * norm y * K"
huffman@29993
   165
  proof
huffman@29993
   166
    show "\<forall>x y::'a. norm (inner x y) \<le> norm x * norm y * 1"
huffman@30046
   167
      by (simp add: Cauchy_Schwarz_ineq2)
huffman@29993
   168
  qed
huffman@29993
   169
qed
huffman@29993
   170
wenzelm@30729
   171
(* Interpret bounded_linear for inner as a function of its first argument
   (second argument y fixed), under the prefix inner_left; follows from
   inner.bounded_linear_left. *)
interpretation inner_left:
huffman@29993
   172
  bounded_linear "\<lambda>x::'a::real_inner. inner x y"
huffman@29993
   173
  by (rule inner.bounded_linear_left)
huffman@29993
   174
wenzelm@30729
   175
(* Interpret bounded_linear for inner as a function of its second argument
   (first argument x fixed), under the prefix inner_right; follows from
   inner.bounded_linear_right.  The facts inner_right.zero/add/minus/diff/
   scaleR are used further down in the GDERIV lemmas. *)
interpretation inner_right:
huffman@29993
   176
  bounded_linear "\<lambda>y::'a::real_inner. inner x y"
huffman@29993
   177
  by (rule inner.bounded_linear_right)
huffman@29993
   178
huffman@29993
   179
huffman@29993
   180
subsection {* Class instances *}
huffman@29993
   181
huffman@29993
   182
(* real is an instance of real_inner with inner defined as multiplication.
   The definition is a simp rule.  Each of the six class axioms is proved
   after unfolding inner_real_def, using the named arithmetic rule or
   simp. *)
instantiation real :: real_inner
huffman@29993
   183
begin
huffman@29993
   184
huffman@29993
   185
definition inner_real_def [simp]: "inner = op *"
huffman@29993
   186
huffman@29993
   187
instance proof
huffman@29993
   188
  fix x y z r :: real
huffman@29993
   189
  show "inner x y = inner y x"
huffman@29993
   190
    unfolding inner_real_def by (rule mult_commute)
huffman@29993
   191
  show "inner (x + y) z = inner x z + inner y z"
huffman@29993
   192
    unfolding inner_real_def by (rule left_distrib)
huffman@29993
   193
  show "inner (scaleR r x) y = r * inner x y"
huffman@29993
   194
    unfolding inner_real_def real_scaleR_def by (rule mult_assoc)
huffman@29993
   195
  show "0 \<le> inner x x"
huffman@29993
   196
    unfolding inner_real_def by simp
huffman@29993
   197
  show "inner x x = 0 \<longleftrightarrow> x = 0"
huffman@29993
   198
    unfolding inner_real_def by simp
huffman@29993
   199
  show "norm x = sqrt (inner x x)"
huffman@29993
   200
    unfolding inner_real_def by simp
huffman@29993
   201
qed
huffman@29993
   202
huffman@29993
   203
end
huffman@29993
   204
huffman@29993
   205
(* complex is an instance of real_inner with
   inner x y = Re x * Re y + Im x * Im y.
   Unlike the real instance, inner_complex_def is not a simp rule; every
   axiom proof unfolds it explicitly.  The norm axiom additionally unfolds
   complex_norm_def. *)
instantiation complex :: real_inner
huffman@29993
   206
begin
huffman@29993
   207
huffman@29993
   208
definition inner_complex_def:
huffman@29993
   209
  "inner x y = Re x * Re y + Im x * Im y"
huffman@29993
   210
huffman@29993
   211
instance proof
huffman@29993
   212
  fix x y z :: complex and r :: real
huffman@29993
   213
  show "inner x y = inner y x"
huffman@29993
   214
    unfolding inner_complex_def by (simp add: mult_commute)
huffman@29993
   215
  show "inner (x + y) z = inner x z + inner y z"
huffman@29993
   216
    unfolding inner_complex_def by (simp add: left_distrib)
huffman@29993
   217
  show "inner (scaleR r x) y = r * inner x y"
huffman@29993
   218
    unfolding inner_complex_def by (simp add: right_distrib)
huffman@29993
   219
  show "0 \<le> inner x x"
huffman@29993
   220
    unfolding inner_complex_def by (simp add: add_nonneg_nonneg)
huffman@29993
   221
  show "inner x x = 0 \<longleftrightarrow> x = 0"
huffman@29993
   222
    unfolding inner_complex_def
huffman@29993
   223
    by (simp add: add_nonneg_eq_0_iff complex_Re_Im_cancel_iff)
huffman@29993
   224
  show "norm x = sqrt (inner x x)"
huffman@29993
   225
    unfolding inner_complex_def complex_norm_def
huffman@29993
   226
    by (simp add: power2_eq_square)
huffman@29993
   227
qed
huffman@29993
   228
huffman@29993
   229
end
huffman@29993
   230
huffman@29993
   231
huffman@29993
   232
subsection {* Gradient derivative *}
huffman@29993
   233
huffman@29993
   234
(* Gradient derivative of a real-valued function on a real_inner type.
   GDERIV f x :> D is defined to mean that FDERIV f x holds with the
   derivative map h |-> inner h D.  The mixfix annotation gives the
   GDERIV _ _ :> _ notation at priority 60. *)
definition
huffman@29993
   235
  gderiv ::
huffman@29993
   236
    "['a::real_inner \<Rightarrow> real, 'a, 'a] \<Rightarrow> bool"
huffman@29993
   237
          ("(GDERIV (_)/ (_)/ :> (_))" [1000, 1000, 60] 60)
huffman@29993
   238
where
huffman@29993
   239
  "GDERIV f x :> D \<longleftrightarrow> FDERIV f x :> (\<lambda>h. inner h D)"
huffman@29993
   240
huffman@29993
   241
(* DERIV f x :> D is the same as FDERIV f x with derivative map
   h |-> h * D; obtained by rewriting with deriv_def and
   field_fderiv_def only. *)
lemma deriv_fderiv: "DERIV f x :> D \<longleftrightarrow> FDERIV f x :> (\<lambda>h. h * D)"
huffman@29993
   242
  by (simp only: deriv_def field_fderiv_def)
huffman@29993
   243
huffman@29993
   244
(* GDERIV and DERIV agree where both apply; the proof rewrites with
   inner_real_def, i.e. it uses the real instance where inner is
   multiplication.  Declared as a simp rule. *)
lemma gderiv_deriv [simp]: "GDERIV f x :> D \<longleftrightarrow> DERIV f x :> D"
huffman@29993
   245
  by (simp only: gderiv_def deriv_fderiv inner_real_def)
huffman@29993
   246
huffman@29993
   247
(* Chain rule: composing f (gradient df at x) with a real function g
   (derivative dg at f x) yields gradient scaleR dg df.  Both hypotheses
   are unfolded to FDERIV statements and combined with FDERIV_compose;
   the resulting derivative map is normalised with mult_ac. *)
lemma GDERIV_DERIV_compose:
huffman@29993
   248
    "\<lbrakk>GDERIV f x :> df; DERIV g (f x) :> dg\<rbrakk>
huffman@29993
   249
     \<Longrightarrow> GDERIV (\<lambda>x. g (f x)) x :> scaleR dg df"
huffman@29993
   250
  unfolding gderiv_def deriv_fderiv
huffman@29993
   251
  apply (drule (1) FDERIV_compose)
huffman@31590
   252
  apply (simp add: mult_ac)
huffman@29993
   253
  done
huffman@29993
   254
huffman@29993
   255
(* Substitution helper: replace the derivative map of an FDERIV fact by an
   equal one.  Used below in the form rule FDERIV_subst to postpone the
   equality proof to a later subgoal. *)
lemma FDERIV_subst: "\<lbrakk>FDERIV f x :> df; df = d\<rbrakk> \<Longrightarrow> FDERIV f x :> d"
huffman@29993
   256
  by simp
huffman@29993
   257
huffman@29993
   258
(* Substitution helper: replace the gradient of a GDERIV fact by an equal
   one.  Used in GDERIV_norm with the equality supplied via OF. *)
lemma GDERIV_subst: "\<lbrakk>GDERIV f x :> df; df = d\<rbrakk> \<Longrightarrow> GDERIV f x :> d"
huffman@29993
   259
  by simp
huffman@29993
   260
huffman@29993
   261
(* A constant function has gradient 0.  After unfolding gderiv_def,
   inner h 0 is rewritten with inner_right.zero and the goal is closed by
   FDERIV_const. *)
lemma GDERIV_const: "GDERIV (\<lambda>x. k) x :> 0"
huffman@29993
   262
  unfolding gderiv_def inner_right.zero by (rule FDERIV_const)
huffman@29993
   263
huffman@29993
   264
(* Sum rule: the gradient of a pointwise sum is the sum of the gradients.
   Reduced to FDERIV_add after unfolding gderiv_def and splitting
   inner h (df + dg) with inner_right.add. *)
lemma GDERIV_add:
huffman@29993
   265
    "\<lbrakk>GDERIV f x :> df; GDERIV g x :> dg\<rbrakk>
huffman@29993
   266
     \<Longrightarrow> GDERIV (\<lambda>x. f x + g x) x :> df + dg"
huffman@29993
   267
  unfolding gderiv_def inner_right.add by (rule FDERIV_add)
huffman@29993
   268
huffman@29993
   269
(* Negation rule: the gradient of - f is - df.  Reduced to FDERIV_minus
   after unfolding gderiv_def and inner_right.minus. *)
lemma GDERIV_minus:
huffman@29993
   270
    "GDERIV f x :> df \<Longrightarrow> GDERIV (\<lambda>x. - f x) x :> - df"
huffman@29993
   271
  unfolding gderiv_def inner_right.minus by (rule FDERIV_minus)
huffman@29993
   272
huffman@29993
   273
(* Difference rule: the gradient of a pointwise difference is the
   difference of the gradients.  Reduced to FDERIV_diff after unfolding
   gderiv_def and inner_right.diff. *)
lemma GDERIV_diff:
huffman@29993
   274
    "\<lbrakk>GDERIV f x :> df; GDERIV g x :> dg\<rbrakk>
huffman@29993
   275
     \<Longrightarrow> GDERIV (\<lambda>x. f x - g x) x :> df - dg"
huffman@29993
   276
  unfolding gderiv_def inner_right.diff by (rule FDERIV_diff)
huffman@29993
   277
huffman@29993
   278
(* Product rule for scaleR, where f has an ordinary derivative df (DERIV)
   and g has gradient dg (GDERIV); the stated gradient is
   scaleR (f x) dg + scaleR df (g x).  The proof applies scaleR.FDERIV
   through FDERIV_subst and then shows the two derivative maps equal by
   simp with mult_ac. *)
lemma GDERIV_scaleR:
huffman@29993
   279
    "\<lbrakk>DERIV f x :> df; GDERIV g x :> dg\<rbrakk>
huffman@29993
   280
     \<Longrightarrow> GDERIV (\<lambda>x. scaleR (f x) (g x)) x
huffman@29993
   281
      :> (scaleR (f x) dg + scaleR df (g x))"
huffman@29993
   282
  unfolding gderiv_def deriv_fderiv inner_right.add inner_right.scaleR
huffman@29993
   283
  apply (rule FDERIV_subst)
huffman@29993
   284
  apply (erule (1) scaleR.FDERIV)
huffman@29993
   285
  apply (simp add: mult_ac)
huffman@29993
   286
  done
huffman@29993
   287
huffman@29993
   288
(* Product rule for pointwise multiplication: the gradient of f * g is
   scaleR (f x) dg + scaleR (g x) df.  The proof applies FDERIV_mult
   through FDERIV_subst and then shows the derivative maps equal by simp
   with inner_add and mult_ac. *)
lemma GDERIV_mult:
huffman@29993
   289
    "\<lbrakk>GDERIV f x :> df; GDERIV g x :> dg\<rbrakk>
huffman@29993
   290
     \<Longrightarrow> GDERIV (\<lambda>x. f x * g x) x :> scaleR (f x) dg + scaleR (g x) df"
huffman@29993
   291
  unfolding gderiv_def
huffman@29993
   292
  apply (rule FDERIV_subst)
huffman@29993
   293
  apply (erule (1) FDERIV_mult)
huffman@31590
   294
  apply (simp add: inner_add mult_ac)
huffman@29993
   295
  done
huffman@29993
   296
huffman@29993
   297
(* Gradient of the pointwise inverse of f at a point where f x is
   non-zero.  Instance of GDERIV_DERIV_compose with g = inverse; the
   derivative of inverse comes from DERIV_inverse, whose exponent is
   brought into matching form by folding numeral_2_eq_2. *)
lemma GDERIV_inverse:
huffman@29993
   298
    "\<lbrakk>GDERIV f x :> df; f x \<noteq> 0\<rbrakk>
huffman@29993
   299
     \<Longrightarrow> GDERIV (\<lambda>x. inverse (f x)) x :> - (inverse (f x))\<twosuperior> *\<^sub>R df"
huffman@29993
   300
  apply (erule GDERIV_DERIV_compose)
huffman@29993
   301
  apply (erule DERIV_inverse [folded numeral_2_eq_2])
huffman@29993
   302
  done
huffman@29993
   303
huffman@29993
   304
(* Away from 0 the gradient of norm is sgn x.
   The proof writes norm as sqrt composed with (%x. inner x x) and uses
   four numbered facts:
     1: the FDERIV of inner x x, from inner.FDERIV and FDERIV_ident;
     2: that derivative map equals h |-> inner h (2 *R x);
     3: the DERIV of sqrt at inner x x, valid because inner x x > 0;
     4: the resulting gradient expression simplifies to sgn x.
   The final apply script combines them through GDERIV_DERIV_compose. *)
lemma GDERIV_norm:
huffman@29993
   305
  assumes "x \<noteq> 0" shows "GDERIV (\<lambda>x. norm x) x :> sgn x"
huffman@29993
   306
proof -
huffman@29993
   307
  have 1: "FDERIV (\<lambda>x. inner x x) x :> (\<lambda>h. inner x h + inner h x)"
huffman@29993
   308
    by (intro inner.FDERIV FDERIV_ident)
huffman@29993
   309
  have 2: "(\<lambda>h. inner x h + inner h x) = (\<lambda>h. inner h (scaleR 2 x))"
huffman@31590
   310
    by (simp add: expand_fun_eq inner_commute)
huffman@29993
   311
  have "0 < inner x x" using `x \<noteq> 0` by simp
huffman@29993
   312
  then have 3: "DERIV sqrt (inner x x) :> (inverse (sqrt (inner x x)) / 2)"
huffman@29993
   313
    by (rule DERIV_real_sqrt)
huffman@29993
   314
  have 4: "(inverse (sqrt (inner x x)) / 2) *\<^sub>R 2 *\<^sub>R x = sgn x"
huffman@29993
   315
    by (simp add: sgn_div_norm norm_eq_sqrt_inner)
huffman@29993
   316
  show ?thesis
huffman@29993
   317
    unfolding norm_eq_sqrt_inner
huffman@29993
   318
    apply (rule GDERIV_subst [OF _ 4])
huffman@29993
   319
    apply (rule GDERIV_DERIV_compose [where g=sqrt and df="scaleR 2 x"])
huffman@29993
   320
    apply (subst gderiv_def)
huffman@29993
   321
    apply (rule FDERIV_subst [OF _ 2])
huffman@29993
   322
    apply (rule 1)
huffman@29993
   323
    apply (rule 3)
huffman@29993
   324
    done
huffman@29993
   325
qed
huffman@29993
   326
huffman@29993
   327
(* FDERIV form of GDERIV_norm, obtained by unfolding gderiv_def in it. *)
lemmas FDERIV_norm = GDERIV_norm [unfolded gderiv_def]
huffman@29993
   328
huffman@29993
   329
end