feat(library/algebra): define matrices, prove Farkas' lemma

2016-03-17 17:29:55 -04:00 · 2016-03-17 17:29:55 -04:00 · b7a25a249a
commit b7a25a249a
parent 651df51cb7
1 changed files with 310 additions and 0 deletions
--- a/library/algebra/matrix.lean
+++ b/library/algebra/matrix.lean
@@ -0,0 +1,310 @@
+import data.real data.tuple data.fin algebra.field data.list
+open nat  tuple eq.ops rat -- list
+
+namespace matrix
+
+definition matrix (A : Type) [field A] (m n : ℕ) := fin m → fin n → A  -- an m-by-n matrix: maps a row index and a column index to an entry of A
+
+definition rvector (A : Type) [field A] (n : ℕ) := matrix A 1 n  -- a row vector of length n is a 1-by-n matrix
+
+definition cvector (A : Type) [field A] (m : ℕ) := matrix A m 1  -- a column vector of length m is an m-by-1 matrix
+
+-- Column vector built from a list (useful for testing): entry i is the i-th element of l.
+definition cvector_of_list {A : Type} [field A] (l : list A) : cvector A (list.length l) :=
+  λ i j, list.ith l (fin.val i) !fin.val_lt  -- j (the single column index) is ignored; !fin.val_lt fills in the bound proof that list.ith takes
+
+definition rvector_of_list {A : Type} [field A] (l : list A) : rvector A (list.length l) :=
+  λ i j, list.ith l (fin.val j) !fin.val_lt  -- row vector from a list: entry j is the j-th element of l; i (the single row index) is ignored
+
+section
+variable {A : Type}
+variable [linear_ordered_field A]
+variables {m n k : ℕ}
+
+definition col_of (M : matrix A m n) (j : fin n) : cvector A m := λ a b, M a j  -- column j of M as a column vector; the result's column index b is ignored
+
+definition row_of (M : matrix A m n) (i : fin m) : rvector A n := λ a b, M i b  -- row i of M as a row vector; the result's row index a is ignored
+
+definition r_ith (v : rvector A n) (i : fin n) := v !fin.zero i  -- i-th entry of a row vector, read from row fin.zero
+
+definition c_ith (v : cvector A m) (i : fin m) := v i !fin.zero  -- i-th entry of a column vector, read from column fin.zero
+
+definition nonneg (M : matrix A m n) := ∀ i j, M i j ≥ 0  -- M is nonnegative when every entry is ≥ 0
+
+definition r_dot (u v : rvector A n) := Suml (fin.upto n) (λ i, r_ith u i * r_ith v i)  -- dot product of two row vectors: Suml of entrywise products over fin.upto n
+
+definition c_dot (u v : cvector A m) := Suml (fin.upto m) (λ i, c_ith u i * c_ith v i)  -- dot product of two column vectors: Suml of entrywise products over fin.upto m
+
+-- Transpose of a row vector into a column vector, registered as a coercion. TODO: generalize this to transpose and remove coercion
+definition cvector_of_rvector [coercion] (u : rvector A n) : cvector A n := λ i j, u !fin.zero i  -- entry i of the result is entry i of u; j is ignored
+
+definition mul (M : matrix A m n) (N : matrix A n k) : matrix A m k :=  -- matrix product: entry (a, b) is the dot product of row a of M with column b of N
+  λ (a : fin m) (b : fin k), c_dot (cvector_of_rvector (row_of M a)) (col_of N b) -- cvector_of_rvector is applied explicitly here; why doesn't coercion work?
+
+infix `⬝` := mul  -- M ⬝ N is notation for mul M N
+
+theorem fin_one_eq_zero (x : fin 1) : x = !fin.zero :=  -- every element of fin 1 equals fin.zero
+  begin
+    induction x,  -- split x into its components; is_lt below is the bound hypothesis this introduces
+    unfold fin.zero,
+    congruence,  -- reduce equality of the two fin values to equality of their components
+    apply eq_zero_of_le_zero,  -- it suffices to show the underlying value is ≤ 0
+    apply le_of_lt_succ is_lt  -- which follows from the bound on the value
+  end
+
+theorem row_of_rvector (v : rvector A n) : row_of v !fin.zero = v :=  -- taking row fin.zero of a row vector gives the vector back
+  begin
+    apply funext,  -- compare both sides at an arbitrary row index x : fin 1
+    intro x,
+    unfold row_of,
+    rewrite (fin_one_eq_zero x)  -- x can only be fin.zero
+  end
+
+theorem col_of_cvector (v : cvector A m) : col_of v !fin.zero = v :=  -- taking column fin.zero of a column vector gives the vector back
+  begin
+    apply funext,  -- compare both sides at an arbitrary row index x ...
+    intro x,
+    apply funext,  -- ... and an arbitrary column index y : fin 1
+    intro y,
+    unfold col_of,
+    rewrite (fin_one_eq_zero y)  -- y can only be fin.zero
+  end
+
+theorem Suml_assoc {B C : Type} (la : list B) (lb : list C) (f : B → C → A) :  -- the two sums of a double Suml can be exchanged
+        Suml la (λ a, Suml lb (λ b, f a b))
+          = Suml lb (λ b, Suml la (λ a, f a b)) :=
+  begin
+    induction la with h tt ih,  -- outer induction on la
+    induction lb with h' tt' ih',  -- case la = nil: inner induction on lb
+    {rewrite [Suml_nil]},
+    {rewrite [Suml_nil at *, Suml_cons, -ih', add_zero]},
+    {induction lb with h' tt' ih',  -- case la = h :: tt: inner induction on lb
+    {rewrite [Suml_cons, *Suml_nil at *, ih, add_zero]},
+    {rewrite [Suml_cons, ih, -Suml_add],  -- use the outer hypothesis ih, then rewrite with Suml_add right-to-left
+    congruence,
+    apply funext,  -- the remaining goal is an equality of summands, checked at each b
+    intro b,
+    rewrite Suml_cons}}
+  end
+
+theorem length_cons_pos {A : Type} (h : A) (tt : list A) : 0 < list.length (list.cons h tt) :=
+  begin  -- a cons list has positive length; the {A : Type} binder above shadows the section's A
+    apply lt_of_not_ge,  -- argue by contradiction from 0 ≥ length (cons h tt)
+    intro H,
+    let H' := list.eq_nil_of_length_eq_zero (eq_zero_of_le_zero H),  -- then the length is 0, so cons h tt = nil
+    apply !list.cons_ne_nil H'  -- contradicting cons_ne_nil
+  end
+
+theorem big_sum_dist_left (a : A) {T : Type} (f : T → A) (l : list T) :  -- a constant left factor can be moved inside a Suml
+        a * Suml l f = Suml l (λ k, a * f k) :=
+  begin
+    induction l with h tt ih,
+    rewrite [Suml_nil, mul_zero],  -- nil case
+    rewrite [*Suml_cons, left_distrib, ih]  -- cons case: distribute over the head term, then use ih on the tail
+  end
+
+theorem big_sum_dist_right (a : A) {T : Type} (f : T → A) (l : list T) :  -- a constant right factor can be moved inside a Suml
+         Suml l f * a= Suml l (λ k, f k * a) :=
+  begin
+    induction l with h tt ih,
+    rewrite [Suml_nil, zero_mul],  -- nil case
+    rewrite [*Suml_cons, right_distrib, ih]  -- cons case: distribute over the head term, then use ih on the tail
+  end
+
+theorem Suml_nonneg_of_nonneg {T : Type} (l : list T) (f : T → A)
+        (H : Π (i : ℕ) (Hi : i < list.length l), f (list.ith l i Hi) ≥ 0) : Suml l f ≥ (0 : A) :=
+  begin  -- if f is ≥ 0 at every position of l, then Suml l f ≥ 0
+    induction l with h tt ih,
+    rewrite Suml_nil,  -- nil case: closed by le.refl after this rewrite
+    apply le.refl,
+    rewrite Suml_cons,  -- cons case: split off the head term f h
+    have Hh : f h ≥ 0, begin
+      note Hl := H 0 !length_cons_pos,  -- instantiate H at index 0, which is in range for a cons list
+      rewrite list.ith_zero at Hl,
+      apply Hl
+    end,
+    have Htt : Suml tt f ≥ 0, begin
+      apply ih,  -- induction hypothesis; its premise is H with the index shifted by one
+      intro i Hi,
+      have Hsucc : succ i < list.length (list.cons h tt),
+        by rewrite list.length_cons; apply nat.add_lt_add_right Hi,
+      note Ho := H (succ i) Hsucc,
+      rewrite list.ith_succ at Ho,  -- turn the statement about index succ i of cons h tt into one about index i of tt
+      apply Ho
+    end,
+    exact add_nonneg Hh Htt  -- head term and tail sum are both ≥ 0
+  end
+
+theorem Suml_le_of_le {T : Type} (l : list T) (f g : T → A) (H : ∀ t : T, f t ≤ g t) :  -- Suml is monotone in the summand
+        Suml l f ≤ Suml l g :=
+  begin
+    induction l,
+    {rewrite *Suml_nil, apply le.refl},  -- nil case
+    {rewrite *Suml_cons,  -- cons case: compare head terms and tail sums separately
+    apply add_le_add,
+    apply H,  -- head terms, by the pointwise hypothesis
+    assumption}  -- tail sums, by the induction hypothesis
+  end
+
+theorem inner_sum_assoc {S T : Type} (l1 : list S) (l2 : list T) (f : S → A) (g : S → T → A) :  -- move the factor f s inside the inner sum
+        Suml l1 (λ s, f s * Suml l2 (λ t, g s t)) = Suml l1 (λ s, Suml l2 (λ t, f s * g s t)) :=
+  begin
+    congruence,  -- both sides are Suml l1 of something, so compare the summands
+    apply funext,
+    intro s,
+    rewrite big_sum_dist_left  -- for each s this is left distributivity over Suml
+  end
+
+-- Associativity of ⬝ for (row vector) ⬝ (matrix) ⬝ (column vector). TODO: clean this up...
+theorem dot_mul_assoc (y : rvector A m) (M : matrix A m n) (x : cvector A n) :
+        y ⬝ (M ⬝ x) = (y ⬝ M) ⬝ x :=
+  begin
+    rewrite ↑mul,
+    repeat (apply funext; intro),  -- compare entrywise; x_1 and x_2 below are the (auto-named) indices introduced here
+    rewrite [fin_one_eq_zero x_1, fin_one_eq_zero x_2, ↑c_dot, ↑c_ith, *row_of_rvector, *col_of_cvector],
+    rewrite [inner_sum_assoc, Suml_assoc],  -- push the outer factor inside the inner sum, then swap the two sums
+    congruence,
+    apply funext,
+    intro b,
+    unfold cvector_of_rvector,
+    rewrite big_sum_dist_right,  -- push the right-hand factor inside the remaining sum
+    congruence,
+    apply funext,
+    intro b,
+    unfold row_of, unfold col_of,
+    rewrite *mul.assoc  -- finish by reassociating the products with mul.assoc
+  end
+
+theorem cvector_of_rvector_nonneg_of_nonneg {u : rvector A n} (Hu : nonneg u) : nonneg (cvector_of_rvector u) :=
+  λ i j, !Hu  -- each entry of cvector_of_rvector u is an entry of u, so Hu applies directly
+
+theorem c_ith_cvector_of_rvector_eq_c_ith (u : rvector A n) (i : fin n) :  -- entry i of the transposed row vector is entry i of the row vector
+        c_ith (cvector_of_rvector u) i = r_ith u i :=
+  rfl  -- both sides unfold to u !fin.zero i
+
+theorem c_dot_nonneg_of_nonneg (u v : cvector A m) (Hu : nonneg u) (Hv : nonneg v) : c_dot u v ≥ 0 :=
+  begin  -- the dot product of two nonnegative column vectors is ≥ 0
+    unfold c_dot,
+    apply Suml_nonneg_of_nonneg,  -- it suffices that every summand is ≥ 0
+    intros,
+    apply mul_nonneg,  -- each summand is a product of an entry of u and an entry of v
+    apply Hu,
+    apply Hv
+  end
+
+theorem row_of_nonneg_of_nonneg {M : matrix A m n} (HM : nonneg M) (i : fin m) : nonneg (row_of M i) :=
+  λ a b, !HM  -- every entry of row_of M i is an entry of M
+
+theorem col_of_nonneg_of_nonneg {M : matrix A m n} (HM : nonneg M) (i : fin n) : nonneg (col_of M i) :=
+  λ a b, !HM  -- every entry of col_of M i is an entry of M (here i is a column index)
+
+theorem mul_nonneg_of_nonneg (M : matrix A m n) (N : matrix A n k) (HM : nonneg M) (HN : nonneg N) :  -- a product of nonnegative matrices is nonnegative
+        nonneg (M ⬝ N) :=
+  begin
+    intros,
+    unfold mul,  -- each entry of M ⬝ N is a c_dot of a row of M with a column of N
+    apply c_dot_nonneg_of_nonneg,
+    apply cvector_of_rvector_nonneg_of_nonneg,
+    apply row_of_nonneg_of_nonneg HM,  -- the row of M is nonnegative
+    apply col_of_nonneg_of_nonneg HN  -- the column of N is nonnegative
+  end
+
+/-
+ One direction of Farkas' lemma: if some y has nonneg (y ⬝ M) and y ⬝ b < 0, then no nonneg x satisfies M ⬝ x = b.
+-/
+
+theorem farkas_rl (M : matrix A m n) (b : cvector A m)
+        (H : ∃ y : rvector A m, nonneg (y ⬝ M) ∧ (y ⬝ b) !fin.zero !fin.zero < 0) :
+        ¬ ∃ x : cvector A n, nonneg x ∧ M ⬝ x = b :=
+  begin
+    intro HexX,  -- assume a nonnegative solution exists and derive a contradiction
+    cases HexX with x Hx,
+    cases Hx with Nx Mxb,  -- Nx : nonneg x, Mxb : M ⬝ x = b
+    cases H with y Hy,
+    cases Hy with NA Nmyb,  -- NA : nonneg (y ⬝ M), Nmyb : the single entry of y ⬝ b is < 0
+    rewrite [-Mxb at Nmyb, dot_mul_assoc at Nmyb],  -- Nmyb now speaks about the single entry of (y ⬝ M) ⬝ x
+    apply not_le_of_gt Nmyb,  -- so it suffices to show that entry is ≥ 0
+    apply mul_nonneg_of_nonneg,  -- which holds because both factors are nonnegative
+    repeat assumption  -- discharged by NA and Nx
+  end
+
+
+/-
+ This is the useful formulation of the above for proving unsatisfiability:
+ If you can find a nonnegative row vector c such that c ⬝ M = 0 and c ⬝ b < 0,
+   then the system M ⬝ x ≤ b (entrywise) is unsatisfiable.
+-/
+theorem farkas_rl' (M : matrix A m n) (b : cvector A m)
+        (H : ∃ c : rvector A m, nonneg c ∧ c ⬝ M = (λ x y, (0 : A)) ∧ (c ⬝ b) !fin.zero !fin.zero < 0) :
+        ¬ ∃ x : cvector A n, ∀ i, (M ⬝ x) i !fin.zero ≤ c_ith b i :=
+  begin
+    intro HexX,  -- assume a solution x of the inequalities exists
+    cases HexX with x Hx,
+    cases H with c Hc,
+    cases Hc with Hcn Hc,  -- Hcn : nonneg c
+    cases Hc with HcM Hcb,  -- HcM : c ⬝ M is the zero matrix, Hcb : the single entry of c ⬝ b is < 0
+    have H : c ⬝ (M ⬝ x) = (λ a b, 0), begin  -- step 1: c ⬝ (M ⬝ x) is zero, because c ⬝ M is
+      rewrite [dot_mul_assoc, HcM, ↑mul],
+      repeat (apply funext; intro),
+      rewrite [fin_one_eq_zero, row_of_rvector, ↑c_dot],
+      have Hz : (λ i, c_ith (cvector_of_rvector (λ (x : fin 1) (y : fin n), 0)) i * c_ith (col_of x x_2) i)
+                  = (λ i, 0), begin  -- every summand has a zero left factor
+       apply funext, intro i,
+       rewrite [ c_ith_cvector_of_rvector_eq_c_ith, ↑r_ith, zero_mul]
+      end,
+      rewrite [Hz, Suml_zero]
+    end,
+    have H' : (c ⬝ (M ⬝ x)) !fin.zero !fin.zero ≤ (c ⬝ b) !fin.zero !fin.zero, begin  -- step 2: compare the two sums term by term
+      rewrite ↑mul at {2, 3},  -- unfold mul only at the selected occurrences
+      rewrite [*col_of_cvector, *row_of_rvector],
+      unfold c_dot,
+      apply Suml_le_of_le,
+      intro t,
+      apply mul_le_mul_of_nonneg_left,  -- multiplying by a nonnegative entry of c preserves ≤
+      apply Hx,  -- the entrywise inequality assumed for x
+      apply Hcn  -- nonnegativity of c
+    end,
+    have HZ : (0 : A) < 0, from calc  -- step 3: chain the two facts with Hcb
+        0 = (c ⬝ (M ⬝ x)) !fin.zero !fin.zero : by rewrite H
+      ... ≤ (c ⬝ b) !fin.zero !fin.zero : H'
+      ... < 0 : Hcb,
+    exact not_lt_self _ HZ  -- 0 < 0 is absurd
+  end
+
+section
+open list
+definition decidable_quant [instance] (P : fin n → Prop) [∀ k, decidable (P k)] : decidable (∀ k, P k) :=
+  if H : all (fin.upto n) P then  -- ∀ k : fin n, P k is decided by testing P on the list fin.upto n
+    decidable.inl (λ k, have Hk : k ∈ fin.upto n, from !fin.mem_upto, of_mem_of_all Hk H)  -- every k is a member of fin.upto n, so P k follows from H
+  else
+    decidable.inr (λ Hpk, H (all_of_forall (λ a Ha, Hpk a)))  -- a proof of ∀ k, P k would make `all` hold, contradicting H
+
+definition matrix_decidable_eq [instance] [decidable_eq A] : decidable_eq (matrix A m n) :=
+  λ M N : matrix A m n,  -- equality of matrices is decidable when equality on A is
+  if H : ∀ i : fin m, ∀ j : fin n, M i j = N i j then  -- test entrywise equality (presumably decided through the decidable_quant instance)
+    decidable.inl (funext (λ i, funext (λ j, H i j)))  -- entrywise equal functions are equal by funext
+  else
+    decidable.inr (begin intro Heq, apply H, intros, congruence, exact Heq end)  -- M = N would give entrywise equality, contradicting H
+end
+
+section test
+open list rat  -- why aren't rats pretty printing right?
+definition c1 : cvector ℚ _ := cvector_of_list [3, 4, 2]  -- sample column vector; its length is left for Lean to infer
+definition c2 : rvector ℚ _ := rvector_of_list [1, 0, 2]  -- sample row vector; its length is left for Lean to infer
+
+definition m1 : matrix ℚ 2 2 := λ a b, fin.val a + fin.val b  -- 2-by-2 matrix whose (a, b) entry is the sum of the two indices
+eval col_of m1 (fin.mk 1 dec_trivial)  -- column 1 of m1
+
+eval c_dot c1 (cvector_of_rvector c2)  -- dot product of c1 with the transpose of c2 (3*1 + 4*0 + 2*2)
+
+example : row_of c2 !fin.zero !fin.zero (fin.mk 1 dec_trivial) = c2 !fin.zero (fin.mk 1 dec_trivial) := rfl  -- row_of agrees with c2 at a single entry
+
+example : row_of c2 !fin.zero = c2 := rfl  -- row_of c2 !fin.zero = c2 holds by rfl
+
+eval (c2 ⬝ c1) !fin.zero !fin.zero  -- the single entry of the 1-by-1 product c2 ⬝ c1
+
+end test
+
+end
+check farkas_rl  -- shows the type of farkas_rl once the section is closed; NOTE(review): looks like a leftover debugging command — confirm whether it should stay
+end matrix