Prosified Extensional

bc911257 · Adam Chlipala · 2ccd7485 · bc911257 · bc911257
Commit bc911257 authored Dec 16, 2009 by Adam Chlipala
Show whitespace changes
Inline Side-by-side

Showing with 467 additions and 352 deletions

Extensional.v src/Extensional.v +445 -352

Tactics.v src/Tactics.v +22 -0

No files found.
--- a/src/Extensional.v
+++ b/src/Extensional.v
@@ -18,16 +18,23 @@ Set Implicit Arguments.
 (** %\chapter{Extensional Transformations}% *)
-(** TODO: Prose for this chapter *)
+(** Last chapter's constant folding example was particularly easy to verify, because that transformation used the same source and target language.  In this chapter, we verify a different translation, illustrating the added complexities in translating between languages.
+   Program transformations can be classified as %\textit{%#<i>#intensional#</i>#%}%, when they require some notion of inequality between variables; or %\textit{%#<i>#extensional#</i>#%}%, otherwise.  This chapter's example is extensional, and the next chapter deals with the trickier intensional case. *)
-(** * Simply-Typed Lambda Calculus *)
-Module STLC.
+(** * CPS Conversion for Simply-Typed Lambda Calculus *)
-  Module Source.
+(** A convenient method for compiling functional programs begins with conversion to %\textit{%#<i>#continuation-passing style#</i>#%}%, or CPS.  In this restricted form, function calls never return; instead, we pass explicit return pointers, much as in assembly language.  Additionally, we make order of evaluation explicit, breaking complex expressions into sequences of primitive operations.
+   Our translation will operate over the same source language that we used in the first part of last chapter, so we omit most of the language definition.  However, we do make one significant change: since we will be working with multiple languages that involve similar constructs, we use Coq's %\textit{%#<i>#notation scope#</i>#%}% mechanism to disambiguate.  For instance, the span of code dealing with type notations looks like this: *)
+(* begin hide *)
+Module Source.
  Inductive type : Type :=
  | TNat : type
  | Arrow : type -> type -> type.
+(* end hide *)
  Notation "'Nat'" := TNat : source_scope.
  Infix "-->" := Arrow (right associativity, at level 60) : source_scope.
@@ -36,6 +43,9 @@ Module STLC.
  Bind Scope source_scope with type.
  Delimit Scope source_scope with source.
+  (** We explicitly place our notations inside a scope named [source_scope], and we associate a delimiting key [source] with [source_scope].  Without further commands, our notations would only be used in expressions like [(...)%source].  We also open our scope locally within this module, so that we avoid repeating [%source] in many places.  Further, we %\textit{%#<i>#bind#</i>#%}% our scope to [type].  In some circumstances where Coq is able to infer that some subexpression has type [type], that subexpression will automatically be parsed in [source_scope]. *)
+(* begin hide *)
  Section vars.
    Variable var : type -> Type.
@@ -102,6 +112,9 @@ Module STLC.
    end.
  Definition ExpDenote t (e : Exp t) := expDenote (e _).
+(* end hide *)
+  (** The other critical new ingredient is a generalization of the [Closed] relation from two chapters ago.  The new relation [exp_equiv] characters when two expressions may be considered syntactically equal.  We need to be able to handle cases where each expression uses a different [var] type.  Intuitively, we will want to compare expressions that use their variables to store source-level and target-level values.  We express pairs of equivalent variables using a list parameter to the relation; variable expressions will be considered equivalent if and only if their variables belong to this list.  The rule for function abstraction extends the list in a higher-order way.  The remaining rules just implement the obvious congruence over expressions. *)
 (* begin thide *)
  Section exp_equiv.
@@ -129,20 +142,22 @@ Module STLC.
      -> exp_equiv G (Abs f1) (Abs f2).
  End exp_equiv.
+  (** It turns out that, for any parametric expression [E], any two instantiations of [E] with particular [var] types must be equivalent, with respect to an empty variable list.  The parametricity of Gallina guarantees this, in much the same way that it guaranteed the truth of the axiom about [Closed].  Thus, we assert an analogous axiom here. *)
  Axiom Exp_equiv : forall t (E : Exp t) var1 var2,
    exp_equiv nil (E var1) (E var2).
 (* end thide *)
-  End Source.
+End Source.
+(** Now we need to define the CPS language, where binary function types are replaced with unary continuation types, and we add product types because they will be useful in our translation. *)
-  Module CPS.
+Module CPS.
  Inductive type : Type :=
  | TNat : type
  | Cont : type -> type
-    | TUnit : type
  | Prod : type -> type -> type.
  Notation "'Nat'" := TNat : cps_scope.
-    Notation "'Unit'" := TUnit : cps_scope.
  Notation "t --->" := (Cont t) (at level 61) : cps_scope.
  Infix "**" := Prod (right associativity, at level 60) : cps_scope.
@@ -152,6 +167,8 @@ Module STLC.
  Section vars.
    Variable var : type -> Type.
+    (** A CPS program is a series of bindings of primitive operations (primops), followed by either a halt with a final program result or by a call to a continuation. The arguments to these program-ending operations are enforced to be variables.  To use the values of compound expressions instead, those expressions must be decomposed into bindings of primops.  The primop language itself similarly forces variables for all arguments besides bodies of function abstractions. *)
    Inductive prog : Type :=
    | PHalt :
      var Nat
@@ -166,10 +183,6 @@ Module STLC.
      -> prog
    with primop : type -> Type :=
-      | Var : forall t,
-        var t
-        -> primop t
    | Const : nat -> primop Nat
    | Plus : var Nat -> var Nat -> primop Nat
@@ -192,7 +205,6 @@ Module STLC.
  Implicit Arguments PHalt [var].
  Implicit Arguments App [var t].
-    Implicit Arguments Var [var t].
  Implicit Arguments Const [var].
  Implicit Arguments Plus [var].
  Implicit Arguments Abs [var t].
@@ -207,8 +219,6 @@ Module STLC.
  Notation "! <- p ; e" := (Bind p (fun _ => e))
    (right associativity, at level 76, p at next level) : cps_scope.
-    Notation "# v" := (Var v) (at level 70) : cps_scope.
  Notation "^ n" := (Const n) (at level 70) : cps_scope.
  Infix "+^" := Plus (left associativity, at level 79) : cps_scope.
@@ -223,14 +233,17 @@ Module STLC.
  Open Scope cps_scope.
+  (** In interpreting types, we treat continuations as functions with codomain [nat], choosing [nat] as our arbitrary program result type. *)
  Fixpoint typeDenote (t : type) : Set :=
    match t with
      | Nat => nat
      | t' ---> => typeDenote t' -> nat
-        | Unit => unit
      | t1 ** t2 => (typeDenote t1 * typeDenote t2)%type
    end.
+  (** A mutually-recursive definition establishes the meanings of programs and primops. *)
  Fixpoint progDenote (e : prog typeDenote) : nat :=
    match e with
      | PHalt n => n
@@ -240,8 +253,6 @@ Module STLC.
  with primopDenote t (p : primop typeDenote t) : typeDenote t :=
    match p with
-        | Var _ v => v
      | Const n => n
      | Plus n1 n2 => n1 + n2
@@ -256,25 +267,31 @@ Module STLC.
  Definition Primop t := forall var, primop var t.
  Definition ProgDenote (E : Prog) := progDenote (E _).
  Definition PrimopDenote t (P : Primop t) := primopDenote (P _).
-  End CPS.
+End CPS.
-  Import Source CPS.
+Import Source CPS.
+(** The translation itself begins with a type-level compilation function.  We change every function into a continuation whose argument is a pair, consisting of the translation of the original argument and of an explicit return pointer. *)
 (* begin thide *)
-  Fixpoint cpsType (t : Source.type) : CPS.type :=
+Fixpoint cpsType (t : Source.type) : CPS.type :=
  match t with
    | Nat => Nat%cps
    | t1 --> t2 => (cpsType t1 ** (cpsType t2 --->) --->)%cps
  end%source.
-  Reserved Notation "x <-- e1 ; e2" (right associativity, at level 76, e1 at next level).
+(** Now we can define the expression translation.  The notation [x <-- e1; e2] stands for translating source-level expression [e1], binding [x] to the CPS-level result of running the translated program, and then evaluating CPS-level expression [e2] in that context. *)
+Reserved Notation "x <-- e1 ; e2" (right associativity, at level 76, e1 at next level).
-  Section cpsExp.
+Section cpsExp.
  Variable var : CPS.type -> Type.
  Import Source.
  Open Scope cps_scope.
+  (** We implement a well-known variety of higher-order, one-pass CPS translation.  The translation [cpsExp] is parameterized not only by the expression [e] to translate, but also by a meta-level continuation.  The idea is that [cpsExp] evaluates the translation of [e] and calls the continuation on the result.  With this convention, [cpsExp] itself is a natural match for the notation we just reserved. *)
  Fixpoint cpsExp t (e : exp (fun t => var (cpsType t)) t)
    : (var (cpsType t) -> prog var) -> prog var :=
    match e with
@@ -305,31 +322,105 @@ Module STLC.
    end
    where "x <-- e1 ; e2" := (cpsExp e1 (fun x => e2)).
-  End cpsExp.
+End cpsExp.
-  Notation "x <-- e1 ; e2" := (cpsExp e1 (fun x => e2)) : cps_scope.
+(** Since notations do not survive the closing of sections, we redefine the notation associated with [cpsExp]. *)
-  Notation "! <-- e1 ; e2" := (cpsExp e1 (fun _ => e2))
-    (right associativity, at level 76, e1 at next level) : cps_scope.
-  Implicit Arguments cpsExp [var t].
+Notation "x <-- e1 ; e2" := (cpsExp e1 (fun x => e2)) : cps_scope.
-  Definition CpsExp (E : Exp Nat) : Prog :=
-    fun var => cpsExp (E _) (PHalt (var := _)).
+Implicit Arguments cpsExp [var t].
-(* end thide *)
+(** We wrap [cpsExp] into the parametric version [CpsExp], passing an always-halt continuation at the root of the recursion. *)
-  Eval compute in CpsExp zero.
+Definition CpsExp (E : Exp Nat) : Prog :=
-  Eval compute in CpsExp one.
+  fun _ => cpsExp (E _) (PHalt (var := _)).
-  Eval compute in CpsExp zpo.
+(* end thide *)
-  Eval compute in CpsExp app_ident.
-  Eval compute in CpsExp app_ident'.
-  Eval compute in ProgDenote (CpsExp zero).
+Eval compute in CpsExp zero.
-  Eval compute in ProgDenote (CpsExp one).
+(** %\vspace{-.15in}% [[
-  Eval compute in ProgDenote (CpsExp zpo).
+     = fun var : type -> Type => x <- ^0; Halt x
-  Eval compute in ProgDenote (CpsExp app_ident).
+     : Prog
-  Eval compute in ProgDenote (CpsExp app_ident').
+   ]] *)
+Eval compute in CpsExp one.
+(** %\vspace{-.15in}% [[
+     = fun var : type -> Type => x <- ^1; Halt x
+     : Prog
+   ]] *)
+Eval compute in CpsExp zpo.
+(** %\vspace{-.15in}% [[
+     = fun var : type -> Type => x <- ^0; x0 <- ^1; x1 <- (x +^ x0); Halt x1
+     : Prog
+   ]] *)
+Eval compute in CpsExp app_ident.
+(** %\vspace{-.15in}% [[
+     = fun var : type -> Type =>
+       f <- (\ p, x <- #1 p; kf <- #2 p; kf @@ x);
+       x <- ^0;
+       x0 <- ^1; x1 <- (x +^ x0); kf <- (\ r, Halt r); p <- [x1, kf]; f @@ p
+     : Prog
+   ]] *)
+Eval compute in CpsExp app_ident'.
+(** %\vspace{-.15in}% [[
+     = fun var : type -> Type =>
+       f <-
+       (\ p,
+        x <- #1 p;
+        kf <- #2 p;
+        f <-
+        (\ p0,
+         x0 <- #1 p0;
+         kf0 <- #2 p0; kf1 <- (\ r, kf0 @@ r); p1 <- [x0, kf1]; x @@ p1);
+        kf @@ f);
+       f0 <- (\ p, x <- #1 p; kf <- #2 p; kf @@ x);
+       kf <-
+       (\ r,
+        x <- ^0;
+        x0 <- ^1;
+        x1 <- (x +^ x0); kf <- (\ r0, Halt r0); p <- [x1, kf]; r @@ p);
+       p <- [f0, kf]; f @@ p
+     : Prog
+   ]] *)
+Eval compute in ProgDenote (CpsExp zero).
+(** %\vspace{-.15in}% [[
+     = 0
+     : nat
+   ]] *)
+Eval compute in ProgDenote (CpsExp one).
+(** %\vspace{-.15in}% [[
+     = 1
+     : nat
+   ]] *)
+Eval compute in ProgDenote (CpsExp zpo).
+(** %\vspace{-.15in}% [[
+     = 1
+     : nat
+   ]] *)
+Eval compute in ProgDenote (CpsExp app_ident).
+(** %\vspace{-.15in}% [[
+     = 1
+     : nat
+   ]] *)
+Eval compute in ProgDenote (CpsExp app_ident').
+(** %\vspace{-.15in}% [[
+     = 1
+     : nat
+   ]] *)
+(** Our main inductive lemma about [cpsExp] needs a notion of compatibility between source-level and CPS-level values.  We express compatibility with a %\textit{%#<i>#logical relation#</i>#%}%; that is, we define a binary relation by recursion on type structure, and the function case of the relation considers functions related if they map related arguments to related results.  In detail, the function case is slightly more complicated, since it must deal with our continuation-based calling convention. *)
 (* begin thide *)
-  Fixpoint lr (t : Source.type) : Source.typeDenote t -> CPS.typeDenote (cpsType t) -> Prop :=
+Fixpoint lr (t : Source.type)
+  : Source.typeDenote t -> CPS.typeDenote (cpsType t) -> Prop :=
  match t with
    | Nat => fun n1 n2 => n1 = n2
    | t1 --> t2 => fun f1 f2 =>
@@ -339,13 +430,17 @@ Module STLC.
          /\ lr _ (f1 x1) r
  end%source.
-  Lemma cpsExp_correct : forall G t (e1 : exp _ t) (e2 : exp _ t),
+(** The main lemma is now easily stated and proved.  The most surprising aspect of the statement is the presence of %\textit{%#<i>#two#</i>#%}% versions of the expression to be compiled.  The first, [e1], uses a [var] choice that makes it a suitable argument to [expDenote].  The second expression, [e2], uses a [var] choice that makes its compilation, [cpsExp e2 k], a suitable argument to [progDenote].  We use [exp_equiv] to assert that [e1] and [e2] have the same underlying structure, up to a variable correspondence list [G].  A hypothesis about [G] ensures that all of its pairs of variables belong to the logical relation [lr].  We also use [lr], in concert with some quantification over continuations and program results, in the conclusion of the lemma.
+   The lemma's proof should be unsurprising by now.  It uses our standard bag of Ltac tricks to help out with quantifier instantiation; [crush] and [eauto] can handle the rest. *)
+Lemma cpsExp_correct : forall G t (e1 : exp _ t) (e2 : exp _ t),
  exp_equiv G e1 e2
  -> (forall t v1 v2, In (existT _ t (v1, v2)) G -> lr t v1 v2)
  -> forall k, exists r,
    progDenote (cpsExp e2 k) = progDenote (k r)
    /\ lr t (expDenote e1) r.
-    induction 1; crush; fold typeDenote in *;
+  induction 1; crush;
    repeat (match goal with
              | [ H : forall k, exists r, progDenote (cpsExp ?E k) = _ /\ _
                  |- context[cpsExp ?E ?K] ] =>
@@ -361,28 +456,26 @@ Module STLC.
                      end
                end
            end; crush); eauto.
-  Qed.
+Qed.
-  Lemma vars_easy : forall (t : Source.type) (v1 : Source.typeDenote t)
+(** A simple lemma establishes the degenerate case of [cpsExp_correct]'s hypothesis about [G]. *)
-    (v2 : typeDenote (cpsType t)),
-    In
+Lemma vars_easy : forall t v1 v2,
-    (existT
+  In (existT (fun t0 => (Source.typeDenote t0 * typeDenote (cpsType t0))%type) t
-      (fun t0 : Source.type =>
-        (Source.typeDenote t0 * typeDenote (cpsType t0))%type) t
    (v1, v2)) nil -> lr t v1 v2.
  crush.
-  Qed.
+Qed.
-  Theorem CpsExp_correct : forall (E : Exp Nat),
+(** A manual application of [cpsExp_correct] proves a version applicable to [CpsExp].  This is where we use the axiom [Exp_equiv]. *)
+Theorem CpsExp_correct : forall (E : Exp Nat),
  ProgDenote (CpsExp E) = ExpDenote E.
  unfold ProgDenote, CpsExp, ExpDenote; intros;
    generalize (cpsExp_correct (e1 := E _) (e2 := E _)
      (Exp_equiv _ _ _) vars_easy (PHalt (var := _))); crush.
-  Qed.
+Qed.
 (* end thide *)
-End STLC.
 (** * Exercises *)

--- a/src/Tactics.v
+++ b/src/Tactics.v
@@ -156,3 +156,25 @@ Ltac clear_all :=
  repeat match goal with
           | [ H : _ |- _ ] => clear H
         end.
+Ltac guess tac H :=
+  repeat match type of H with
+           | forall x : ?T, _ =>
+             match type of T with
+               | Prop =>
+                 (let H' := fresh "H'" in
+                   assert (H' : T); [
+                     solve [ tac ]
+                     | generalize (H H'); clear H H'; intro H ])
+                 || fail 1
+               | _ =>
+                 let x := fresh "x" in
+                   evar (x : T);
+                   let x' := eval cbv delta [x] in x in
+                     clear x; generalize (H x'); clear H; intro H
+             end
+         end.
+Ltac guessKeep tac H :=
+  let H' := fresh "H'" in
+    generalize H; intro H'; guess tac H'.