Commit bc911257 authored by Adam Chlipala's avatar Adam Chlipala

Prosified Extensional

parent 2ccd7485
...@@ -18,16 +18,23 @@ Set Implicit Arguments. ...@@ -18,16 +18,23 @@ Set Implicit Arguments.
(** %\chapter{Extensional Transformations}% *) (** %\chapter{Extensional Transformations}% *)
(** TODO: Prose for this chapter *) (** Last chapter's constant folding example was particularly easy to verify, because that transformation used the same source and target language. In this chapter, we verify a different translation, illustrating the added complexities in translating between languages.
Program transformations can be classified as %\textit{%#<i>#intensional#</i>#%}%, when they require some notion of inequality between variables; or %\textit{%#<i>#extensional#</i>#%}%, otherwise. This chapter's example is extensional, and the next chapter deals with the trickier intensional case. *)
(** * Simply-Typed Lambda Calculus *)
Module STLC. (** * CPS Conversion for Simply-Typed Lambda Calculus *)
Module Source.
(** A convenient method for compiling functional programs begins with conversion to %\textit{%#<i>#continuation-passing style#</i>#%}%, or CPS. In this restricted form, function calls never return; instead, we pass explicit return pointers, much as in assembly language. Additionally, we make order of evaluation explicit, breaking complex expressions into sequences of primitive operations.
Our translation will operate over the same source language that we used in the first part of last chapter, so we omit most of the language definition. However, we do make one significant change: since we will be working with multiple languages that involve similar constructs, we use Coq's %\textit{%#<i>#notation scope#</i>#%}% mechanism to disambiguate. For instance, the span of code dealing with type notations looks like this: *)
(* begin hide *)
Module Source.
Inductive type : Type := Inductive type : Type :=
| TNat : type | TNat : type
| Arrow : type -> type -> type. | Arrow : type -> type -> type.
(* end hide *)
Notation "'Nat'" := TNat : source_scope. Notation "'Nat'" := TNat : source_scope.
Infix "-->" := Arrow (right associativity, at level 60) : source_scope. Infix "-->" := Arrow (right associativity, at level 60) : source_scope.
...@@ -36,6 +43,9 @@ Module STLC. ...@@ -36,6 +43,9 @@ Module STLC.
Bind Scope source_scope with type. Bind Scope source_scope with type.
Delimit Scope source_scope with source. Delimit Scope source_scope with source.
(** We explicitly place our notations inside a scope named [source_scope], and we associate a delimiting key [source] with [source_scope]. Without further commands, our notations would only be used in expressions like [(...)%source]. We also open our scope locally within this module, so that we avoid repeating [%source] in many places. Further, we %\textit{%#<i>#bind#</i>#%}% our scope to [type]. In some circumstances where Coq is able to infer that some subexpression has type [type], that subexpression will automatically be parsed in [source_scope]. *)
(* begin hide *)
Section vars. Section vars.
Variable var : type -> Type. Variable var : type -> Type.
...@@ -102,6 +112,9 @@ Module STLC. ...@@ -102,6 +112,9 @@ Module STLC.
end. end.
Definition ExpDenote t (e : Exp t) := expDenote (e _). Definition ExpDenote t (e : Exp t) := expDenote (e _).
(* end hide *)
(** The other critical new ingredient is a generalization of the [Closed] relation from two chapters ago. The new relation [exp_equiv] characters when two expressions may be considered syntactically equal. We need to be able to handle cases where each expression uses a different [var] type. Intuitively, we will want to compare expressions that use their variables to store source-level and target-level values. We express pairs of equivalent variables using a list parameter to the relation; variable expressions will be considered equivalent if and only if their variables belong to this list. The rule for function abstraction extends the list in a higher-order way. The remaining rules just implement the obvious congruence over expressions. *)
(* begin thide *) (* begin thide *)
Section exp_equiv. Section exp_equiv.
...@@ -129,20 +142,22 @@ Module STLC. ...@@ -129,20 +142,22 @@ Module STLC.
-> exp_equiv G (Abs f1) (Abs f2). -> exp_equiv G (Abs f1) (Abs f2).
End exp_equiv. End exp_equiv.
(** It turns out that, for any parametric expression [E], any two instantiations of [E] with particular [var] types must be equivalent, with respect to an empty variable list. The parametricity of Gallina guarantees this, in much the same way that it guaranteed the truth of the axiom about [Closed]. Thus, we assert an analogous axiom here. *)
Axiom Exp_equiv : forall t (E : Exp t) var1 var2, Axiom Exp_equiv : forall t (E : Exp t) var1 var2,
exp_equiv nil (E var1) (E var2). exp_equiv nil (E var1) (E var2).
(* end thide *) (* end thide *)
End Source. End Source.
(** Now we need to define the CPS language, where binary function types are replaced with unary continuation types, and we add product types because they will be useful in our translation. *)
Module CPS. Module CPS.
Inductive type : Type := Inductive type : Type :=
| TNat : type | TNat : type
| Cont : type -> type | Cont : type -> type
| TUnit : type
| Prod : type -> type -> type. | Prod : type -> type -> type.
Notation "'Nat'" := TNat : cps_scope. Notation "'Nat'" := TNat : cps_scope.
Notation "'Unit'" := TUnit : cps_scope.
Notation "t --->" := (Cont t) (at level 61) : cps_scope. Notation "t --->" := (Cont t) (at level 61) : cps_scope.
Infix "**" := Prod (right associativity, at level 60) : cps_scope. Infix "**" := Prod (right associativity, at level 60) : cps_scope.
...@@ -152,6 +167,8 @@ Module STLC. ...@@ -152,6 +167,8 @@ Module STLC.
Section vars. Section vars.
Variable var : type -> Type. Variable var : type -> Type.
(** A CPS program is a series of bindings of primitive operations (primops), followed by either a halt with a final program result or by a call to a continuation. The arguments to these program-ending operations are enforced to be variables. To use the values of compound expressions instead, those expressions must be decomposed into bindings of primops. The primop language itself similarly forces variables for all arguments besides bodies of function abstractions. *)
Inductive prog : Type := Inductive prog : Type :=
| PHalt : | PHalt :
var Nat var Nat
...@@ -166,10 +183,6 @@ Module STLC. ...@@ -166,10 +183,6 @@ Module STLC.
-> prog -> prog
with primop : type -> Type := with primop : type -> Type :=
| Var : forall t,
var t
-> primop t
| Const : nat -> primop Nat | Const : nat -> primop Nat
| Plus : var Nat -> var Nat -> primop Nat | Plus : var Nat -> var Nat -> primop Nat
...@@ -192,7 +205,6 @@ Module STLC. ...@@ -192,7 +205,6 @@ Module STLC.
Implicit Arguments PHalt [var]. Implicit Arguments PHalt [var].
Implicit Arguments App [var t]. Implicit Arguments App [var t].
Implicit Arguments Var [var t].
Implicit Arguments Const [var]. Implicit Arguments Const [var].
Implicit Arguments Plus [var]. Implicit Arguments Plus [var].
Implicit Arguments Abs [var t]. Implicit Arguments Abs [var t].
...@@ -207,8 +219,6 @@ Module STLC. ...@@ -207,8 +219,6 @@ Module STLC.
Notation "! <- p ; e" := (Bind p (fun _ => e)) Notation "! <- p ; e" := (Bind p (fun _ => e))
(right associativity, at level 76, p at next level) : cps_scope. (right associativity, at level 76, p at next level) : cps_scope.
Notation "# v" := (Var v) (at level 70) : cps_scope.
Notation "^ n" := (Const n) (at level 70) : cps_scope. Notation "^ n" := (Const n) (at level 70) : cps_scope.
Infix "+^" := Plus (left associativity, at level 79) : cps_scope. Infix "+^" := Plus (left associativity, at level 79) : cps_scope.
...@@ -223,14 +233,17 @@ Module STLC. ...@@ -223,14 +233,17 @@ Module STLC.
Open Scope cps_scope. Open Scope cps_scope.
(** In interpreting types, we treat continuations as functions with codomain [nat], choosing [nat] as our arbitrary program result type. *)
Fixpoint typeDenote (t : type) : Set := Fixpoint typeDenote (t : type) : Set :=
match t with match t with
| Nat => nat | Nat => nat
| t' ---> => typeDenote t' -> nat | t' ---> => typeDenote t' -> nat
| Unit => unit
| t1 ** t2 => (typeDenote t1 * typeDenote t2)%type | t1 ** t2 => (typeDenote t1 * typeDenote t2)%type
end. end.
(** A mutually-recursive definition establishes the meanings of programs and primops. *)
Fixpoint progDenote (e : prog typeDenote) : nat := Fixpoint progDenote (e : prog typeDenote) : nat :=
match e with match e with
| PHalt n => n | PHalt n => n
...@@ -240,8 +253,6 @@ Module STLC. ...@@ -240,8 +253,6 @@ Module STLC.
with primopDenote t (p : primop typeDenote t) : typeDenote t := with primopDenote t (p : primop typeDenote t) : typeDenote t :=
match p with match p with
| Var _ v => v
| Const n => n | Const n => n
| Plus n1 n2 => n1 + n2 | Plus n1 n2 => n1 + n2
...@@ -256,25 +267,31 @@ Module STLC. ...@@ -256,25 +267,31 @@ Module STLC.
Definition Primop t := forall var, primop var t. Definition Primop t := forall var, primop var t.
Definition ProgDenote (E : Prog) := progDenote (E _). Definition ProgDenote (E : Prog) := progDenote (E _).
Definition PrimopDenote t (P : Primop t) := primopDenote (P _). Definition PrimopDenote t (P : Primop t) := primopDenote (P _).
End CPS. End CPS.
Import Source CPS. Import Source CPS.
(** The translation itself begins with a type-level compilation function. We change every function into a continuation whose argument is a pair, consisting of the translation of the original argument and of an explicit return pointer. *)
(* begin thide *) (* begin thide *)
Fixpoint cpsType (t : Source.type) : CPS.type := Fixpoint cpsType (t : Source.type) : CPS.type :=
match t with match t with
| Nat => Nat%cps | Nat => Nat%cps
| t1 --> t2 => (cpsType t1 ** (cpsType t2 --->) --->)%cps | t1 --> t2 => (cpsType t1 ** (cpsType t2 --->) --->)%cps
end%source. end%source.
Reserved Notation "x <-- e1 ; e2" (right associativity, at level 76, e1 at next level). (** Now we can define the expression translation. The notation [x <-- e1; e2] stands for translating source-level expression [e1], binding [x] to the CPS-level result of running the translated program, and then evaluating CPS-level expression [e2] in that context. *)
Reserved Notation "x <-- e1 ; e2" (right associativity, at level 76, e1 at next level).
Section cpsExp. Section cpsExp.
Variable var : CPS.type -> Type. Variable var : CPS.type -> Type.
Import Source. Import Source.
Open Scope cps_scope. Open Scope cps_scope.
(** We implement a well-known variety of higher-order, one-pass CPS translation. The translation [cpsExp] is parameterized not only by the expression [e] to translate, but also by a meta-level continuation. The idea is that [cpsExp] evaluates the translation of [e] and calls the continuation on the result. With this convention, [cpsExp] itself is a natural match for the notation we just reserved. *)
Fixpoint cpsExp t (e : exp (fun t => var (cpsType t)) t) Fixpoint cpsExp t (e : exp (fun t => var (cpsType t)) t)
: (var (cpsType t) -> prog var) -> prog var := : (var (cpsType t) -> prog var) -> prog var :=
match e with match e with
...@@ -305,31 +322,105 @@ Module STLC. ...@@ -305,31 +322,105 @@ Module STLC.
end end
where "x <-- e1 ; e2" := (cpsExp e1 (fun x => e2)). where "x <-- e1 ; e2" := (cpsExp e1 (fun x => e2)).
End cpsExp. End cpsExp.
Notation "x <-- e1 ; e2" := (cpsExp e1 (fun x => e2)) : cps_scope. (** Since notations do not survive the closing of sections, we redefine the notation associated with [cpsExp]. *)
Notation "! <-- e1 ; e2" := (cpsExp e1 (fun _ => e2))
(right associativity, at level 76, e1 at next level) : cps_scope.
Implicit Arguments cpsExp [var t]. Notation "x <-- e1 ; e2" := (cpsExp e1 (fun x => e2)) : cps_scope.
Definition CpsExp (E : Exp Nat) : Prog :=
fun var => cpsExp (E _) (PHalt (var := _)). Implicit Arguments cpsExp [var t].
(* end thide *)
(** We wrap [cpsExp] into the parametric version [CpsExp], passing an always-halt continuation at the root of the recursion. *)
Eval compute in CpsExp zero. Definition CpsExp (E : Exp Nat) : Prog :=
Eval compute in CpsExp one. fun _ => cpsExp (E _) (PHalt (var := _)).
Eval compute in CpsExp zpo. (* end thide *)
Eval compute in CpsExp app_ident.
Eval compute in CpsExp app_ident'.
Eval compute in ProgDenote (CpsExp zero). Eval compute in CpsExp zero.
Eval compute in ProgDenote (CpsExp one). (** %\vspace{-.15in}% [[
Eval compute in ProgDenote (CpsExp zpo). = fun var : type -> Type => x <- ^0; Halt x
Eval compute in ProgDenote (CpsExp app_ident). : Prog
Eval compute in ProgDenote (CpsExp app_ident'). ]] *)
Eval compute in CpsExp one.
(** %\vspace{-.15in}% [[
= fun var : type -> Type => x <- ^1; Halt x
: Prog
]] *)
Eval compute in CpsExp zpo.
(** %\vspace{-.15in}% [[
= fun var : type -> Type => x <- ^0; x0 <- ^1; x1 <- (x +^ x0); Halt x1
: Prog
]] *)
Eval compute in CpsExp app_ident.
(** %\vspace{-.15in}% [[
= fun var : type -> Type =>
f <- (\ p, x <- #1 p; kf <- #2 p; kf @@ x);
x <- ^0;
x0 <- ^1; x1 <- (x +^ x0); kf <- (\ r, Halt r); p <- [x1, kf]; f @@ p
: Prog
]] *)
Eval compute in CpsExp app_ident'.
(** %\vspace{-.15in}% [[
= fun var : type -> Type =>
f <-
(\ p,
x <- #1 p;
kf <- #2 p;
f <-
(\ p0,
x0 <- #1 p0;
kf0 <- #2 p0; kf1 <- (\ r, kf0 @@ r); p1 <- [x0, kf1]; x @@ p1);
kf @@ f);
f0 <- (\ p, x <- #1 p; kf <- #2 p; kf @@ x);
kf <-
(\ r,
x <- ^0;
x0 <- ^1;
x1 <- (x +^ x0); kf <- (\ r0, Halt r0); p <- [x1, kf]; r @@ p);
p <- [f0, kf]; f @@ p
: Prog
]] *)
Eval compute in ProgDenote (CpsExp zero).
(** %\vspace{-.15in}% [[
= 0
: nat
]] *)
Eval compute in ProgDenote (CpsExp one).
(** %\vspace{-.15in}% [[
= 1
: nat
]] *)
Eval compute in ProgDenote (CpsExp zpo).
(** %\vspace{-.15in}% [[
= 1
: nat
]] *)
Eval compute in ProgDenote (CpsExp app_ident).
(** %\vspace{-.15in}% [[
= 1
: nat
]] *)
Eval compute in ProgDenote (CpsExp app_ident').
(** %\vspace{-.15in}% [[
= 1
: nat
]] *)
(** Our main inductive lemma about [cpsExp] needs a notion of compatibility between source-level and CPS-level values. We express compatibility with a %\textit{%#<i>#logical relation#</i>#%}%; that is, we define a binary relation by recursion on type structure, and the function case of the relation considers functions related if they map related arguments to related results. In detail, the function case is slightly more complicated, since it must deal with our continuation-based calling convention. *)
(* begin thide *) (* begin thide *)
Fixpoint lr (t : Source.type) : Source.typeDenote t -> CPS.typeDenote (cpsType t) -> Prop := Fixpoint lr (t : Source.type)
: Source.typeDenote t -> CPS.typeDenote (cpsType t) -> Prop :=
match t with match t with
| Nat => fun n1 n2 => n1 = n2 | Nat => fun n1 n2 => n1 = n2
| t1 --> t2 => fun f1 f2 => | t1 --> t2 => fun f1 f2 =>
...@@ -339,13 +430,17 @@ Module STLC. ...@@ -339,13 +430,17 @@ Module STLC.
/\ lr _ (f1 x1) r /\ lr _ (f1 x1) r
end%source. end%source.
Lemma cpsExp_correct : forall G t (e1 : exp _ t) (e2 : exp _ t), (** The main lemma is now easily stated and proved. The most surprising aspect of the statement is the presence of %\textit{%#<i>#two#</i>#%}% versions of the expression to be compiled. The first, [e1], uses a [var] choice that makes it a suitable argument to [expDenote]. The second expression, [e2], uses a [var] choice that makes its compilation, [cpsExp e2 k], a suitable argument to [progDenote]. We use [exp_equiv] to assert that [e1] and [e2] have the same underlying structure, up to a variable correspondence list [G]. A hypothesis about [G] ensures that all of its pairs of variables belong to the logical relation [lr]. We also use [lr], in concert with some quantification over continuations and program results, in the conclusion of the lemma.
The lemma's proof should be unsurprising by now. It uses our standard bag of Ltac tricks to help out with quantifier instantiation; [crush] and [eauto] can handle the rest. *)
Lemma cpsExp_correct : forall G t (e1 : exp _ t) (e2 : exp _ t),
exp_equiv G e1 e2 exp_equiv G e1 e2
-> (forall t v1 v2, In (existT _ t (v1, v2)) G -> lr t v1 v2) -> (forall t v1 v2, In (existT _ t (v1, v2)) G -> lr t v1 v2)
-> forall k, exists r, -> forall k, exists r,
progDenote (cpsExp e2 k) = progDenote (k r) progDenote (cpsExp e2 k) = progDenote (k r)
/\ lr t (expDenote e1) r. /\ lr t (expDenote e1) r.
induction 1; crush; fold typeDenote in *; induction 1; crush;
repeat (match goal with repeat (match goal with
| [ H : forall k, exists r, progDenote (cpsExp ?E k) = _ /\ _ | [ H : forall k, exists r, progDenote (cpsExp ?E k) = _ /\ _
|- context[cpsExp ?E ?K] ] => |- context[cpsExp ?E ?K] ] =>
...@@ -361,28 +456,26 @@ Module STLC. ...@@ -361,28 +456,26 @@ Module STLC.
end end
end end
end; crush); eauto. end; crush); eauto.
Qed. Qed.
Lemma vars_easy : forall (t : Source.type) (v1 : Source.typeDenote t) (** A simple lemma establishes the degenerate case of [cpsExp_correct]'s hypothesis about [G]. *)
(v2 : typeDenote (cpsType t)),
In Lemma vars_easy : forall t v1 v2,
(existT In (existT (fun t0 => (Source.typeDenote t0 * typeDenote (cpsType t0))%type) t
(fun t0 : Source.type =>
(Source.typeDenote t0 * typeDenote (cpsType t0))%type) t
(v1, v2)) nil -> lr t v1 v2. (v1, v2)) nil -> lr t v1 v2.
crush. crush.
Qed. Qed.
Theorem CpsExp_correct : forall (E : Exp Nat), (** A manual application of [cpsExp_correct] proves a version applicable to [CpsExp]. This is where we use the axiom [Exp_equiv]. *)
Theorem CpsExp_correct : forall (E : Exp Nat),
ProgDenote (CpsExp E) = ExpDenote E. ProgDenote (CpsExp E) = ExpDenote E.
unfold ProgDenote, CpsExp, ExpDenote; intros; unfold ProgDenote, CpsExp, ExpDenote; intros;
generalize (cpsExp_correct (e1 := E _) (e2 := E _) generalize (cpsExp_correct (e1 := E _) (e2 := E _)
(Exp_equiv _ _ _) vars_easy (PHalt (var := _))); crush. (Exp_equiv _ _ _) vars_easy (PHalt (var := _))); crush.
Qed. Qed.
(* end thide *) (* end thide *)
End STLC.
(** * Exercises *) (** * Exercises *)
......
...@@ -156,3 +156,25 @@ Ltac clear_all := ...@@ -156,3 +156,25 @@ Ltac clear_all :=
repeat match goal with repeat match goal with
| [ H : _ |- _ ] => clear H | [ H : _ |- _ ] => clear H
end. end.
Ltac guess tac H :=
repeat match type of H with
| forall x : ?T, _ =>
match type of T with
| Prop =>
(let H' := fresh "H'" in
assert (H' : T); [
solve [ tac ]
| generalize (H H'); clear H H'; intro H ])
|| fail 1
| _ =>
let x := fresh "x" in
evar (x : T);
let x' := eval cbv delta [x] in x in
clear x; generalize (H x'); clear H; intro H
end
end.
Ltac guessKeep tac H :=
let H' := fresh "H'" in
generalize H; intro H'; guess tac H'.
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment