[sledge semantics] Refactor the memory model

Summary:
LLVM and llair have similar memory models, and we don't want to
duplicate any definitions or theorems. This adds a new memory model
theory which should be understandable in its own right. A heap is a
mapping from addresses to bytes, alongside a set of valid addresses, and
intervals that have been allocated already. Primitives are defined for
allocating and de-allocating as well as reading and writing chuncks of
bytes.

There is also a generic type of structured values, and functions for
converting them to/from byte arrays.

Reviewed By: jberdine

Differential Revision: D17074470

fbshipit-source-id: bdab6089f
master
Scott Owens 5 years ago committed by Facebook Github Bot
parent 28e84f275e
commit 9f44bbc264

@ -8,7 +8,7 @@
(* A mini-LLAIR model, based on the files in sledge/src/llair *) (* A mini-LLAIR model, based on the files in sledge/src/llair *)
open HolKernel boolLib bossLib Parse; open HolKernel boolLib bossLib Parse;
open settingsTheory; open settingsTheory memory_modelTheory;
new_theory "llair"; new_theory "llair";
@ -120,25 +120,19 @@ End
(* ----- Semantic states ----- *) (* ----- Semantic states ----- *)
(* TODO Given the similarities with LLVM, consider moving some definitions into
* a common predecessor theory *)
Datatype:
addr = A num
End
(* These are the values that can be stored in registers. The implementation uses (* These are the values that can be stored in registers. The implementation uses
* integers with a bit-width to represent numbers, and keeps locations and sizes * integers with a bit-width to represent numbers, and keeps locations and sizes
* separate. * separate.
*) *)
Datatype: Datatype:
v = flat_v =
| LocV num | LocV num
| SizeV num | SizeV num
| IntV int num | IntV int num
| AggV (v list)
End End
Type v = ``:flat_v reg_v``
Datatype: Datatype:
pc = <| l : label; i : num |> pc = <| l : label; i : num |>
End End
@ -153,15 +147,7 @@ Datatype:
globals : var |-> word64; globals : var |-> word64;
locals : var |-> v; locals : var |-> v;
stack : frame list; stack : frame list;
(* The set of allocated ranges. heap : unit heap |>
* The llvm model had a bool to indicate whether the range is free-able
* or not, since the memory that the globals is in should never be freed.
* llair does not currently catch this error, so we won't either. If
* llair wants to catch the error in the future, then we can adapt the
* semantics. *)
allocations : (num # num) set;
(* A byte addressed heap *)
heap : addr |-> word8 |>
End End
(* ----- Semantic transitions ----- *) (* ----- Semantic transitions ----- *)

@ -9,7 +9,7 @@
* are relevant for the LLVM -> LLAIR translation, especially exceptions. *) * are relevant for the LLVM -> LLAIR translation, especially exceptions. *)
open HolKernel boolLib bossLib Parse; open HolKernel boolLib bossLib Parse;
open settingsTheory; open settingsTheory memory_modelTheory;
new_theory "llvm"; new_theory "llvm";
@ -137,20 +137,17 @@ End
(* ----- Semantic states ----- *) (* ----- Semantic states ----- *)
Datatype: Datatype:
addr = A num flat_v =
End
Datatype:
v =
| W1V word1 | W1V word1
| W8V word8 | W8V word8
| W32V word32 | W32V word32
| W64V word64 | W64V word64
| AggV (v list)
| PtrV word64 | PtrV word64
| UndefV | UndefV
End End
Type v = ``:flat_v reg_v``
Datatype: Datatype:
pv = <| poison : bool; value : v |> pv = <| poison : bool; value : v |>
End End
@ -170,11 +167,7 @@ Datatype:
globals : glob_var |-> (num # word64); globals : glob_var |-> (num # word64);
locals : reg |-> pv; locals : reg |-> pv;
stack : frame list; stack : frame list;
(* The set of allocated ranges. The bool indicates whether the range is heap : bool heap |>
* free-able or not *)
allocations : (bool # num # num) set;
(* A byte addressed heap, with a poison tag *)
heap : addr |-> bool # word8 |>
End End
(* ----- Things about types ----- *) (* ----- Things about types ----- *)
@ -217,11 +210,11 @@ Definition indices_ok_def:
End End
Inductive value_type: Inductive value_type:
(value_type (IntT W1) (W1V w1)) (value_type (IntT W1) (FlatV (W1V w1)))
(value_type (IntT W8) (W8V w8)) (value_type (IntT W8) (FlatV (W8V w8)))
(value_type (IntT W32) (W32V w32)) (value_type (IntT W32) (FlatV (W32V w32)))
(value_type (IntT W64) (W64V w64)) (value_type (IntT W64) (FlatV (W64V w64)))
(value_type (PtrT _) (PtrV w64)) (value_type (PtrT _) (FlatV (PtrV w64)))
(every (value_type t) vs length vs = n first_class_type t (every (value_type t) vs length vs = n first_class_type t
value_type (ArrT n t) (AggV vs)) value_type (ArrT n t) (AggV vs))
@ -230,30 +223,19 @@ Inductive value_type:
value_type (StrT ts) (AggV vs)) value_type (StrT ts) (AggV vs))
End End
(* ----- Semantic transitions ----- *) Definition extract_type_def:
(extract_type t [] = Some t)
Definition w64_cast_def: (extract_type (ArrT n t) (i::idx) =
(w64_cast w (IntT W1) = Some (W1V (w2w w))) if i < n then
(w64_cast w (IntT W8) = Some (W8V (w2w w))) extract_type t idx
(w64_cast w (IntT W32) = Some (W32V (w2w w))) else
(w64_cast w (IntT W64) = Some (W64V w)) None)
(w64_cast _ _ = None) (extract_type (StrT ts) (i::idx) =
End if i < length ts then
extract_type (el i ts) idx
Definition cast_w64_def: else
(cast_w64 (W1V w) = Some (w2w w)) None)
(cast_w64 (W8V w) = Some (w2w w)) (extract_type _ _ = None)
(cast_w64 (W32V w) = Some (w2w w))
(cast_w64 (W64V w) = Some w)
(cast_w64 _ = None)
End
Definition cast_num_def:
cast_num v = option_map w2n (cast_w64 v)
End
Definition bool_to_v_def:
bool_to_v b = if b then W1V 1w else W1V 0w
End End
(* Calculate the offset given by a list of indices *) (* Calculate the offset given by a list of indices *)
@ -273,26 +255,52 @@ Definition get_offset_def:
(get_offset _ _ = Some 0) (get_offset _ _ = Some 0)
End End
(* ----- Semantic transitions ----- *)
Definition w64_cast_def:
(w64_cast w (IntT W1) = Some (FlatV (W1V (w2w w))))
(w64_cast w (IntT W8) = Some (FlatV (W8V (w2w w))))
(w64_cast w (IntT W32) = Some (FlatV (W32V (w2w w))))
(w64_cast w (IntT W64) = Some (FlatV (W64V w)))
(w64_cast _ _ = None)
End
Definition cast_w64_def:
(cast_w64 (FlatV (W1V w)) = Some (w2w w))
(cast_w64 (FlatV (W8V w)) = Some (w2w w))
(cast_w64 (FlatV (W32V w)) = Some (w2w w))
(cast_w64 (FlatV (W64V w)) = Some w)
(cast_w64 _ = None)
End
Definition cast_num_def:
cast_num v = option_map w2n (cast_w64 v)
End
Definition bool_to_v_def:
bool_to_v b = if b then FlatV (W1V 1w) else FlatV (W1V 0w)
End
Definition eval_const_def: Definition eval_const_def:
(eval_const g (IntC W1 i) = W1V (i2w i)) (eval_const g (IntC W1 i) = FlatV (W1V (i2w i)))
(eval_const g (IntC W8 i) = W8V (i2w i)) (eval_const g (IntC W8 i) = FlatV (W8V (i2w i)))
(eval_const g (IntC W32 i) = W32V (i2w i)) (eval_const g (IntC W32 i) = FlatV (W32V (i2w i)))
(eval_const g (IntC W64 i) = W64V (i2w i)) (eval_const g (IntC W64 i) = FlatV (W64V (i2w i)))
(eval_const g (StrC tconsts) = AggV (map (eval_const g) (map snd tconsts))) (eval_const g (StrC tconsts) = AggV (map (eval_const g) (map snd tconsts)))
(eval_const g (ArrC tconsts) = AggV (map (eval_const g) (map snd tconsts))) (eval_const g (ArrC tconsts) = AggV (map (eval_const g) (map snd tconsts)))
(eval_const g (GepC ty ptr (t, idx) indices) = (eval_const g (GepC ty ptr (t, idx) indices) =
case (eval_const g ptr, cast_num (eval_const g idx)) of case (eval_const g ptr, cast_num (eval_const g idx)) of
| (PtrV w, Some n) => | (FlatV (PtrV w), Some n) =>
let ns = map (λ(t,ci). case cast_num (eval_const g ci) of None => 0 | Some n => n) indices in let ns = map (λ(t,ci). case cast_num (eval_const g ci) of None => 0 | Some n => n) indices in
(case get_offset ty ns of (case get_offset ty ns of
| None => UndefV | None => FlatV UndefV
| Some off => PtrV (n2w (w2n w + sizeof ty * n + off))) | Some off => FlatV (PtrV (n2w (w2n w + sizeof ty * n + off))))
| _ => UndefV) | _ => FlatV UndefV)
(eval_const g (GlobalC var) = (eval_const g (GlobalC var) =
case flookup g var of case flookup g var of
| None => PtrV 0w | None => FlatV (PtrV 0w)
| Some (s,w) => PtrV w) | Some (s,w) => FlatV (PtrV w))
(eval_const g UndefC = UndefV) (eval_const g UndefC = FlatV UndefV)
Termination Termination
WF_REL_TAC `measure (const_size o snd)` >> rw [listTheory.MEM_MAP] >> WF_REL_TAC `measure (const_size o snd)` >> rw [listTheory.MEM_MAP] >>
TRY TRY
@ -306,140 +314,64 @@ End
Definition eval_def: Definition eval_def:
(eval s (Variable v) = (eval s (Variable v) =
case flookup s.locals v of case flookup s.locals v of
| None => <| poison := F; value := W1V 0w |> | None => <| poison := F; value := FlatV (W1V 0w) |>
| Some v => v) | Some v => v)
(eval s (Constant c) = <| poison := F; value := eval_const s.globals c |>) (eval s (Constant c) = <| poison := F; value := eval_const s.globals c |>)
End End
Definition v2n_def: Definition v2n_def:
(v2n (W1V b) = Some (if T then 1 else 0)) (v2n (FlatV (W1V b)) = Some (if T then 1 else 0))
(v2n (W8V w8) = Some (w2n w8)) (v2n (FlatV (W8V w8)) = Some (w2n w8))
(v2n (W32V w32) = Some (w2n w32)) (v2n (FlatV (W32V w32)) = Some (w2n w32))
(v2n (W64V w64) = Some (w2n w64)) (v2n (FlatV (W64V w64)) = Some (w2n w64))
(v2n _ = None) (v2n _ = None)
End End
Definition interval_to_set_def: Definition type_to_shape_def:
interval_to_set (_, start,stop) = (type_to_shape (IntT s) = Flat (sizeof (IntT s)) (IntT s))
{ n | start n n < stop } (type_to_shape (PtrT t) = Flat (sizeof (PtrT t)) (PtrT t))
End (type_to_shape (ArrT n t) = Array (type_to_shape t) n)
(type_to_shape (StrT ts) = Tuple (map type_to_shape ts))
Definition interval_ok_def: Termination
interval_ok ((_:bool), i1, i2) WF_REL_TAC `measure ty_size` >> rw [] >>
i1 i2 i2 < 2 ** 64 Induct_on `ts` >> rw [definition "ty_size_def"] >>
End res_tac >> simp []
Definition is_allocated_def:
is_allocated b1 allocs
interval_ok b1
∃b2. b2 allocs fst b1 = fst b2 interval_to_set b1 interval_to_set b2
End
Definition is_free_def:
is_free b1 allocs
interval_ok b1
∀b2. b2 allocs interval_to_set b1 interval_to_set b2 =
End
Definition get_bytes_def:
get_bytes h (_, start, stop) =
map
(λoff.
case flookup h (A (start + off)) of
| None => (F, 0w)
| Some w => w)
(count_list (stop - start))
End End
Definition set_bytes_def: Definition convert_value_def:
(set_bytes p [] n h = h) (convert_value (IntT W1) w = W1V (w2w w))
(set_bytes p (b::bs) n h = (convert_value (IntT W8) w = W8V (w2w w))
set_bytes p bs (Suc n) (h |+ (A n, (p, b)))) (convert_value (IntT W32) w = W32V (w2w w))
(convert_value (IntT W64) w = W64V w)
(convert_value (PtrT _) w = PtrV w)
End End
(* Allocate a free chunk of memory, and write non-deterministic bytes into it *) Definition bytes_to_llvm_value_def:
Inductive allocate: bytes_to_llvm_value t bs =
v2n v.value = Some m (bytes_to_value (λn t w. convert_value t w) (type_to_shape t) bs)
b = (T, w2n w, w2n w + m * len)
is_free b s.allocations
length bytes = m * len
allocate s v len
(<| poison := v.poison; value := PtrV w |>,
s with <| allocations := { b } s.allocations;
heap := set_bytes v.poison bytes (w2n w) s.heap |>)
End End
Definition deallocate_def: Definition unconvert_value_def:
deallocate addrs allocs h = (unconvert_value (W1V w) = (1, w2w w))
let to_remove = { (T, n, stop) | A n set addrs (T, n, stop) allocs } in (unconvert_value (W8V w) = (1, w2w w))
(allocs DIFF to_remove, fdiff h (image A (bigunion (image interval_to_set to_remove)))) (unconvert_value (W32V w) = (4, w2w w))
(unconvert_value (W64V w) = (8, w))
(unconvert_value (PtrV w) = (8, w))
End End
(* Read len bytes from the list of bytes, and convert it into a word value, Definition llvm_value_to_bytes_def:
* little-endian encoding *) llvm_value_to_bytes v =
Definition le_read_w_def: value_to_bytes unconvert_value v
le_read_w len (bs : word8 list) =
if length bs < len then
(l2w 256 (map w2n bs), [])
else
(l2w 256 (map w2n (take len bs)), drop len bs)
End
(* Return len bytes that are the little-endian encoding of the argument word *)
Definition le_write_w_def:
le_write_w len w =
let (l : word8 list) = map n2w (w2l 256 w) in
take len (l ++ replicate (len - length l) 0w)
End
Definition bytes_to_value_def:
(bytes_to_value (IntT W1) (b::bs) = (W1V (w2w b), bs))
(bytes_to_value (IntT W8) (b::bs) = (W8V b, bs))
(bytes_to_value (IntT W32) bs = (W32V ## I) (le_read_w 4 bs))
(bytes_to_value (IntT W64) bs = (W64V ## I) (le_read_w 8 bs))
(bytes_to_value (PtrT _) bs = (PtrV ## I) (le_read_w 8 bs))
(bytes_to_value (ArrT n t) bs = (AggV ## I) (read_array n t bs))
(bytes_to_value (StrT ts) bs = (AggV ## I) (read_str ts bs))
(read_array 0 t bs = ([], bs))
(read_array (Suc n) t bs =
let (v, bs) = bytes_to_value t bs in
let (rest, bs) = read_array n t bs in
(v::rest, bs))
(read_str [] bs = ([], bs))
(read_str (t::ts) bs =
let (v, bs) = bytes_to_value t bs in
let (rest, bs) = read_str ts bs in
(v::rest, bs))
Termination
WF_REL_TAC `measure (λx. case x of
| INL (t, bs) => ty_size t
| INR (INL (n, t, bs)) => n + ty_size t
| INR (INR (ts, bs)) => ty1_size ts)`
End
Definition value_to_bytes_def:
(value_to_bytes (W1V w) = [w2w w])
(value_to_bytes (W8V w) = [w])
(value_to_bytes (W32V w) = le_write_w 4 w)
(value_to_bytes (W64V w) = le_write_w 8 w)
(value_to_bytes (PtrV n) = le_write_w 8 n)
(value_to_bytes (AggV vs) = flat (map value_to_bytes vs))
Termination
WF_REL_TAC `measure v_size` >>
Induct >> rw [definition "v_size_def"] >>
TRY (first_x_assum drule) >>
decide_tac
End End
Definition do_sub_def: Definition do_sub_def:
do_sub (nuw:bool) (nsw:bool) (v1:pv) (v2:pv) = do_sub (nuw:bool) (nsw:bool) (v1:pv) (v2:pv) =
let (diff, u_overflow, s_overflow) = let (diff, u_overflow, s_overflow) =
case (v1.value, v2.value) of case (v1.value, v2.value) of
| (W1V w1, W1V w2) => (W1V ## I) (add_with_carry (w1, ¬w2, T)) | (FlatV (W1V w1), FlatV (W1V w2)) => (FlatV o W1V ## I) (add_with_carry (w1, ¬w2, T))
| (W8V w1, W8V w2) => (W8V ## I) (add_with_carry (w1, ¬w2, T)) | (FlatV (W8V w1), FlatV (W8V w2)) => (FlatV o W8V ## I) (add_with_carry (w1, ¬w2, T))
| (W32V w1, W32V w2) => (W32V ## I) (add_with_carry (w1, ¬w2, T)) | (FlatV (W32V w1), FlatV (W32V w2)) => (FlatV o W32V ## I) (add_with_carry (w1, ¬w2, T))
| (W64V w1, W64V w2) => (W64V ## I) (add_with_carry (w1, ¬w2, T)) | (FlatV (W64V w1), FlatV (W64V w2)) => (FlatV o W64V ## I) (add_with_carry (w1, ¬w2, T))
in in
let p = ((nuw u_overflow) (nsw s_overflow) v1.poison v2.poison) in let p = ((nuw u_overflow) (nsw s_overflow) v1.poison v2.poison) in
<| poison := p; value := diff |> <| poison := p; value := diff |>
@ -456,11 +388,11 @@ Definition do_icmp_def:
<| poison := (v1.poison v2.poison); <| poison := (v1.poison v2.poison);
value := bool_to_v ( value := bool_to_v (
case (v1.value, v2.value) of case (v1.value, v2.value) of
| (W1V w1, W1V w2) => (get_comp c) w1 w2 | (FlatV (W1V w1), FlatV (W1V w2)) => (get_comp c) w1 w2
| (W8V w1, W8V w2) => (get_comp c) w1 w2 | (FlatV (W8V w1), FlatV (W8V w2)) => (get_comp c) w1 w2
| (W32V w1, W32V w2) => (get_comp c) w1 w2 | (FlatV (W32V w1), FlatV (W32V w2)) => (get_comp c) w1 w2
| (W64V w1, W64V w2) => (get_comp c) w1 w2 | (FlatV (W64V w1), FlatV (W64V w2)) => (get_comp c) w1 w2
| (PtrV w1, PtrV w2) => (get_comp c) w1 w2) |> | (FlatV (PtrV w1), FlatV (PtrV w2)) => (get_comp c) w1 w2) |>
End End
Definition do_phi_def: Definition do_phi_def:
@ -468,21 +400,6 @@ Definition do_phi_def:
option_map (λarg. (id, eval s arg)) (alookup entries from_l) option_map (λarg. (id, eval s arg)) (alookup entries from_l)
End End
Definition extract_type_def:
(extract_type t [] = Some t)
(extract_type (ArrT n t) (i::idx) =
if i < n then
extract_type t idx
else
None)
(extract_type (StrT ts) (i::idx) =
if i < length ts then
extract_type (el i ts) idx
else
None)
(extract_type _ _ = None)
End
Definition extract_value_def: Definition extract_value_def:
(extract_value v [] = Some v) (extract_value v [] = Some v)
(extract_value (AggV vs) (i::indices) = (extract_value (AggV vs) (i::indices) =
@ -519,7 +436,7 @@ End
Inductive step_instr: Inductive step_instr:
(s.stack = fr::st (s.stack = fr::st
deallocate fr.stack_allocs s.allocations s.heap = (new_allocs, new_h) deallocate fr.stack_allocs s.heap = new_h
step_instr prog s step_instr prog s
(Ret (t, a)) (Ret (t, a))
@ -528,7 +445,6 @@ Inductive step_instr:
globals := s.globals; globals := s.globals;
locals := fr.saved_locals; locals := fr.saved_locals;
stack := st; stack := st;
allocations := new_allocs;
heap := new_h |>)) heap := new_h |>))
(* Do the phi assignments in parallel. The manual says "For the purposes of the (* Do the phi assignments in parallel. The manual says "For the purposes of the
@ -542,7 +458,7 @@ Inductive step_instr:
* %r2 = phi [%r1, %l] * %r2 = phi [%r1, %l]
* %r1 = phi [0, %l] * %r1 = phi [0, %l]
*) *)
(eval s a = <| poison := p; value := W1V tf |> (eval s a = <| poison := p; value := FlatV (W1V tf) |>
l = Some (if tf = 1w then l1 else l2) l = Some (if tf = 1w then l1 else l2)
alookup prog s.ip.f = Some d alookup prog s.ip.f = Some d
alookup d.blocks l = Some <| h := Head phis None; body := b |> alookup d.blocks l = Some <| h := Head phis None; body := b |>
@ -579,27 +495,29 @@ Inductive step_instr:
(inc_pc (update_result r (inc_pc (update_result r
<| poison := (v1.poison v2.poison); value := result |> s))) <| poison := (v1.poison v2.poison); value := result |> s)))
(allocate s (eval s a1) (sizeof t) (v2, s2) (eval s a1 = v
v2n v.value = Some n
allocate s.heap (n * sizeof t) v.poison (v2, new_h)
step_instr prog s step_instr prog s
(Alloca r t (t1, a1)) (Alloca r t (t1, a1))
(inc_pc (update_result r v2 s2))) (inc_pc (update_result r v2 (s with heap := new_h))))
(eval s a1 = <| poison := p1; value := PtrV w |> (eval s a1 = <| poison := p1; value := FlatV (PtrV w) |>
interval = (freeable, w2n w, w2n w + sizeof t) interval = Interval freeable (w2n w) (w2n w + sizeof t)
is_allocated interval s.allocations is_allocated interval s.heap
pbytes = get_bytes s.heap interval pbytes = get_bytes s.heap interval
step_instr prog s step_instr prog s
(Load r t (t1, a1)) (Load r t (t1, a1))
(inc_pc (update_result r <| poison := (T set (map fst pbytes)); (inc_pc (update_result r <| poison := (T set (map fst pbytes));
value := fst (bytes_to_value t (map snd pbytes)) |> value := fst (bytes_to_llvm_value t (map snd pbytes)) |>
s))) s)))
(eval s a2 = <| poison := p2; value := PtrV w |> (eval s a2 = <| poison := p2; value := FlatV (PtrV w) |>
interval = (freeable, w2n w, w2n w + sizeof t) interval = Interval freeable (w2n w) (w2n w + sizeof t)
is_allocated interval s.allocations is_allocated interval s.heap
bytes = value_to_bytes (eval s a1).value bytes = llvm_value_to_bytes (eval s a1).value
length bytes = sizeof t length bytes = sizeof t
step_instr prog s step_instr prog s
@ -607,7 +525,7 @@ Inductive step_instr:
(inc_pc (s with heap := set_bytes p2 bytes (w2n w) s.heap))) (inc_pc (s with heap := set_bytes p2 bytes (w2n w) s.heap)))
(map (eval s o snd) tindices = i1::indices (map (eval s o snd) tindices = i1::indices
(eval s a1).value = PtrV w1 (eval s a1).value = FlatV (PtrV w1)
cast_num i1.value = Some n cast_num i1.value = Some n
map (λx. cast_num x.value) indices = map Some ns map (λx. cast_num x.value) indices = map Some ns
get_offset t1 ns = Some off get_offset t1 ns = Some off
@ -616,11 +534,11 @@ Inductive step_instr:
(Gep r t ((PtrT t1), a1) tindices) (Gep r t ((PtrT t1), a1) tindices)
(inc_pc (update_result r (inc_pc (update_result r
<| poison := (v1.poison i1.poison exists (λv. v.poison) indices); <| poison := (v1.poison i1.poison exists (λv. v.poison) indices);
value := PtrV (n2w (w2n w1 + sizeof t1 * n + off)) |> value := FlatV (PtrV (n2w (w2n w1 + sizeof t1 * n + off))) |>
s))) s)))
(eval s a1 = v1 (eval s a1 = v1
v1.value = PtrV w v1.value = FlatV (PtrV w)
w64_cast w t = Some int_v w64_cast w t = Some int_v
step_instr prog s step_instr prog s
@ -632,7 +550,7 @@ Inductive step_instr:
step_instr prog s step_instr prog s
(Inttoptr r (t1, a1) t) (Inttoptr r (t1, a1) t)
(inc_pc (update_result r <| poison := v1.poison; value := PtrV w |> s))) (inc_pc (update_result r <| poison := v1.poison; value := FlatV (PtrV w) |> s)))
(step_instr prog s (step_instr prog s
(Icmp r c t a1 a2) (Icmp r c t a1 a2)
@ -645,7 +563,6 @@ Inductive step_instr:
<| ip := <| f := fname; b := None; i := 0 |>; <| ip := <| f := fname; b := None; i := 0 |>;
locals := alist_to_fmap (zip (map snd d.params, map (eval s o snd) targs)); locals := alist_to_fmap (zip (map snd d.params, map (eval s o snd) targs));
globals := s.globals; globals := s.globals;
allocations:= s.allocations;
stack := stack :=
<| ret := s.ip with i := s.ip.i + 1; <| ret := s.ip with i := s.ip.i + 1;
saved_locals := s.locals; saved_locals := s.locals;
@ -682,29 +599,13 @@ End
(* ----- Invariants on state ----- *) (* ----- Invariants on state ----- *)
(* The allocations are of intervals that don't overlap *)
Definition allocations_ok_def:
allocations_ok s
∀i1 i2.
i1 s.allocations i2 s.allocations
interval_ok i1 interval_ok i2
(interval_to_set i1 interval_to_set i2 i1 = i2)
End
(* The heap maps exactly the address in the allocations *)
Definition heap_ok_def:
heap_ok s
∀n. flookup s.heap (A n) None ∃i. i s.allocations n interval_to_set i
End
(* All global variables are allocated in non-freeable memory *) (* All global variables are allocated in non-freeable memory *)
Definition globals_ok_def: Definition globals_ok_def:
globals_ok s globals_ok s
∀g n w. ∀g n w.
flookup s.globals g = Some (n, w) flookup s.globals g = Some (n, w)
is_allocated (F, w2n w, w2n w + n) s.allocations is_allocated (Interval F (w2n w) (w2n w + n)) s.heap
End End
(* Instruction pointer points to an instruction *) (* Instruction pointer points to an instruction *)
@ -733,7 +634,7 @@ End
Definition frame_ok_def: Definition frame_ok_def:
frame_ok p s f frame_ok p s f
ip_ok p f.ret ip_ok p f.ret
every (λn. ∃start stop. n = A start (T, start, stop) s.allocations) f.stack_allocs every (λn. ∃start stop. n = A start Interval T start stop s.heap.allocations) f.stack_allocs
End End
(* The frames are all of, and no two stack allocations have the same address *) (* The frames are all of, and no two stack allocations have the same address *)
@ -745,7 +646,7 @@ End
Definition state_invariant_def: Definition state_invariant_def:
state_invariant p s state_invariant p s
ip_ok p s.ip allocations_ok s heap_ok s globals_ok s stack_ok p s ip_ok p s.ip heap_ok s.heap globals_ok s stack_ok p s
End End
(* ----- Initial state ----- *) (* ----- Initial state ----- *)
@ -758,19 +659,19 @@ Definition is_init_state_def:
s.ip.i = 0 s.ip.i = 0
s.locals = fempty s.locals = fempty
s.stack = [] s.stack = []
allocations_ok s
globals_ok s globals_ok s
heap_ok s heap_ok s.heap
fdom s.globals = fdom global_init fdom s.globals = fdom global_init
s.heap.valid_addresses = { A n | n < dimword (:64) }
(* The initial allocations for globals are not freeable *) (* The initial allocations for globals are not freeable *)
s.allocations { (F, start, stop) | T } s.heap.allocations { Interval F start stop | T }
(* The heap starts with the initial values of the globals written to their (* The heap starts with the initial values of the globals written to their
* addresses *) * addresses *)
∀g w t v n. ∀g w t v n.
flookup s.globals g = Some (n, w) flookup global_init g = Some (t,v) flookup s.globals g = Some (n, w) flookup global_init g = Some (t,v)
∃bytes. ∃bytes.
get_bytes s.heap (F, w2n w, w2n w + sizeof t) = map (λb. (F,b)) bytes get_bytes s.heap (Interval F (w2n w) (w2n w + sizeof t)) = map (λb. (F,b)) bytes
bytes_to_value t bytes = (v, []) bytes_to_llvm_value t bytes = (v, [])
End End
export_theory(); export_theory();

@ -11,393 +11,95 @@ open HolKernel boolLib bossLib Parse;
open pairTheory listTheory rich_listTheory arithmeticTheory wordsTheory; open pairTheory listTheory rich_listTheory arithmeticTheory wordsTheory;
open pred_setTheory finite_mapTheory; open pred_setTheory finite_mapTheory;
open logrootTheory numposrepTheory; open logrootTheory numposrepTheory;
open settingsTheory llvmTheory; open settingsTheory miscTheory llvmTheory memory_modelTheory;
new_theory "llvm_prop"; new_theory "llvm_prop";
numLib.prefer_num(); numLib.prefer_num();
(* ----- Theorems about list library functions ----- *)
(* Could be upstreamed to HOL *)
Theorem dropWhile_map:
∀P f l. dropWhile P (map f l) = map f (dropWhile (P o f) l)
Proof
Induct_on `l` >> rw []
QED
Theorem dropWhile_prop:
∀P l x. x < length l - length (dropWhile P l) P (el x l)
Proof
Induct_on `l` >> rw [] >>
Cases_on `x` >> fs []
QED
Theorem dropWhile_rev_take:
∀P n l x.
let len = length (dropWhile P (reverse (take n l))) in
x + len < n n length l P (el (x + len) l)
Proof
rw [] >>
`P (el ((n - 1 - x - length (dropWhile P (reverse (take n l))))) (reverse (take n l)))`
by (irule dropWhile_prop >> simp [LENGTH_REVERSE]) >>
rfs [EL_REVERSE, EL_TAKE, PRE_SUB1]
QED
Theorem take_replicate:
∀m n x. take m (replicate n x) = replicate (min m n) x
Proof
Induct_on `n` >> rw [TAKE_def, MIN_DEF] >> fs [] >>
Cases_on `m` >> rw []
QED
Theorem length_take_less_eq:
∀n l. length (take n l) n
Proof
Induct_on `l` >> rw [TAKE_def] >>
Cases_on `n` >> fs []
QED
Theorem flat_drop:
∀n m ls. flat (drop m ls) = drop (length (flat (take m ls))) (flat ls)
Proof
Induct_on `ls` >> rw [DROP_def, DROP_APPEND] >>
irule (GSYM DROP_LENGTH_TOO_LONG) >> simp []
QED
Theorem take_is_prefix:
∀n l. take n l l
Proof
Induct_on `l` >> rw [TAKE_def]
QED
Theorem sum_prefix:
∀l1 l2. l1 l2 sum l1 sum l2
Proof
Induct >> rw [] >> Cases_on `l2` >> fs []
QED
Theorem flookup_fdiff:
∀m s k.
flookup (fdiff m s) k =
if k s then None else flookup m k
Proof
rw [FDIFF_def, FLOOKUP_DRESTRICT] >> fs []
QED
(* ----- Theorems about log ----- *)
(* Could be upstreamed to HOL *)
Theorem mul_div_bound:
∀m n. n 0 m - (n - 1) n * (m DIV n) n * (m DIV n) m
Proof
rw [] >>
`0 < n` by decide_tac >>
drule DIVISION >> disch_then (qspec_then `m` mp_tac) >>
decide_tac
QED
Theorem exp_log_bound:
∀b n. 1 < b n 0 n DIV b + 1 b ** (log b n) b ** (log b n) n
Proof
rw [] >> `0 < n` by decide_tac >>
drule LOG >> disch_then drule >> rw [] >>
fs [ADD1, EXP_ADD] >>
simp [DECIDE ``∀x y. x + 1 y x < y``] >>
`∃x. b = Suc x` by intLib.COOPER_TAC >>
`b * (n DIV b) < b * b ** log b n` suffices_by metis_tac [LESS_MULT_MONO] >>
pop_assum kall_tac >>
`b 0` by decide_tac >>
drule mul_div_bound >> disch_then (qspec_then `n` mp_tac) >>
decide_tac
QED
Theorem log_base_power:
∀n b. 1 < b log b (b ** n) = n
Proof
Induct >> rw [EXP, LOG_1] >>
Cases_on `n` >> rw [LOG_BASE] >>
first_x_assum drule >> rw [] >>
simp [Once EXP, LOG_MULT]
QED
Theorem log_change_base_power:
∀m n b. 1 < b m 0 n 0 log (b ** n) m = log b m DIV n
Proof
rw [] >> irule LOG_UNIQUE >>
rw [ADD1, EXP_MUL, LEFT_ADD_DISTRIB] >>
qmatch_goalsub_abbrev_tac `x DIV _` >>
drule mul_div_bound >> disch_then (qspec_then `x` mp_tac) >> rw []
>- (
irule LESS_LESS_EQ_TRANS >>
qexists_tac `b ** (x+1)` >> rw [] >>
unabbrev_all_tac >>
simp [EXP_ADD] >>
`b * (m DIV b + 1) b * b ** log b m`
by metis_tac [exp_log_bound, LESS_MONO_MULT, MULT_COMM] >>
`m < b * (m DIV b + 1)` suffices_by decide_tac >>
simp [LEFT_ADD_DISTRIB] >>
`b 0` by decide_tac >>
`m - (b - 1) b * (m DIV b)` by metis_tac [mul_div_bound] >>
fs [])
>- (
irule LESS_EQ_TRANS >>
qexists_tac `b ** (log b m)` >> rw [] >>
unabbrev_all_tac >>
metis_tac [exp_log_bound])
QED
(* ----- Theorems about word stuff ----- *)
Theorem l2n_padding:
∀ws n. l2n 256 (ws ++ map w2n (replicate n 0w)) = l2n 256 ws
Proof
Induct >> rw [l2n_def] >>
Induct_on `n` >> rw [l2n_def]
QED
Theorem l2n_0:
∀l b. b 0 every ($> b) l (l2n b l = 0 every ($= 0) l)
Proof
Induct >> rw [l2n_def] >>
eq_tac >> rw []
QED
Theorem mod_n2l:
∀d n. 0 < d map (\x. x MOD d) (n2l d n) = n2l d n
Proof
rw [] >> drule n2l_BOUND >> disch_then (qspec_then `n` mp_tac) >>
qspec_tac (`n2l d n`, `l`) >>
Induct >> rw []
QED
(* ----- Theorems about converting between values and byte lists ----- *) (* ----- Theorems about converting between values and byte lists ----- *)
Theorem le_write_w_length: Theorem value_type_is_fc:
l x. length (le_write_w l w) = l ∀t v. value_type t v first_class_type t
Proof Proof
rw [le_write_w_def] ho_match_mp_tac value_type_ind >> rw [first_class_type_def] >>
fs [LIST_REL_EL_EQN, EVERY_EL]
QED QED
Theorem v2b_size: Theorem sizeof_type_to_shape:
∀t v. value_type t v length (value_to_bytes v) = sizeof t ∀t. first_class_type t sizeof (type_to_shape t) = sizeof t
Proof Proof
ho_match_mp_tac value_type_ind >> recInduct type_to_shape_ind >>
rw [value_to_bytes_def, sizeof_def] rw [type_to_shape_def, memory_modelTheory.sizeof_def, llvmTheory.sizeof_def,
>- metis_tac [le_write_w_length] first_class_type_def, EVERY_MEM] >>
>- metis_tac [le_write_w_length] qid_spec_tac `vs` >> Induct_on `ts` >> rw [] >> fs []
>- metis_tac [le_write_w_length]
>- (Induct_on `vs` >> rw [ADD1] >> fs [])
>- (
pop_assum mp_tac >>
qid_spec_tac `vs` >> qid_spec_tac `ts` >>
ho_match_mp_tac LIST_REL_ind >> rw [])
QED QED
Theorem b2v_size: Theorem value_type_to_shape:
(∀t bs. first_class_type t sizeof t length bs ∀t v.
∃v. bytes_to_value t bs = (v, drop (sizeof t) bs)) value_type t v
(∀n t bs. first_class_type t n * sizeof t length bs ∀s.
∃vs. read_array n t bs = (vs, drop (n * sizeof t) bs)) value_shape (\n t x. n = fst (unconvert_value x) value_type t (FlatV x)) (type_to_shape t) v
(∀ts bs. every first_class_type ts sum (map sizeof ts) length bs
∃vs. read_str ts bs = (vs, drop (sum (map sizeof ts)) bs))
Proof Proof
ho_match_mp_tac bytes_to_value_ind >> ho_match_mp_tac value_type_ind >>
rw [sizeof_def, bytes_to_value_def, le_read_w_def] >> rw [memory_modelTheory.sizeof_def, llvmTheory.sizeof_def, type_to_shape_def,
fs [first_class_type_def] unconvert_value_def, value_shape_def] >>
>- (simp [PAIR_MAP] >> metis_tac [SND]) fs [value_shapes_list_rel, LIST_REL_CONJ, ETA_THM, EVERY2_MAP] >>
>- ( metis_tac [value_type_rules]
pairarg_tac >> rw [] >> pairarg_tac >> rw [] >>
fs [ADD1] >> rw [] >> fs [DROP_DROP_T, LEFT_ADD_DISTRIB])
>- fs [DROP_DROP_T, LEFT_ADD_DISTRIB]
QED QED
Theorem b2v_smaller: Theorem llvm_v2b_size:
∀t bs. first_class_type t sizeof t length bs ∀t v. value_type t v length (llvm_value_to_bytes v) = sizeof t
length (snd (bytes_to_value t bs)) = length bs - sizeof t
Proof Proof
rw [] >> imp_res_tac b2v_size >> rw [llvm_value_to_bytes_def] >>
Cases_on `bytes_to_value t bs` >> fs [] drule value_type_to_shape >> rw [] >>
drule value_type_is_fc >> rw [] >>
drule sizeof_type_to_shape >>
disch_then (mp_tac o GSYM) >> rw [] >>
irule v2b_size >> rw [] >>
qmatch_assum_abbrev_tac `value_shape f _ _` >>
qexists_tac `f` >> rw [] >>
unabbrev_all_tac >> fs []
QED QED
Theorem b2v_append: Theorem b2llvm_v_size:
(∀t bs. first_class_type t sizeof t length bs ∀t bs. first_class_type t sizeof t length bs
bytes_to_value t (bs ++ bs') = (I ## (λx. x ++ bs')) (bytes_to_value t bs)) ∃v. bytes_to_llvm_value t bs = (v, drop (sizeof t) bs)
(∀n t bs. first_class_type t n * sizeof t length bs
∃vs. read_array n t (bs ++ bs') = (I ## (λx. x ++ bs')) (read_array n t bs))
(∀ts bs. every first_class_type ts sum (map sizeof ts) length bs
∃vs. read_str ts (bs ++ bs') = (I ## (λx. x ++ bs')) (read_str ts bs))
Proof Proof
ho_match_mp_tac bytes_to_value_ind >> rw [bytes_to_llvm_value_def] >>
rw [sizeof_def, bytes_to_value_def, le_read_w_def] >> drule sizeof_type_to_shape >> disch_then (mp_tac o GSYM) >> rw [] >>
fs [first_class_type_def, TAKE_APPEND, DROP_APPEND, fs [PAIR_MAP] >>
DECIDE ``!x y. x y x - y = 0n``, ETA_THM] metis_tac [SND, b2v_size]
>- (simp [PAIR_MAP] >> metis_tac [SND])
>- (simp [PAIR_MAP] >> metis_tac [SND])
>- (
rpt (pairarg_tac >> simp []) >> fs [ADD1] >>
BasicProvers.VAR_EQ_TAC >> fs [LEFT_ADD_DISTRIB] >>
first_x_assum irule >>
`sizeof t length bs` by decide_tac >>
imp_res_tac b2v_smaller >> rfs [])
>- (
rpt (pairarg_tac >> simp []) >> fs [ADD1] >>
BasicProvers.VAR_EQ_TAC >> fs [LEFT_ADD_DISTRIB] >>
first_x_assum irule >>
`sizeof t length bs` by decide_tac >>
imp_res_tac b2v_smaller >> rfs [])
QED QED
Theorem le_read_write: Theorem b2llvm_v_smaller:
∀n w bs. ∀t bs. first_class_type t sizeof t length bs
n 0 dimword (:'a) 256 ** n le_read_w n (le_write_w n (w :'a word) bs) = (w, bs) length (snd (bytes_to_llvm_value t bs)) = length bs - sizeof t
Proof Proof
rw [le_read_w_def, le_write_w_length] rw [bytes_to_llvm_value_def] >>
>- ( metis_tac [b2v_smaller, sizeof_type_to_shape]
`take n (le_write_w n w bs) = le_write_w n w`
by metis_tac [le_write_w_length, TAKE_LENGTH_APPEND] >>
simp [le_write_w_def, w2l_def, l2w_def] >>
Cases_on `w` >> simp [] >> fs [l2n_padding, TAKE_APPEND, take_replicate] >>
simp [MAP_TAKE, MAP_MAP_o, combinTheory.o_DEF, mod_n2l] >>
rename1 `n2l 256 m` >>
`length (n2l 256 m) n`
by (
rw [LENGTH_n2l] >>
`256 = 2 ** 8` by EVAL_TAC >>
ASM_REWRITE_TAC [] >> simp [log_change_base_power, GSYM LESS_EQ] >>
`n2w m 0w` by simp [] >>
drule LOG2_w2n_lt >> rw [] >> fs [bitTheory.LOG2_def, dimword_def] >>
`8 * (log 2 m DIV 8) log 2 m` by metis_tac [mul_div_bound, EVAL ``8 0n``] >>
`LOG 2 (2 ** dimindex (:'a)) LOG 2 (256 ** n)` by simp [LOG_LE_MONO] >>
pop_assum mp_tac >>
`256 = 2 ** 8` by EVAL_TAC >>
ASM_REWRITE_TAC [EXP_MUL] >> simp [log_base_power]) >>
simp [mod_n2l, l2n_n2l, TAKE_LENGTH_TOO_LONG])
>- metis_tac [le_write_w_length, DROP_LENGTH_APPEND]
QED QED
Theorem le_write_read: Theorem b2llvm_v_append:
∀n w bs bs'. ∀t bs bs'. first_class_type t sizeof t length bs
256 ** n dimword (:'a) bytes_to_llvm_value t (bs ++ bs') = (I ## (λx. x ++ bs')) (bytes_to_llvm_value t bs)
n length bs
le_read_w n bs = (w:'a word, bs')
le_write_w n w ++ bs' = bs
Proof Proof
rw [le_read_w_def] >> rw [bytes_to_llvm_value_def] >>
qmatch_goalsub_abbrev_tac `l2w _ l` >> drule sizeof_type_to_shape >> disch_then (mp_tac o GSYM) >> rw [] >> fs [] >>
`le_write_w n (l2w 256 l) = take n bs` suffices_by metis_tac [TAKE_DROP] >> rw [PAIR_MAP, b2v_append]
simp [le_write_w_def, w2l_l2w] >>
`l2n 256 l < 256 ** n`
by (
`n length bs` by decide_tac >>
metis_tac [l2n_lt, LENGTH_TAKE, LENGTH_MAP, EVAL ``0n < 256``]) >>
fs [] >>
`every ($> 256) l`
by (
simp [EVERY_MAP, Abbr `l`] >> irule EVERY_TAKE >> simp [] >>
rpt (pop_assum kall_tac) >>
Induct_on `bs` >> rw [] >>
Cases_on `h` >> fs []) >>
rw [n2l_l2n]
>- (
rw [TAKE_def, take_replicate] >>
Cases_on `n` >> fs [] >>
rfs [l2n_0] >> unabbrev_all_tac >> fs [EVERY_MAP] >>
ONCE_REWRITE_TAC [GSYM REPLICATE] >>
qmatch_goalsub_abbrev_tac `take n _` >>
qpat_assum `¬(_ < _)` mp_tac >>
qpat_assum `every (\x. 0 = w2n x) _` mp_tac >>
rpt (pop_assum kall_tac) >>
qid_spec_tac `bs` >>
Induct_on `n` >> rw [] >>
Cases_on `bs` >> rw [] >> fs [] >>
Cases_on `h` >> fs [] >>
first_x_assum irule >> rw [] >>
irule MONO_EVERY >>
qexists_tac `(λx. 0 = w2n x)` >> rw []) >>
fs [MAP_TAKE, MAP_MAP_o, combinTheory.o_DEF] >>
`exists (\y. 0 y) l`
by (
fs [l2n_eq_0, combinTheory.o_DEF] >> fs [EXISTS_MEM, EVERY_MEM] >>
qexists_tac `x` >> rfs [MOD_MOD, GREATER_DEF]) >>
simp [LOG_l2n_dropWhile] >>
`length (dropWhile ($= 0) (reverse l)) 0`
by (
Cases_on `l` >> fs [dropWhile_eq_nil, combinTheory.o_DEF, EXISTS_REVERSE]) >>
`0 < length (dropWhile ($= 0) (reverse l))` by decide_tac >>
fs [SUC_PRE] >>
`map n2w l = take n bs`
by (simp [Abbr `l`, MAP_TAKE, MAP_MAP_o, combinTheory.o_DEF, n2w_w2n]) >>
simp [TAKE_TAKE_MIN] >>
`length l = n` by simp [Abbr `l`] >>
`length (dropWhile ($= 0) (reverse l)) n`
by metis_tac [LESS_EQ_TRANS, LENGTH_dropWhile_LESS_EQ, LENGTH_REVERSE] >>
rw [MIN_DEF] >> fs []
>- (
simp [TAKE_APPEND, TAKE_TAKE_MIN, MIN_DEF, take_replicate] >>
`replicate (length l length (dropWhile ($= 0) (reverse l))) 0w =
take (length l (length (dropWhile ($= 0) (reverse l)))) (drop (length (dropWhile ($= 0) (reverse l))) bs)`
suffices_by (rw [] >> irule take_drop_partition >> simp []) >>
rw [LIST_EQ_REWRITE, EL_REPLICATE, EL_TAKE, EL_DROP] >>
`length (dropWhile ($= 0) (reverse l)) =
length (dropWhile (λx. 0 = w2n x) (reverse (take (length l) bs)))`
by (
`reverse l = reverse (take (length l) (map w2n bs))` by metis_tac [] >>
ONCE_ASM_REWRITE_TAC [] >>
qpat_x_assum `Abbrev (l = _)` kall_tac >>
simp [GSYM MAP_TAKE, GSYM MAP_REVERSE, dropWhile_map, combinTheory.o_DEF]) >>
fs [] >>
`x + length (dropWhile (λx. 0 = w2n x) (reverse (take (length l) bs))) < length l` by decide_tac >>
drule (SIMP_RULE std_ss [LET_THM] dropWhile_rev_take) >>
rw [] >>
REWRITE_TAC [GSYM w2n_11, word_0_n2w] >>
simp [])
>- rw [TAKE_APPEND, TAKE_TAKE]
QED QED
Theorem b2v_v2b: Theorem b2v_llvm_v2b:
∀v t bs. value_type t v bytes_to_value t (value_to_bytes v ++ bs) = (v, bs) ∀v t bs. value_type t v bytes_to_llvm_value t (llvm_value_to_bytes v ++ bs) = (v, bs)
Proof Proof
gen_tac >> completeInduct_on `v_size v` >> rw [bytes_to_llvm_value_def, llvm_value_to_bytes_def] >>
rw [] >> drule value_type_to_shape >> rw [] >>
pop_assum mp_tac >> simp [value_type_cases] >> qmatch_assum_abbrev_tac `value_shape f _ _` >>
rw [] >> irule b2v_v2b >>
rw [bytes_to_value_def, value_to_bytes_def, le_read_write] qexists_tac `f` >> rw [] >>
>- wordsLib.WORD_DECIDE_TAC unabbrev_all_tac >> fs [] >>
>- ( fs [unconvert_value_def, convert_value_def, value_type_cases] >>
qmatch_abbrev_tac `_ x = _` >> wordsLib.WORD_DECIDE_TAC
`x = (vs, bs)` suffices_by (simp [PAIR_MAP] >> metis_tac [PAIR_EQ, FST, SND]) >>
unabbrev_all_tac >>
qid_spec_tac `bs` >> Induct_on `vs` >> simp [bytes_to_value_def] >>
rw [] >> fs [v_size_def] >>
pairarg_tac >> fs [] >>
pairarg_tac >> fs [] >>
rename1 `value_type t v1` >>
first_x_assum (qspec_then `v_size v1` mp_tac) >> simp [] >>
disch_then (qspec_then `v1` mp_tac) >> simp [] >>
disch_then (qspec_then `t` mp_tac) >> simp [] >>
qmatch_assum_abbrev_tac `bytes_to_value _ (_ ++ bs1 ++ _) = _` >>
disch_then (qspec_then `bs1++bs` mp_tac) >> simp [] >>
unabbrev_all_tac >> strip_tac >> fs [] >>
first_x_assum (qspec_then `bs` mp_tac) >> rw [])
>- (
qmatch_abbrev_tac `_ x = _` >>
`x = (vs, bs)` suffices_by (simp [PAIR_MAP] >> metis_tac [PAIR_EQ, FST, SND]) >>
unabbrev_all_tac >>
pop_assum mp_tac >>
qid_spec_tac `bs` >> qid_spec_tac `ts` >> Induct_on `vs` >> simp [bytes_to_value_def] >>
rw [] >> fs [v_size_def, bytes_to_value_def] >>
pairarg_tac >> fs [] >>
pairarg_tac >> fs [] >>
rename1 `value_type t v1` >>
first_x_assum (qspec_then `v_size v1` mp_tac) >> simp [] >>
disch_then (qspec_then `v1` mp_tac) >> simp [] >>
disch_then (qspec_then `t` mp_tac) >> simp [] >>
qmatch_assum_abbrev_tac `bytes_to_value _ (_ ++ bs1 ++ _) = _` >>
disch_then (qspec_then `bs1++bs` mp_tac) >> simp [] >>
unabbrev_all_tac >> strip_tac >> fs [] >>
first_x_assum drule >> metis_tac [PAIR_EQ])
QED QED
(* ----- Theorems about insert/extract value and get_offset ----- *) (* ----- Theorems about insert/extract value and get_offset ----- *)
@ -482,7 +184,7 @@ Theorem offset_size_leq:
n sizeof t n sizeof t
Proof Proof
recInduct get_offset_ind >> rw [get_offset_def, sizeof_def, indices_in_range_def] >> recInduct get_offset_ind >> rw [get_offset_def, llvmTheory.sizeof_def, indices_in_range_def] >>
BasicProvers.EVERY_CASE_TAC >> fs [] >> rw [] >> rfs [] BasicProvers.EVERY_CASE_TAC >> fs [] >> rw [] >> rfs []
>- ( >- (
`x + i * sizeof t (i + 1) * sizeof t` by decide_tac >> `x + i * sizeof t (i + 1) * sizeof t` by decide_tac >>
@ -495,13 +197,6 @@ Proof
drule sum_prefix >> rw [SUM_APPEND] drule sum_prefix >> rw [SUM_APPEND]
QED QED
Theorem value_type_is_fc:
∀t v. value_type t v first_class_type t
Proof
ho_match_mp_tac value_type_ind >> rw [first_class_type_def] >>
fs [LIST_REL_EL_EQN, EVERY_EL]
QED
Theorem extract_type_fc: Theorem extract_type_fc:
∀t is t'. extract_type t is = Some t' first_class_type t first_class_type t' ∀t is t'. extract_type t is = Some t' first_class_type t first_class_type t'
Proof Proof
@ -517,7 +212,7 @@ Theorem extract_offset_size:
sizeof t' sizeof t - n sizeof t' sizeof t - n
Proof Proof
recInduct get_offset_ind >> rw [get_offset_def, extract_type_def] >> recInduct get_offset_ind >> rw [get_offset_def, extract_type_def] >>
BasicProvers.EVERY_CASE_TAC >> fs [sizeof_def] >> rfs [] >> rw [ETA_THM] BasicProvers.EVERY_CASE_TAC >> fs [llvmTheory.sizeof_def] >> rfs [] >> rw [ETA_THM]
>- ( >- (
`sizeof t (v1 i) * sizeof t` suffices_by decide_tac >> `sizeof t (v1 i) * sizeof t` suffices_by decide_tac >>
`1 v1 - i` by decide_tac >> `1 v1 - i` by decide_tac >>
@ -529,6 +224,12 @@ Proof
Induct_on `ts` >> rw [TAKE_def, EL_CONS, PRE_SUB1] Induct_on `ts` >> rw [TAKE_def, EL_CONS, PRE_SUB1]
QED QED
Theorem llvm_value_to_bytes_agg:
∀vs. llvm_value_to_bytes (AggV vs) = flat (map llvm_value_to_bytes vs)
Proof
Induct >> rw [] >> fs [llvm_value_to_bytes_def, value_to_bytes_def]
QED
Theorem read_from_offset_extract: Theorem read_from_offset_extract:
∀t indices n v t'. ∀t indices n v t'.
indices_in_range t indices indices_in_range t indices
@ -536,55 +237,55 @@ Theorem read_from_offset_extract:
value_type t v value_type t v
extract_type t indices = Some t' extract_type t indices = Some t'
extract_value v indices = Some (fst (bytes_to_value t' (drop n (value_to_bytes v)))) extract_value v indices = Some (fst (bytes_to_llvm_value t' (drop n (llvm_value_to_bytes v))))
Proof Proof
recInduct get_offset_ind >> recInduct get_offset_ind >>
rw [extract_value_def, get_offset_def, extract_type_def, indices_in_range_def] >> rw [extract_value_def, get_offset_def, extract_type_def, indices_in_range_def] >>
simp [DROP_0] simp [DROP_0]
>- metis_tac [APPEND_NIL, FST, b2v_v2b] >> >- metis_tac [APPEND_NIL, FST, b2v_llvm_v2b] >>
qpat_x_assum `value_type _ _` mp_tac >> qpat_x_assum `value_type _ _` mp_tac >>
simp [Once value_type_cases] >> rw [] >> simp [extract_value_def] >> simp [Once value_type_cases] >> rw [] >> simp [extract_value_def] >>
qpat_x_assum `_ = Some n` mp_tac >> CASE_TAC >> rw [] >> rfs [] >> qpat_x_assum `_ = Some n` mp_tac >> CASE_TAC >> rw [] >> rfs [] >>
simp [value_to_bytes_def] simp [llvm_value_to_bytes_agg]
>- ( >- (
`value_type t (el i vs)` by metis_tac [EVERY_EL] >> `value_type t (el i vs)` by metis_tac [EVERY_EL] >>
first_x_assum drule >> first_x_assum drule >>
rw [] >> simp [GSYM DROP_DROP_T, ETA_THM] >> rw [] >> simp [GSYM DROP_DROP_T, ETA_THM] >>
`i * sizeof t = length (flat (take i (map value_to_bytes vs)))` `i * sizeof t = length (flat (take i (map llvm_value_to_bytes vs)))`
by ( by (
simp [LENGTH_FLAT, MAP_TAKE, MAP_MAP_o, combinTheory.o_DEF] >> simp [LENGTH_FLAT, MAP_TAKE, MAP_MAP_o, combinTheory.o_DEF] >>
`map (λx. length (value_to_bytes x)) vs = replicate (length vs) (sizeof t)` `map (λx. length (llvm_value_to_bytes x)) vs = replicate (length vs) (sizeof t)`
by ( by (
qpat_x_assum `every _ _` mp_tac >> rpt (pop_assum kall_tac) >> qpat_x_assum `every _ _` mp_tac >> rpt (pop_assum kall_tac) >>
Induct_on `vs` >> rw [v2b_size]) >> Induct_on `vs` >> rw [llvm_v2b_size]) >>
rw [take_replicate, MIN_DEF]) >> rw [take_replicate, MIN_DEF]) >>
rw [GSYM flat_drop, GSYM MAP_DROP] >> rw [GSYM flat_drop, GSYM MAP_DROP] >>
drule DROP_CONS_EL >> simp [DROP_APPEND] >> disch_then kall_tac >> drule DROP_CONS_EL >> simp [DROP_APPEND] >> disch_then kall_tac >>
`first_class_type t'` by metis_tac [value_type_is_fc, extract_type_fc] >> `first_class_type t'` by metis_tac [value_type_is_fc, extract_type_fc] >>
`sizeof t' length (drop x (value_to_bytes (el i vs)))` `sizeof t' length (drop x (llvm_value_to_bytes (el i vs)))`
by (simp [LENGTH_DROP] >> drule v2b_size >> rw [] >> metis_tac [extract_offset_size]) >> by (simp [LENGTH_DROP] >> drule llvm_v2b_size >> rw [] >> metis_tac [extract_offset_size]) >>
simp [b2v_append]) simp [b2llvm_v_append])
>- metis_tac [LIST_REL_LENGTH] >- metis_tac [LIST_REL_LENGTH]
>- ( >- (
`value_type (el i ts) (el i vs)` by metis_tac [LIST_REL_EL_EQN] >> `value_type (el i ts) (el i vs)` by metis_tac [LIST_REL_EL_EQN] >>
first_x_assum drule >> first_x_assum drule >>
rw [] >> simp [GSYM DROP_DROP_T, ETA_THM] >> rw [] >> simp [GSYM DROP_DROP_T, ETA_THM] >>
`sum (map sizeof (take i ts)) = length (flat (take i (map value_to_bytes vs)))` `sum (map sizeof (take i ts)) = length (flat (take i (map llvm_value_to_bytes vs)))`
by ( by (
simp [LENGTH_FLAT, MAP_TAKE, MAP_MAP_o, combinTheory.o_DEF] >> simp [LENGTH_FLAT, MAP_TAKE, MAP_MAP_o, combinTheory.o_DEF] >>
`map sizeof ts = map (\x. length (value_to_bytes x)) vs` `map sizeof ts = map (\x. length (llvm_value_to_bytes x)) vs`
by ( by (
qpat_x_assum `list_rel _ _ _` mp_tac >> rpt (pop_assum kall_tac) >> qpat_x_assum `list_rel _ _ _` mp_tac >> rpt (pop_assum kall_tac) >>
qid_spec_tac `ts` >> qid_spec_tac `ts` >>
Induct_on `vs` >> rw [] >> rw [v2b_size]) >> Induct_on `vs` >> rw [] >> rw [llvm_v2b_size]) >>
rw []) >> rw []) >>
rw [GSYM flat_drop, GSYM MAP_DROP] >> rw [GSYM flat_drop, GSYM MAP_DROP] >>
`i < length vs` by metis_tac [LIST_REL_LENGTH] >> `i < length vs` by metis_tac [LIST_REL_LENGTH] >>
drule DROP_CONS_EL >> simp [DROP_APPEND] >> disch_then kall_tac >> drule DROP_CONS_EL >> simp [DROP_APPEND] >> disch_then kall_tac >>
`first_class_type t'` by metis_tac [value_type_is_fc, extract_type_fc] >> `first_class_type t'` by metis_tac [value_type_is_fc, extract_type_fc] >>
`sizeof t' length (drop x (value_to_bytes (el i vs)))` `sizeof t' length (drop x (llvm_value_to_bytes (el i vs)))`
by (simp [LENGTH_DROP] >> drule v2b_size >> rw [] >> metis_tac [extract_offset_size]) >> by (simp [LENGTH_DROP] >> drule llvm_v2b_size >> rw [] >> metis_tac [extract_offset_size]) >>
simp [b2v_append]) simp [b2llvm_v_append])
QED QED
(* ----- Theorems about the step function ----- *) (* ----- Theorems about the step function ----- *)
@ -615,53 +316,28 @@ Proof
globals_ok_def, stack_ok_def, heap_ok_def, EVERY_EL, frame_ok_def] globals_ok_def, stack_ok_def, heap_ok_def, EVERY_EL, frame_ok_def]
QED QED
Theorem flookup_set_bytes:
∀poison bytes n h n'.
flookup (set_bytes poison bytes n h) (A n') =
if n n' n' < n + length bytes then
Some (poison, el (n' - n) bytes)
else
flookup h (A n')
Proof
Induct_on `bytes` >> rw [set_bytes_def, EL_CONS, PRE_SUB1] >>
fs [ADD1, FLOOKUP_UPDATE] >>
`n = n'` by decide_tac >>
rw []
QED
Theorem allocate_invariant: Theorem allocate_invariant:
∀p s1 v1 t v2 s2. ∀p s1 v1 t v2 h2.
state_invariant p s1 allocate s1 v1 t (v2,s2) state_invariant p s2 state_invariant p s1 allocate s1.heap v1 t (v2,h2) state_invariant p (s1 with heap := h2)
Proof Proof
rw [allocate_cases, state_invariant_def, ip_ok_def, heap_ok_def, rw [state_invariant_def, ip_ok_def, globals_ok_def, stack_ok_def]
globals_ok_def, stack_ok_def] >> >- metis_tac [allocate_heap_ok]
rw [] >> fs [] >- (fs [is_allocated_def] >> metis_tac [allocate_unchanged, SUBSET_DEF])
>- ( >- (
fs [allocations_ok_def] >> rpt gen_tac >> disch_tac >> fs [is_free_def] >> rw [] >> fs [EVERY_EL, frame_ok_def, allocate_unchanged] >> rw [] >>
metis_tac [INTER_COMM]) metis_tac [allocate_unchanged, SUBSET_DEF])
>- (
rw [flookup_set_bytes]
>- rw [RIGHT_AND_OVER_OR, EXISTS_OR_THM, interval_to_set_def] >>
eq_tac >> rw [] >> fs [interval_to_set_def] >>
metis_tac [])
>- (fs [is_allocated_def] >> metis_tac [])
>- (fs [EVERY_EL, frame_ok_def] >> rw [] >> metis_tac [])
QED QED
Theorem set_bytes_invariant: Theorem set_bytes_invariant:
∀s poison bytes n prog b. ∀s poison bytes n prog b.
state_invariant prog s is_allocated (b, n, n + length bytes) s.allocations state_invariant prog s is_allocated (Interval b n (n + length bytes)) s.heap
state_invariant prog (s with heap := set_bytes poison bytes n s.heap) state_invariant prog (s with heap := set_bytes poison bytes n s.heap)
Proof Proof
rw [state_invariant_def] rw [state_invariant_def]
>- (fs [allocations_ok_def] >> rw [] >> metis_tac []) >- metis_tac [set_bytes_heap_ok]
>- ( >- (fs [globals_ok_def, is_allocated_def, set_bytes_unchanged] >> metis_tac [])
fs [heap_ok_def, flookup_set_bytes] >> rw [] >> >- (fs [stack_ok_def, EVERY_EL, frame_ok_def, set_bytes_unchanged])
fs [is_allocated_def, interval_to_set_def, SUBSET_DEF] >>
metis_tac [LESS_EQ_REFL, DECIDE ``!x y. x < x + SUC y``])
>- (fs [globals_ok_def] >> metis_tac [])
>- (fs [stack_ok_def, EVERY_EL, frame_ok_def])
QED QED
Theorem step_instr_invariant: Theorem step_instr_invariant:
@ -676,8 +352,10 @@ Proof
>- ( >- (
fs [stack_ok_def] >> rfs [EVERY_EL, frame_ok_def] >> fs [stack_ok_def] >> rfs [EVERY_EL, frame_ok_def] >>
first_x_assum (qspec_then `0` mp_tac) >> simp []) first_x_assum (qspec_then `0` mp_tac) >> simp [])
>- (fs [deallocate_def, allocations_ok_def] >> rw [] >> metis_tac [])
>- ( >- (
fs [heap_ok_def, deallocate_def, allocations_ok_def] >> rw []
>- metis_tac []
>- metis_tac [] >>
fs [deallocate_def, heap_ok_def] >> rw [flookup_fdiff] >> fs [deallocate_def, heap_ok_def] >> rw [flookup_fdiff] >>
eq_tac >> rw [] eq_tac >> rw []
>- metis_tac [optionTheory.NOT_IS_SOME_EQ_NONE] >- metis_tac [optionTheory.NOT_IS_SOME_EQ_NONE]
@ -686,7 +364,7 @@ Proof
>- ( >- (
fs [globals_ok_def, deallocate_def] >> rw [] >> fs [globals_ok_def, deallocate_def] >> rw [] >>
first_x_assum drule >> rw [] >> fs [is_allocated_def] >> first_x_assum drule >> rw [] >> fs [is_allocated_def] >>
qexists_tac `b2` >> rw [] >> CCONTR_TAC >> fs []) qexists_tac `b2` >> rw [] >> CCONTR_TAC >> fs [interval_freeable_def])
>- ( >- (
fs [stack_ok_def, EVERY_MEM, frame_ok_def, deallocate_def] >> rfs [] >> fs [stack_ok_def, EVERY_MEM, frame_ok_def, deallocate_def] >> rfs [] >>
rw [] rw []
@ -702,8 +380,6 @@ Proof
rw [ip_ok_def] >> fs [prog_ok_def, NOT_NIL_EQ_LENGTH_NOT_0] >> rw [ip_ok_def] >> fs [prog_ok_def, NOT_NIL_EQ_LENGTH_NOT_0] >>
qpat_x_assum `alookup _ (Fn "main") = _` kall_tac >> qpat_x_assum `alookup _ (Fn "main") = _` kall_tac >>
last_x_assum drule >> disch_then drule >> fs []) last_x_assum drule >> disch_then drule >> fs [])
>- (fs [allocations_ok_def] >> metis_tac [])
>- (fs [heap_ok_def] >> metis_tac [])
>- (fs [globals_ok_def] >> metis_tac []) >- (fs [globals_ok_def] >> metis_tac [])
>- (fs [stack_ok_def, frame_ok_def, EVERY_MEM] >> metis_tac [])) >- (fs [stack_ok_def, frame_ok_def, EVERY_MEM] >> metis_tac []))
>- ( (* Br *) >- ( (* Br *)
@ -712,8 +388,6 @@ Proof
rw [ip_ok_def] >> fs [prog_ok_def, NOT_NIL_EQ_LENGTH_NOT_0] >> rw [ip_ok_def] >> fs [prog_ok_def, NOT_NIL_EQ_LENGTH_NOT_0] >>
qpat_x_assum `alookup _ (Fn "main") = _` kall_tac >> qpat_x_assum `alookup _ (Fn "main") = _` kall_tac >>
last_x_assum drule >> disch_then drule >> fs []) last_x_assum drule >> disch_then drule >> fs [])
>- (fs [allocations_ok_def] >> metis_tac [])
>- (fs [heap_ok_def] >> metis_tac [])
>- (fs [globals_ok_def] >> metis_tac []) >- (fs [globals_ok_def] >> metis_tac [])
>- (fs [stack_ok_def, frame_ok_def, EVERY_MEM] >> metis_tac [])) >- (fs [stack_ok_def, frame_ok_def, EVERY_MEM] >> metis_tac []))
>- ( >- (
@ -752,7 +426,6 @@ Proof
>- ( (* Call *) >- ( (* Call *)
rw [state_invariant_def] rw [state_invariant_def]
>- (fs [prog_ok_def, ip_ok_def] >> metis_tac [NOT_NIL_EQ_LENGTH_NOT_0]) >- (fs [prog_ok_def, ip_ok_def] >> metis_tac [NOT_NIL_EQ_LENGTH_NOT_0])
>- (fs [state_invariant_def, allocations_ok_def] >> metis_tac [])
>- (fs [state_invariant_def, heap_ok_def] >> metis_tac []) >- (fs [state_invariant_def, heap_ok_def] >> metis_tac [])
>- (fs [state_invariant_def, globals_ok_def] >> metis_tac []) >- (fs [state_invariant_def, globals_ok_def] >> metis_tac [])
>- ( >- (

@ -344,7 +344,7 @@ Definition generate_move_blocks_list_def:
(used_names, new_blocks :: new_blocks2)) (used_names, new_blocks :: new_blocks2))
End End
(* Givel an association list of labels and phi-block pairs, remove the phi's, (* Given an association list of labels and phi-block pairs, remove the phi's,
* by generating an extra block along each control flow edge that does the move * by generating an extra block along each control flow edge that does the move
* corresponding to the relevant phis. *) * corresponding to the relevant phis. *)
Definition remove_phis_def: Definition remove_phis_def:

@ -0,0 +1,570 @@
(*
* Copyright (c) Facebook, Inc. and its affiliates.
*
* This source code is licensed under the MIT license found in the
* LICENSE file in the root directory of this source tree.
*)
(* A simple, concrete memory model where the heap is an array of bytes. This is
* how llair views memory, and how we give semantics to llvm. Although LLVM's
* real memory model is still a subject of research, this is mostly to do with
* enabling the right collection of compiler optimisations. Since we only want to
* think about LLVM semantics after optimisation, the concrete model is likely to
* be sufficient. *)
open HolKernel boolLib bossLib Parse;
open arithmeticTheory listTheory rich_listTheory pairTheory;
open logrootTheory numposrepTheory wordsTheory pred_setTheory finite_mapTheory;
open settingsTheory miscTheory;
new_theory "memory_model";
numLib.prefer_num ();
(* Heap addresses *)
Datatype:
addr = A num
End
(* Values that fit in registers *)
Datatype:
reg_v =
| FlatV 'a
| AggV (reg_v list)
End
(* An interval of allocated memory.
* Args: whether it's freeable, the starting address (inclusive), and the ending address
* (exclusive)
*)
Datatype:
interval = Interval bool num num
End
Datatype:
heap = <| memory : addr |-> 'a # word8;
allocations : interval set;
valid_addresses : addr set|>
End
(* shapes statically describe the shape of a value in a register. Flat shapes
* take a given number of bytes, Array shapes are replicated a certain number of
* times
*)
Datatype:
shape =
| Flat num 'a
| Array shape num
| Tuple (shape list)
End
(* Does a value have a given shape. The function argument answers the question
* for flat values/shapes.
* We use mutual recursion instead of list_rel to work around a HOL bug. *)
Definition value_shape_def:
(value_shape f (Flat n t) (FlatV x) f n t x)
(value_shape f (Array s n) (AggV vs)
every (value_shape f s) vs length vs = n)
(value_shape f (Tuple ss) (AggV vs)
value_shapes f ss vs)
(value_shape _ _ _ F)
(value_shapes f [] [] T)
(value_shapes f (s::ss) (v::vs)
value_shape f s v value_shapes f ss vs)
(value_shapes _ _ _ F)
Termination
WF_REL_TAC `measure (\x. case x of | INL (_, x, _) => shape_size (\x.0) x | INR (_, y, _) => shape1_size (\x.0) y)`
End
Theorem value_shapes_list_rel:
∀f ss vs. value_shapes f ss vs list_rel (value_shape f) ss vs
Proof
Induct_on `ss` >> Cases_on `vs` >> rw [value_shape_def]
QED
Theorem value_shape_cases:
∀f s v.
value_shape f s v
(∃n t x. s = Flat n t v = FlatV x f n t x)
(∃s2 n vs. s = Array s2 n v = AggV vs
every (value_shape f s2) vs length vs = n)
(∃ss vs. s = Tuple ss v = AggV vs value_shapes f ss vs)
Proof
rw [] >>
Cases_on `s` >> Cases_on `v` >> rw [value_shape_def] >> metis_tac []
QED
Definition sizeof_def:
(sizeof (Flat n t) = n)
(sizeof (Array s n) = n * sizeof s)
(sizeof (Tuple ss) = sum (map sizeof ss))
Termination
WF_REL_TAC `measure (shape_size (\x.0))` >> rw [] >>
Induct_on `ss` >> rw [definition "shape_size_def"] >>
res_tac >> decide_tac
End
Definition interval_to_set_def:
interval_to_set (Interval _ start stop) =
{ n | start n n < stop }
End
Definition interval_ok_def:
interval_ok (Interval b i1 i2) valid_addresses
i1 i2 image A (interval_to_set (Interval b i1 i2)) valid_addresses
End
Definition interval_freeable_def:
interval_freeable (Interval b _ _) b
End
Definition is_allocated_def:
is_allocated b1 h
interval_ok b1 h.valid_addresses
∃b2. b2 h.allocations (interval_freeable b1 interval_freeable b2)
interval_to_set b1 interval_to_set b2
End
Definition is_free_def:
is_free b1 h
interval_ok b1 h.valid_addresses
∀b2. b2 h.allocations interval_to_set b1 interval_to_set b2 =
End
(* The allocations are of intervals that don't overlap *)
Definition allocations_ok_def:
allocations_ok h
∀i1 i2.
i1 h.allocations i2 h.allocations
interval_ok i1 h.valid_addresses interval_ok i2 h.valid_addresses
(interval_to_set i1 interval_to_set i2 i1 = i2)
End
(* The heap maps exactly the address in the allocations *)
Definition heap_ok_def:
heap_ok h
allocations_ok h
∀n. flookup h.memory (A n) None ∃i. i h.allocations n interval_to_set i
End
Definition get_bytes_def:
get_bytes h (Interval _ start stop) =
map
(λoff.
case flookup h.memory (A (start + off)) of
| None => (F, 0w)
| Some w => w)
(count_list (stop - start))
End
Definition set_bytes_def:
(set_bytes p [] n h = h)
(set_bytes p (b::bs) n h =
set_bytes p bs (Suc n) (h with memory := h.memory |+ (A n, (p, b))))
End
(* Allocate a free chunk of memory, and write non-deterministic bytes into it *)
Inductive allocate:
b = Interval T p (p + size)
is_free b h
length bytes = size
allocate h size tag (w, set_bytes tag bytes p
<| memory := h.memory;
allocations := { b } h.allocations;
valid_addresses := h.valid_addresses |>)
End
Definition deallocate_def:
deallocate addrs h =
let to_remove = { Interval T n stop | A n set addrs Interval T n stop h.allocations } in
<| memory := fdiff h.memory (image A (bigunion (image interval_to_set to_remove)));
allocations := h.allocations DIFF to_remove;
valid_addresses := h.valid_addresses |>
End
(* Read len bytes from the list of bytes, and convert it into a word value,
* little-endian encoding *)
Definition le_read_w_def:
le_read_w len (bs : word8 list) =
if length bs < len then
(l2w 256 (map w2n bs), [])
else
(l2w 256 (map w2n (take len bs)), drop len bs)
End
(* Return len bytes that are the little-endian encoding of the argument word *)
Definition le_write_w_def:
le_write_w len w =
let (l : word8 list) = map n2w (w2l 256 w) in
take len (l ++ replicate (len - length l) 0w)
End
(* Read a from a list of bytes bs to build a register value described by a
* shape. The function f is applied to the word read from a flat list of bytes
* in little-endian order. *)
Definition bytes_to_value_def:
(bytes_to_value f (Flat n t) bs = (FlatV o f n t ## I) (le_read_w n bs))
(bytes_to_value f (Array s n) bs = (AggV ## I) (read_array f n s bs))
(bytes_to_value f (Tuple ts) bs = (AggV ## I) (read_str f ts bs))
(read_array f 0 s bs = ([], bs))
(read_array f (Suc n) s bs =
let (v, bs) = bytes_to_value f s bs in
let (rest, bs) = read_array f n s bs in
(v::rest, bs))
(read_str f [] bs = ([], bs))
(read_str f (s::ss) bs =
let (v, bs) = bytes_to_value f s bs in
let (rest, bs) = read_str f ss bs in
(v::rest, bs))
Termination
WF_REL_TAC `measure (λx. case x of
| INL (_, t, bs) => shape_size (\x.0) t
| INR (INL (_, n, t, bs)) => n + shape_size (\x.0) t
| INR (INR (_, ts, bs)) => shape1_size (\x.0) ts)`
End
(* Convert the given value to a list of bytes, the function gives the size, and
* a machine word for a flat value *)
Definition value_to_bytes_def:
(value_to_bytes f (FlatV x) =
let (size, word) = f x in
le_write_w size word)
(value_to_bytes f (AggV vs) = flat (map (value_to_bytes f) vs))
Termination
WF_REL_TAC `measure (reg_v_size (\x. 0) o snd)` >>
Induct >> rw [definition "reg_v_size_def"] >>
TRY (first_x_assum drule) >>
decide_tac
End
(* ----- Theorems about converting between values and byte lists ----- *)
Theorem le_write_w_length:
∀l x. length (le_write_w l w) = l
Proof
rw [le_write_w_def]
QED
Theorem v2b_size_lem:
(∀(f:num->'a->'b->bool) s v. (∀n t x. f n t x fst (g x) = n) value_shape f s v length (value_to_bytes g v) = sizeof s)
(∀(f:num->'a->'b->bool) ss vs. (∀n t x. f n t x fst (g x) = n) value_shapes f ss vs sum (map (length o value_to_bytes g) vs) = sum (map sizeof ss))
Proof
ho_match_mp_tac value_shape_ind >>
rw [value_to_bytes_def, sizeof_def, value_shape_def]
>- (
pairarg_tac >> simp [] >>
metis_tac [FST, le_write_w_length])
>- (
simp [LENGTH_FLAT, MAP_MAP_o, combinTheory.o_DEF] >>
Induct_on `vs` >> rw [ADD1] >> fs [LEFT_ADD_DISTRIB] >>
metis_tac [])
>- (fs [LENGTH_FLAT, ETA_THM, MAP_MAP_o, combinTheory.o_DEF] >> metis_tac [])
>- metis_tac [ADD_COMM]
QED
Theorem v2b_size:
∀f s v g. (∀n t x. f n t x fst (g x) = n) value_shape f s v length (value_to_bytes g v) = sizeof s
Proof
metis_tac [v2b_size_lem]
QED
Theorem b2v_size_lem:
(∀(f:num->'c ->'a word -> 'b) s bs. sizeof s length bs
∃v. bytes_to_value f s bs = (v, drop (sizeof s) bs))
(∀(f:num->'c ->'a word -> 'b) n s bs. n * sizeof s length bs
∃vs. read_array f n s bs = (vs, drop (n * sizeof s) bs))
(∀(f:num->'c ->'a word -> 'b) ss bs. sum (map sizeof ss) length bs
∃vs. read_str f ss bs = (vs, drop (sum (map sizeof ss)) bs))
Proof
ho_match_mp_tac bytes_to_value_ind >>
rw [sizeof_def, bytes_to_value_def, le_read_w_def] >>
fs []
>- (simp [PAIR_MAP] >> metis_tac [SND])
>- (
pairarg_tac >> rw [] >> pairarg_tac >> rw [] >>
fs [ADD1] >> rw [] >> fs [DROP_DROP_T, LEFT_ADD_DISTRIB])
>- fs [DROP_DROP_T, LEFT_ADD_DISTRIB]
QED
Theorem b2v_size:
∀f s bs. sizeof s length bs
∃v. bytes_to_value f s bs = (v, drop (sizeof s) bs)
Proof
metis_tac [b2v_size_lem]
QED
Theorem b2v_smaller:
∀f s bs. sizeof s length bs
length (snd (bytes_to_value f s bs)) = length bs - sizeof s
Proof
rw [] >> imp_res_tac b2v_size >>
Cases_on `bytes_to_value f s bs` >> fs [] >>
first_x_assum (qspec_then `f` mp_tac) >> rw []
QED
Theorem b2v_append_lem:
(∀(f:num->'c->'a word -> 'b) s bs. sizeof s length bs
bytes_to_value f s (bs ++ bs') = (I ## (λx. x ++ bs')) (bytes_to_value f s bs))
(∀(f:num->'c->'a word -> 'b) n s bs. n * sizeof s length bs
∃vs. read_array f n s (bs ++ bs') = (I ## (λx. x ++ bs')) (read_array f n s bs))
(∀(f:num->'c->'a word -> 'b) ss bs. sum (map sizeof ss) length bs
∃vs. read_str f ss (bs ++ bs') = (I ## (λx. x ++ bs')) (read_str f ss bs))
Proof
ho_match_mp_tac bytes_to_value_ind >>
rw [sizeof_def, bytes_to_value_def, le_read_w_def] >>
fs [TAKE_APPEND, DROP_APPEND,
DECIDE ``!x y. x y x - y = 0n``, ETA_THM]
>- (simp [PAIR_MAP] >> metis_tac [SND])
>- (simp [PAIR_MAP] >> metis_tac [SND])
>- (
rpt (pairarg_tac >> simp []) >> fs [ADD1] >>
BasicProvers.VAR_EQ_TAC >> fs [LEFT_ADD_DISTRIB] >>
first_x_assum irule >>
`sizeof s length bs` by decide_tac >>
qspec_then `f` drule b2v_smaller >>
disch_then (qspec_then `f` mp_tac) >>
rw [])
>- (
rpt (pairarg_tac >> simp []) >> fs [ADD1] >>
BasicProvers.VAR_EQ_TAC >> fs [LEFT_ADD_DISTRIB] >>
first_x_assum irule >>
`sizeof s length bs` by decide_tac >>
qspec_then `f` drule b2v_smaller >>
disch_then (qspec_then `f` mp_tac) >>
rw [])
QED
Theorem b2v_append:
∀f s bs bs'. sizeof s length bs
bytes_to_value f s (bs ++ bs') = (I ## (λx. x ++ bs')) (bytes_to_value f s bs)
Proof
metis_tac [b2v_append_lem]
QED
Theorem le_read_write:
∀n w bs.
w2n w < 256 ** n le_read_w n (le_write_w n w bs) = (w, bs)
Proof
rw [le_read_w_def, le_write_w_length]
>- (
`take n (le_write_w n w bs) = le_write_w n w`
by metis_tac [le_write_w_length, TAKE_LENGTH_APPEND] >>
simp [le_write_w_def, w2l_def, l2w_def] >>
Cases_on `w` >> simp [] >> fs [l2n_padding, TAKE_APPEND, take_replicate] >>
simp [MAP_TAKE, MAP_MAP_o, combinTheory.o_DEF, mod_n2l] >>
rename1 `n2l 256 m` >>
Cases_on `n = 0` >> fs [] >>
`length (n2l 256 m) n`
by (
rw [LENGTH_n2l] >>
`256 = 2 ** 8` by EVAL_TAC >>
ASM_REWRITE_TAC [] >> simp [log_change_base_power, GSYM LESS_EQ] >>
`n2w m 0w` by simp [] >>
rw [] >> fs [bitTheory.LOG2_def, dimword_def] >>
`8 * (log 2 m DIV 8) log 2 m` by metis_tac [mul_div_bound, EVAL ``8 0n``] >>
`LOG 2 m LOG 2 (256 ** n)` by simp [LOG_LE_MONO] >>
pop_assum mp_tac >>
`256 = 2 ** 8` by EVAL_TAC >>
ASM_REWRITE_TAC [EXP_MUL] >> simp [log_base_power] >>
Cases_on `log 2 m DIV 8 = n` >> rw [] >>
CCONTR_TAC >> fs [] >>
`log 2 m = (8 * (log 2 m DIV 8))` by intLib.COOPER_TAC >> fs [] >>
`2 ** log 2 m = 2 ** (8 * (log 2 m DIV 8))` by rw [] >>
fs [EXP_EXP_MULT] >>
`2 ** log 2 m m` by rw [exp_log_bound] >>
decide_tac) >>
simp [mod_n2l, l2n_n2l, TAKE_LENGTH_TOO_LONG])
>- metis_tac [le_write_w_length, DROP_LENGTH_APPEND]
QED
Theorem le_write_read:
∀n w bs bs'.
256 ** n dimword (:'a)
n length bs
le_read_w n bs = (w:'a word, bs')
le_write_w n w ++ bs' = bs
Proof
rw [le_read_w_def] >>
qmatch_goalsub_abbrev_tac `l2w _ l` >>
`le_write_w n (l2w 256 l) = take n bs` suffices_by metis_tac [TAKE_DROP] >>
simp [le_write_w_def, w2l_l2w] >>
`l2n 256 l < 256 ** n`
by (
`n length bs` by decide_tac >>
metis_tac [l2n_lt, LENGTH_TAKE, LENGTH_MAP, EVAL ``0n < 256``]) >>
fs [] >>
`every ($> 256) l`
by (
simp [EVERY_MAP, Abbr `l`] >> irule EVERY_TAKE >> simp [] >>
rpt (pop_assum kall_tac) >>
Induct_on `bs` >> rw [] >>
Cases_on `h` >> fs []) >>
rw [n2l_l2n]
>- (
rw [TAKE_def, take_replicate] >>
Cases_on `n` >> fs [] >>
rfs [l2n_0] >> unabbrev_all_tac >> fs [EVERY_MAP] >>
ONCE_REWRITE_TAC [GSYM REPLICATE] >>
qmatch_goalsub_abbrev_tac `take n _` >>
qpat_assum `¬(_ < _)` mp_tac >>
qpat_assum `every (\x. 0 = w2n x) _` mp_tac >>
rpt (pop_assum kall_tac) >>
qid_spec_tac `bs` >>
Induct_on `n` >> rw [] >>
Cases_on `bs` >> rw [] >> fs [] >>
Cases_on `h` >> fs [] >>
first_x_assum irule >> rw [] >>
irule MONO_EVERY >>
qexists_tac `(λx. 0 = w2n x)` >> rw []) >>
fs [MAP_TAKE, MAP_MAP_o, combinTheory.o_DEF] >>
`exists (\y. 0 y) l`
by (
fs [l2n_eq_0, combinTheory.o_DEF] >> fs [EXISTS_MEM, EVERY_MEM] >>
qexists_tac `x` >> rfs [MOD_MOD, GREATER_DEF]) >>
simp [LOG_l2n_dropWhile] >>
`length (dropWhile ($= 0) (reverse l)) 0`
by (
Cases_on `l` >> fs [dropWhile_eq_nil, combinTheory.o_DEF, EXISTS_REVERSE]) >>
`0 < length (dropWhile ($= 0) (reverse l))` by decide_tac >>
fs [SUC_PRE] >>
`map n2w l = take n bs`
by (simp [Abbr `l`, MAP_TAKE, MAP_MAP_o, combinTheory.o_DEF, n2w_w2n]) >>
simp [TAKE_TAKE_MIN] >>
`length l = n` by simp [Abbr `l`] >>
`length (dropWhile ($= 0) (reverse l)) n`
by metis_tac [LESS_EQ_TRANS, LENGTH_dropWhile_LESS_EQ, LENGTH_REVERSE] >>
rw [MIN_DEF] >> fs []
>- (
simp [TAKE_APPEND, TAKE_TAKE_MIN, MIN_DEF, take_replicate] >>
`replicate (length l length (dropWhile ($= 0) (reverse l))) 0w =
take (length l (length (dropWhile ($= 0) (reverse l)))) (drop (length (dropWhile ($= 0) (reverse l))) bs)`
suffices_by (rw [] >> irule take_drop_partition >> simp []) >>
rw [LIST_EQ_REWRITE, EL_REPLICATE, EL_TAKE, EL_DROP] >>
`length (dropWhile ($= 0) (reverse l)) =
length (dropWhile (λx. 0 = w2n x) (reverse (take (length l) bs)))`
by (
`reverse l = reverse (take (length l) (map w2n bs))` by metis_tac [] >>
ONCE_ASM_REWRITE_TAC [] >>
qpat_x_assum `Abbrev (l = _)` kall_tac >>
simp [GSYM MAP_TAKE, GSYM MAP_REVERSE, dropWhile_map, combinTheory.o_DEF]) >>
fs [] >>
`x + length (dropWhile (λx. 0 = w2n x) (reverse (take (length l) bs))) < length l` by decide_tac >>
drule (SIMP_RULE std_ss [LET_THM] dropWhile_rev_take) >>
rw [] >>
REWRITE_TAC [GSYM w2n_11, word_0_n2w] >>
simp [])
>- rw [TAKE_APPEND, TAKE_TAKE]
QED
Theorem b2v_v2b_lem:
(∀f s v.
value_shape f s v
(∀x t n. f n t x fst (h x) = n g n t (snd (h x)) = x w2n (snd (h x)) < 256 ** n)
∀bs.
bytes_to_value (g:num -> 'c -> 'a word -> 'b) s (value_to_bytes h v ++ bs) = (v, bs))
(∀f ss vs.
value_shapes f ss vs
(∀x t n. f n t x fst (h x) = n g n t (snd (h x)) = x w2n (snd (h x)) < 256 ** n)
∀bs.
read_str (g:num -> 'c -> 'a word -> 'b) ss (flat (map (value_to_bytes h) vs) ++ bs) = (vs, bs))
Proof
ho_match_mp_tac value_shape_ind >> rw [value_shape_def] >>
fs [bytes_to_value_def, value_to_bytes_def] >> rw []
>- (
pairarg_tac >> fs [] >>
first_x_assum drule >> simp [] >> rw [] >>
simp [le_read_write])
>- (
qmatch_abbrev_tac `_ x = _` >>
`x = (vs, bs)` suffices_by (simp [PAIR_MAP] >> metis_tac [PAIR_EQ, FST, SND]) >>
unabbrev_all_tac >>
qid_spec_tac `bs` >> Induct_on `vs` >> simp [bytes_to_value_def] >>
rw [] >> fs [definition "reg_v_size_def"] >>
pairarg_tac >> fs [] >>
pairarg_tac >> fs [] >>
rename1 `value_shape _ s v1` >>
qpat_x_assum `_ !bs. P bs` mp_tac >> impl_tac >> simp [] >>
metis_tac [APPEND_ASSOC, PAIR_EQ])
>- (
qmatch_abbrev_tac `_ x = _` >>
`x = (vs, bs)` suffices_by (simp [PAIR_MAP] >> metis_tac [PAIR_EQ, FST, SND]) >>
metis_tac [])
>- (
pairarg_tac >> fs [] >>
pairarg_tac >> fs [] >>
metis_tac [APPEND_ASSOC, PAIR_EQ])
QED
Theorem b2v_v2b:
∀f g h s v bs.
value_shape f s v
(∀x n t. f n t x fst (h x) = n g n t (snd (h x)) = x w2n (snd (h x)) < 256 ** n)
bytes_to_value g s (value_to_bytes h v ++ bs) = (v, bs)
Proof
metis_tac [b2v_v2b_lem]
QED
Theorem flookup_set_bytes:
∀tag bytes n h n'.
flookup ((set_bytes tag bytes n h).memory) (A n') =
if n n' n' < n + length bytes then
Some (tag, el (n' - n) bytes)
else
flookup h.memory (A n')
Proof
Induct_on `bytes` >> rw [set_bytes_def, EL_CONS, PRE_SUB1] >>
fs [ADD1, FLOOKUP_UPDATE] >>
`n = n'` by decide_tac >>
rw []
QED
Theorem set_bytes_unchanged:
∀t bs p h. (set_bytes t bs p h).valid_addresses = h.valid_addresses
(set_bytes t bs p h).allocations = h.allocations
Proof
Induct_on `bs` >> rw [set_bytes_def]
QED
Theorem allocate_unchanged:
∀h1 v1 t h2 v2.
allocate h1 v1 t (v2, h2)
h1.valid_addresses = h2.valid_addresses
h1.allocations h2.allocations
Proof
rw [allocate_cases] >> rw [set_bytes_unchanged]
QED
Theorem allocate_heap_ok:
∀h1 v1 t v2 h2. heap_ok h1 allocate h1 v1 t (v2,h2) heap_ok h2
Proof
rw [allocate_cases, heap_ok_def]
>- (
fs [allocations_ok_def] >> rpt gen_tac >> disch_tac >> fs [is_free_def] >> rw [] >>
fs [set_bytes_unchanged] >> metis_tac [INTER_COMM])
>- (
rw [flookup_set_bytes, set_bytes_unchanged]
>- rw [RIGHT_AND_OVER_OR, EXISTS_OR_THM, interval_to_set_def] >>
eq_tac >> rw [] >> fs [interval_to_set_def] >>
metis_tac [])
QED
Theorem set_bytes_heap_ok:
∀h tag bytes n b.
heap_ok h is_allocated (Interval b n (n + length bytes)) h
heap_ok (set_bytes tag bytes n h)
Proof
rw [heap_ok_def]
>- (fs [allocations_ok_def] >> rw [set_bytes_unchanged] >> metis_tac [])
>- (
fs [flookup_set_bytes, set_bytes_unchanged] >> rw [] >>
fs [is_allocated_def, interval_to_set_def, SUBSET_DEF] >>
metis_tac [LESS_EQ_REFL, DECIDE ``!x y. x < x + SUC y``])
QED
export_theory ();

@ -0,0 +1,172 @@
(*
* Copyright (c) Facebook, Inc. and its affiliates.
*
* This source code is licensed under the MIT license found in the
* LICENSE file in the root directory of this source tree.
*)
(* Misc. theorems that aren't specific to the semantics of LLVM or Sledge. These
* could be upstreamed to HOL, and should eventually. *)
open HolKernel boolLib bossLib Parse;
open listTheory rich_listTheory arithmeticTheory wordsTheory;
open finite_mapTheory open logrootTheory numposrepTheory;
open settingsTheory;
new_theory "misc";
numLib.prefer_num ();
(* ----- Theorems about list library functions ----- *)
Theorem dropWhile_map:
∀P f l. dropWhile P (map f l) = map f (dropWhile (P o f) l)
Proof
Induct_on `l` >> rw []
QED
Theorem dropWhile_prop:
∀P l x. x < length l - length (dropWhile P l) P (el x l)
Proof
Induct_on `l` >> rw [] >>
Cases_on `x` >> fs []
QED
Theorem dropWhile_rev_take:
∀P n l x.
let len = length (dropWhile P (reverse (take n l))) in
x + len < n n length l P (el (x + len) l)
Proof
rw [] >>
`P (el ((n - 1 - x - length (dropWhile P (reverse (take n l))))) (reverse (take n l)))`
by (irule dropWhile_prop >> simp [LENGTH_REVERSE]) >>
rfs [EL_REVERSE, EL_TAKE, PRE_SUB1]
QED
Theorem take_replicate:
∀m n x. take m (replicate n x) = replicate (min m n) x
Proof
Induct_on `n` >> rw [TAKE_def, MIN_DEF] >> fs [] >>
Cases_on `m` >> rw []
QED
Theorem length_take_less_eq:
∀n l. length (take n l) n
Proof
Induct_on `l` >> rw [TAKE_def] >>
Cases_on `n` >> fs []
QED
Theorem flat_drop:
∀n m ls. flat (drop m ls) = drop (length (flat (take m ls))) (flat ls)
Proof
Induct_on `ls` >> rw [DROP_def, DROP_APPEND] >>
irule (GSYM DROP_LENGTH_TOO_LONG) >> simp []
QED
Theorem take_is_prefix:
∀n l. take n l l
Proof
Induct_on `l` >> rw [TAKE_def]
QED
Theorem sum_prefix:
∀l1 l2. l1 l2 sum l1 sum l2
Proof
Induct >> rw [] >> Cases_on `l2` >> fs []
QED
Theorem flookup_fdiff:
∀m s k.
flookup (fdiff m s) k =
if k s then None else flookup m k
Proof
rw [FDIFF_def, FLOOKUP_DRESTRICT] >> fs []
QED
(* ----- Theorems about log ----- *)
Theorem mul_div_bound:
∀m n. n 0 m - (n - 1) n * (m DIV n) n * (m DIV n) m
Proof
rw [] >>
`0 < n` by decide_tac >>
drule DIVISION >> disch_then (qspec_then `m` mp_tac) >>
decide_tac
QED
Theorem exp_log_bound:
∀b n. 1 < b n 0 n DIV b + 1 b ** (log b n) b ** (log b n) n
Proof
rw [] >> `0 < n` by decide_tac >>
drule LOG >> disch_then drule >> rw [] >>
fs [ADD1, EXP_ADD] >>
simp [DECIDE ``∀x y. x + 1 y x < y``] >>
`∃x. b = Suc x` by intLib.COOPER_TAC >>
`b * (n DIV b) < b * b ** log b n` suffices_by metis_tac [LESS_MULT_MONO] >>
pop_assum kall_tac >>
`b 0` by decide_tac >>
drule mul_div_bound >> disch_then (qspec_then `n` mp_tac) >>
decide_tac
QED
Theorem log_base_power:
∀n b. 1 < b log b (b ** n) = n
Proof
Induct >> rw [EXP, LOG_1] >>
Cases_on `n` >> rw [LOG_BASE] >>
first_x_assum drule >> rw [] >>
simp [Once EXP, LOG_MULT]
QED
Theorem log_change_base_power:
∀m n b. 1 < b m 0 n 0 log (b ** n) m = log b m DIV n
Proof
rw [] >> irule LOG_UNIQUE >>
rw [ADD1, EXP_MUL, LEFT_ADD_DISTRIB] >>
qmatch_goalsub_abbrev_tac `x DIV _` >>
drule mul_div_bound >> disch_then (qspec_then `x` mp_tac) >> rw []
>- (
irule LESS_LESS_EQ_TRANS >>
qexists_tac `b ** (x+1)` >> rw [] >>
unabbrev_all_tac >>
simp [EXP_ADD] >>
`b * (m DIV b + 1) b * b ** log b m`
by metis_tac [exp_log_bound, LESS_MONO_MULT, MULT_COMM] >>
`m < b * (m DIV b + 1)` suffices_by decide_tac >>
simp [LEFT_ADD_DISTRIB] >>
`b 0` by decide_tac >>
`m - (b - 1) b * (m DIV b)` by metis_tac [mul_div_bound] >>
fs [])
>- (
irule LESS_EQ_TRANS >>
qexists_tac `b ** (log b m)` >> rw [] >>
unabbrev_all_tac >>
metis_tac [exp_log_bound])
QED
(* ----- Theorems about word stuff ----- *)
Theorem l2n_padding:
∀ws n. l2n 256 (ws ++ map w2n (replicate n 0w)) = l2n 256 ws
Proof
Induct >> rw [l2n_def] >>
Induct_on `n` >> rw [l2n_def]
QED
Theorem l2n_0:
∀l b. b 0 every ($> b) l (l2n b l = 0 every ($= 0) l)
Proof
Induct >> rw [l2n_def] >>
eq_tac >> rw []
QED
Theorem mod_n2l:
∀d n. 0 < d map (\x. x MOD d) (n2l d n) = n2l d n
Proof
rw [] >> drule n2l_BOUND >> disch_then (qspec_then `n` mp_tac) >>
qspec_tac (`n2l d n`, `l`) >>
Induct >> rw []
QED
export_theory ();
Loading…
Cancel
Save