annotate src/especialize.sml @ 1077:a3273bee05a9

Initial generalization of Especialize, with security bug known
author Adam Chlipala <adamc@hcoop.net>
date Tue, 15 Dec 2009 12:26:00 -0500
parents 066493f7f008
children b9321bcefb42
rev   line source
adamc@443 1 (* Copyright (c) 2008, Adam Chlipala
adamc@443 2 * All rights reserved.
adamc@443 3 *
adamc@443 4 * Redistribution and use in source and binary forms, with or without
adamc@443 5 * modification, are permitted provided that the following conditions are met:
adamc@443 6 *
adamc@443 7 * - Redistributions of source code must retain the above copyright notice,
adamc@443 8 * this list of conditions and the following disclaimer.
adamc@443 9 * - Redistributions in binary form must reproduce the above copyright notice,
adamc@443 10 * this list of conditions and the following disclaimer in the documentation
adamc@443 11 * and/or other materials provided with the distribution.
adamc@443 12 * - The names of contributors may not be used to endorse or promote products
adamc@443 13 * derived from this software without specific prior written permission.
adamc@443 14 *
adamc@443 15 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
adamc@443 16 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
adamc@443 17 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
adamc@443 18 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
adamc@443 19 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
adamc@443 20 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
adamc@443 21 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
adamc@443 22 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
adamc@443 23 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
adamc@443 24 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
adamc@443 25 * POSSIBILITY OF SUCH DAMAGE.
adamc@443 26 *)
adamc@443 27
adamc@443 28 structure ESpecialize :> ESPECIALIZE = struct
adamc@443 29
adamc@443 30 open Core
adamc@443 31
adamc@443 32 structure E = CoreEnv
adamc@443 33 structure U = CoreUtil
adamc@443 34
adamc@479 35 type skey = exp
adamc@453 36
adamc@453 37 structure K = struct
adamc@479 38 type ord_key = exp list
adamc@479 39 val compare = Order.joinL U.Exp.compare
adamc@443 40 end
adamc@443 41
adamc@453 42 structure KM = BinaryMapFn(K)
adamc@443 43 structure IM = IntBinaryMap
adamc@482 44 structure IS = IntBinarySet
adamc@443 45
adamc@626 46 val freeVars = U.Exp.foldB {kind = fn (_, _, xs) => xs,
adamc@488 47 con = fn (_, _, xs) => xs,
adamc@488 48 exp = fn (bound, e, xs) =>
adamc@488 49 case e of
adamc@488 50 ERel x =>
adamc@488 51 if x >= bound then
adamc@488 52 IS.add (xs, x - bound)
adamc@488 53 else
adamc@488 54 xs
adamc@488 55 | _ => xs,
adamc@488 56 bind = fn (bound, b) =>
adamc@488 57 case b of
adamc@488 58 U.Exp.RelE _ => bound + 1
adamc@488 59 | _ => bound}
adamc@488 60 0 IS.empty
adamc@479 61
adamc@522 62 val isPoly = U.Decl.exists {kind = fn _ => false,
adamc@522 63 con = fn _ => false,
adamc@522 64 exp = fn ECAbs _ => true
adamc@522 65 | _ => false,
adamc@522 66 decl = fn _ => false}
adamc@522 67
adamc@488 68 fun positionOf (v : int, ls) =
adamc@488 69 let
adamc@488 70 fun pof (pos, ls) =
adamc@488 71 case ls of
adamc@488 72 [] => raise Fail "Defunc.positionOf"
adamc@488 73 | v' :: ls' =>
adamc@488 74 if v = v' then
adamc@488 75 pos
adamc@488 76 else
adamc@488 77 pof (pos + 1, ls')
adamc@488 78 in
adamc@488 79 pof (0, ls)
adamc@488 80 end
adamc@488 81
adamc@1077 82 fun squish (untouched, fvs) =
adamc@626 83 U.Exp.mapB {kind = fn _ => fn k => k,
adamc@488 84 con = fn _ => fn c => c,
adamc@488 85 exp = fn bound => fn e =>
adamc@479 86 case e of
adamc@488 87 ERel x =>
adamc@488 88 if x >= bound then
adamc@1077 89 ERel (positionOf (x - bound, fvs) + bound + untouched)
adamc@488 90 else
adamc@488 91 e
adamc@488 92 | _ => e,
adamc@488 93 bind = fn (bound, b) =>
adamc@488 94 case b of
adamc@488 95 U.Exp.RelE _ => bound + 1
adamc@488 96 | _ => bound}
adamc@488 97 0
adamc@453 98
adamc@443 99 type func = {
adamc@443 100 name : string,
adamc@453 101 args : int KM.map,
adamc@443 102 body : exp,
adamc@443 103 typ : con,
adamc@443 104 tag : string
adamc@443 105 }
adamc@443 106
adamc@443 107 type state = {
adamc@443 108 maxName : int,
adamc@443 109 funcs : func IM.map,
adamc@443 110 decls : (string * int * con * exp * string) list
adamc@443 111 }
adamc@443 112
adamc@488 113 fun default (_, x, st) = (x, st)
adamc@443 114
adamc@800 115 structure SS = BinarySetFn(struct
adamc@800 116 type ord_key = string
adamc@800 117 val compare = String.compare
adamc@800 118 end)
adamc@800 119
adamc@800 120 val mayNotSpec = ref SS.empty
adamc@800 121
adamc@453 122 fun specialize' file =
adamc@443 123 let
adamc@488 124 fun bind (env, b) =
adamc@488 125 case b of
adamc@521 126 U.Decl.RelE xt => xt :: env
adamc@521 127 | _ => env
adamc@488 128
adamc@488 129 fun exp (env, e, st : state) =
adamc@482 130 let
adamc@721 131 (*val () = Print.prefaces "exp" [("e", CorePrint.p_exp CoreEnv.empty
adamc@721 132 (e, ErrorMsg.dummySpan))]*)
adamc@721 133
adamc@488 134 fun getApp e =
adamc@482 135 case e of
adamc@488 136 ENamed f => SOME (f, [])
adamc@482 137 | EApp (e1, e2) =>
adamc@488 138 (case getApp (#1 e1) of
adamc@482 139 NONE => NONE
adamc@488 140 | SOME (f, xs) => SOME (f, xs @ [e2]))
adamc@482 141 | _ => NONE
adamc@482 142 in
adamc@482 143 case getApp e of
adamc@721 144 NONE => ((*Print.prefaces "No" [("e", CorePrint.p_exp CoreEnv.empty
adamc@721 145 (e, ErrorMsg.dummySpan))];*)
adamc@721 146 (e, st))
adamc@488 147 | SOME (f, xs) =>
adamc@485 148 case IM.find (#funcs st, f) of
adamc@485 149 NONE => (e, st)
adamc@485 150 | SOME {name, args, body, typ, tag} =>
adamc@488 151 let
adamc@721 152 (*val () = Print.prefaces "Consider" [("e", CorePrint.p_exp CoreEnv.empty
adamc@721 153 (e, ErrorMsg.dummySpan))]*)
adamc@721 154
adamc@488 155 val functionInside = U.Con.exists {kind = fn _ => false,
adamc@488 156 con = fn TFun _ => true
adamc@488 157 | CFfi ("Basis", "transaction") => true
adamc@794 158 | CFfi ("Basis", "eq") => true
adamc@794 159 | CFfi ("Basis", "num") => true
adamc@794 160 | CFfi ("Basis", "ord") => true
adamc@794 161 | CFfi ("Basis", "show") => true
adamc@794 162 | CFfi ("Basis", "read") => true
adamc@794 163 | CFfi ("Basis", "sql_injectable_prim") => true
adamc@794 164 | CFfi ("Basis", "sql_injectable") => true
adamc@488 165 | _ => false}
adamc@488 166 val loc = ErrorMsg.dummySpan
adamc@488 167
adamc@1077 168 fun findSplit (xs, typ, fxs, fvs, ts) =
adamc@488 169 case (#1 typ, xs) of
adamc@488 170 (TFun (dom, ran), e :: xs') =>
adamc@488 171 if functionInside dom then
adamc@488 172 findSplit (xs',
adamc@488 173 ran,
adamc@1077 174 (true, e) :: fxs,
adamc@1077 175 IS.union (fvs, freeVars e),
adamc@1077 176 ts)
adamc@488 177 else
adamc@1077 178 findSplit (xs', ran, (false, e) :: fxs, fvs, dom :: ts)
adamc@1077 179 | _ => (List.revAppend (fxs, map (fn e => (false, e)) xs), fvs, rev ts)
adamc@488 180
adamc@1077 181 val (xs, fvs, ts) = findSplit (xs, typ, [], IS.empty, [])
adamc@1077 182 val fxs = List.mapPartial (fn (true, e) => SOME e | _ => NONE) xs
adamc@1077 183 val untouched = length (List.filter (fn (false, _) => true | _ => false) xs)
adamc@1077 184 val squish = squish (untouched, IS.listItems fvs)
adamc@1077 185 val fxs' = map squish fxs
adamc@488 186 in
adamc@800 187 (*Print.preface ("fxs'", Print.p_list (CorePrint.p_exp CoreEnv.empty) fxs');*)
adamc@1077 188 if List.all (fn (false, _) => true
adamc@1077 189 | (true, (ERel _, _)) => true
adamc@1077 190 | _ => false) xs then
adamc@488 191 (e, st)
adamc@488 192 else
adamc@800 193 case (KM.find (args, fxs'), SS.member (!mayNotSpec, name)) of
adamc@800 194 (SOME f', _) =>
adamc@485 195 let
adamc@488 196 val e = (ENamed f', loc)
adamc@488 197 val e = IS.foldr (fn (arg, e) => (EApp (e, (ERel arg, loc)), loc))
adamc@488 198 e fvs
adamc@1077 199 val e = foldl (fn ((false, arg), e) => (EApp (e, arg), loc)
adamc@1077 200 | (_, e) => e)
adamc@488 201 e xs
adamc@488 202 in
adamc@488 203 (*Print.prefaces "Brand new (reuse)"
adamc@721 204 [("e'", CorePrint.p_exp CoreEnv.empty e)];*)
adamc@488 205 (#1 e, st)
adamc@488 206 end
adamc@818 207 | (_, true) => ((*Print.prefaces ("No(" ^ name ^ ")")
adamc@818 208 [("fxs'",
adamc@818 209 Print.p_list (CorePrint.p_exp CoreEnv.empty) fxs')];*)
adamc@818 210 (e, st))
adamc@800 211 | (NONE, false) =>
adamc@488 212 let
adamc@800 213 (*val () = Print.prefaces "New one"
adamc@800 214 [("f", Print.PD.string (Int.toString f)),
adamc@800 215 ("mns", Print.p_list Print.PD.string
adamc@800 216 (SS.listItems (!mayNotSpec)))]*)
adamc@800 217
adamc@818 218 (*val () = Print.prefaces ("Yes(" ^ name ^ ")")
adamc@818 219 [("fxs'",
adamc@818 220 Print.p_list (CorePrint.p_exp CoreEnv.empty) fxs')]*)
adamc@818 221
adamc@1077 222 fun subBody (body, typ, xs) =
adamc@1077 223 case (#1 body, #1 typ, xs) of
adamc@488 224 (_, _, []) => SOME (body, typ)
adamc@1077 225 | (EAbs (_, _, _, body'), TFun (_, typ'), (b, x) :: xs) =>
adamc@488 226 let
adamc@1077 227 val body'' =
adamc@1077 228 if b then
adamc@1077 229 E.subExpInExp (0, squish x) body'
adamc@1077 230 else
adamc@1077 231 body'
adamc@488 232 in
adamc@488 233 subBody (body'',
adamc@488 234 typ',
adamc@1077 235 xs)
adamc@488 236 end
adamc@488 237 | _ => NONE
adamc@488 238 in
adamc@1077 239 case subBody (body, typ, xs) of
adamc@488 240 NONE => (e, st)
adamc@488 241 | SOME (body', typ') =>
adamc@488 242 let
adamc@488 243 val f' = #maxName st
adamc@488 244 val args = KM.insert (args, fxs', f')
adamc@488 245 val funcs = IM.insert (#funcs st, f, {name = name,
adamc@488 246 args = args,
adamc@488 247 body = body,
adamc@488 248 typ = typ,
adamc@488 249 tag = tag})
adamc@488 250 val st = {
adamc@488 251 maxName = f' + 1,
adamc@488 252 funcs = funcs,
adamc@488 253 decls = #decls st
adamc@488 254 }
adamc@487 255
adamc@488 256 (*val () = Print.prefaces "specExp"
adamc@488 257 [("f", CorePrint.p_exp env (ENamed f, loc)),
adamc@488 258 ("f'", CorePrint.p_exp env (ENamed f', loc)),
adamc@488 259 ("xs", Print.p_list (CorePrint.p_exp env) xs),
adamc@488 260 ("fxs'", Print.p_list
adamc@488 261 (CorePrint.p_exp E.empty) fxs'),
adamc@488 262 ("e", CorePrint.p_exp env (e, loc))]*)
adamc@1077 263
adamc@1077 264 val (body', typ') = foldr (fn (t, (body', typ')) =>
adamc@1077 265 ((EAbs ("x", t, typ', body'), loc),
adamc@1077 266 (TFun (t, typ'), loc)))
adamc@1077 267 (body', typ') ts
adamc@1077 268
adamc@488 269 val (body', typ') = IS.foldl (fn (n, (body', typ')) =>
adamc@488 270 let
adamc@521 271 val (x, xt) = List.nth (env, n)
adamc@488 272 in
adamc@488 273 ((EAbs (x, xt, typ', body'),
adamc@488 274 loc),
adamc@488 275 (TFun (xt, typ'), loc))
adamc@488 276 end)
adamc@488 277 (body', typ') fvs
adamc@800 278 val mns = !mayNotSpec
adamc@800 279 val () = mayNotSpec := SS.add (mns, name)
adamc@800 280 (*val () = Print.preface ("body'", CorePrint.p_exp CoreEnv.empty body')*)
adamc@488 281 val (body', st) = specExp env st body'
adamc@800 282 val () = mayNotSpec := mns
adamc@482 283
adamc@488 284 val e' = (ENamed f', loc)
adamc@488 285 val e' = IS.foldr (fn (arg, e) => (EApp (e, (ERel arg, loc)), loc))
adamc@488 286 e' fvs
adamc@1077 287 val e' = foldl (fn ((false, arg), e) => (EApp (e, arg), loc)
adamc@1077 288 | (_, e) => e)
adamc@488 289 e' xs
adamc@488 290 (*val () = Print.prefaces "Brand new"
adamc@721 291 [("e'", CorePrint.p_exp CoreEnv.empty e'),
adamc@721 292 ("e", CorePrint.p_exp CoreEnv.empty (e, loc)),
adamc@721 293 ("body'", CorePrint.p_exp CoreEnv.empty body')]*)
adamc@488 294 in
adamc@488 295 (#1 e',
adamc@488 296 {maxName = #maxName st,
adamc@488 297 funcs = #funcs st,
adamc@488 298 decls = (name, f', typ', body', tag) :: #decls st})
adamc@488 299 end
adamc@485 300 end
adamc@488 301 end
adamc@485 302 end
adamc@482 303
adamc@626 304 and specExp env = U.Exp.foldMapB {kind = default, con = default, exp = exp, bind = bind} env
adamc@482 305
adamc@626 306 val specDecl = U.Decl.foldMapB {kind = default, con = default, exp = exp, decl = default, bind = bind}
adamc@482 307
adamc@521 308 fun doDecl (d, (st : state, changed)) =
adamc@488 309 let
adamc@521 310 (*val befor = Time.now ()*)
adamc@482 311
adamc@453 312 val funcs = #funcs st
adamc@453 313 val funcs =
adamc@453 314 case #1 d of
adamc@453 315 DValRec vis =>
adamc@453 316 foldl (fn ((x, n, c, e, tag), funcs) =>
adamc@453 317 IM.insert (funcs, n, {name = x,
adamc@453 318 args = KM.empty,
adamc@453 319 body = e,
adamc@453 320 typ = c,
adamc@453 321 tag = tag}))
adamc@453 322 funcs vis
adamc@453 323 | _ => funcs
adamc@453 324
adamc@453 325 val st = {maxName = #maxName st,
adamc@453 326 funcs = funcs,
adamc@453 327 decls = []}
adamc@453 328
adamc@482 329 (*val () = Print.prefaces "decl" [("d", CorePrint.p_decl CoreEnv.empty d)]*)
adamc@521 330
adamc@522 331 val (d', st) =
adamc@522 332 if isPoly d then
adamc@522 333 (d, st)
adamc@522 334 else
adamc@800 335 (mayNotSpec := (case #1 d of
adamc@800 336 DValRec vis => foldl (fn ((x, _, _, _, _), mns) =>
adamc@800 337 SS.add (mns, x)) SS.empty vis
adamc@800 338 | DVal (x, _, _, _, _) => SS.singleton x
adamc@800 339 | _ => SS.empty);
adamc@800 340 specDecl [] st d
adamc@800 341 before mayNotSpec := SS.empty)
adamc@521 342
adamc@482 343 (*val () = print "/decl\n"*)
adamc@443 344
adamc@443 345 val funcs = #funcs st
adamc@443 346 val funcs =
adamc@443 347 case #1 d of
adamc@443 348 DVal (x, n, c, e as (EAbs _, _), tag) =>
adamc@443 349 IM.insert (funcs, n, {name = x,
adamc@453 350 args = KM.empty,
adamc@443 351 body = e,
adamc@443 352 typ = c,
adamc@443 353 tag = tag})
adamc@469 354 | DVal (_, n, _, (ENamed n', _), _) =>
adamc@469 355 (case IM.find (funcs, n') of
adamc@469 356 NONE => funcs
adamc@469 357 | SOME v => IM.insert (funcs, n, v))
adamc@443 358 | _ => funcs
adamc@443 359
adamc@453 360 val (changed, ds) =
adamc@443 361 case #decls st of
adamc@453 362 [] => (changed, [d'])
adamc@453 363 | vis =>
adamc@453 364 (true, case d' of
adamc@453 365 (DValRec vis', _) => [(DValRec (vis @ vis'), ErrorMsg.dummySpan)]
adamc@453 366 | _ => [(DValRec vis, ErrorMsg.dummySpan), d'])
adamc@443 367 in
adamc@802 368 (*Print.prefaces "doDecl" [("d", CorePrint.p_decl E.empty d),
adamc@802 369 ("d'", CorePrint.p_decl E.empty d')];*)
adamc@521 370 (ds, ({maxName = #maxName st,
adamc@453 371 funcs = funcs,
adamc@453 372 decls = []}, changed))
adamc@443 373 end
adamc@443 374
adamc@521 375 val (ds, (_, changed)) = ListUtil.foldlMapConcat doDecl
adamc@521 376 ({maxName = U.File.maxName file + 1,
adamc@488 377 funcs = IM.empty,
adamc@488 378 decls = []},
adamc@488 379 false)
adamc@488 380 file
adamc@443 381 in
adamc@453 382 (changed, ds)
adamc@443 383 end
adamc@443 384
adamc@453 385 fun specialize file =
adamc@453 386 let
adamc@721 387 val file = ReduceLocal.reduce file
adamc@721 388 (*val () = Print.prefaces "Intermediate" [("file", CorePrint.p_file CoreEnv.empty file)]*)
adamc@520 389 (*val file = ReduceLocal.reduce file*)
adamc@453 390 val (changed, file) = specialize' file
adamc@520 391 (*val file = ReduceLocal.reduce file
adamc@520 392 val file = CoreUntangle.untangle file
adamc@488 393 val file = Shake.shake file*)
adamc@453 394 in
adamc@488 395 (*print "Round over\n";*)
adamc@453 396 if changed then
adamc@520 397 let
adamc@721 398 (*val file = ReduceLocal.reduce file*)
adamc@802 399 (*val () = Print.prefaces "Pre-untangle" [("file", CorePrint.p_file CoreEnv.empty file)]*)
adamc@520 400 val file = CoreUntangle.untangle file
adamc@802 401 (*val () = Print.prefaces "Post-untangle" [("file", CorePrint.p_file CoreEnv.empty file)]*)
adamc@520 402 val file = Shake.shake file
adamc@520 403 in
adamc@520 404 (*print "Again!\n";*)
adamc@520 405 specialize file
adamc@520 406 end
adamc@453 407 else
adamc@453 408 file
adamc@453 409 end
adamc@453 410
adamc@443 411 end