From 0edd83555cff06b0cdbb71b3f757a87a3bcbcd89 Mon Sep 17 00:00:00 2001 From: Fengyun Liu Date: Wed, 15 Jun 2022 12:05:10 +0200 Subject: [PATCH 01/10] Remove Env We only use it to pass constructor arguments. As now we store constructor arguments on the underlying object, there no need for it any more. --- .../tools/dotc/transform/init/Semantic.scala | 107 ++++-------------- 1 file changed, 25 insertions(+), 82 deletions(-) diff --git a/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala b/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala index b6144b677801..e2c1154d9cca 100644 --- a/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala +++ b/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala @@ -144,56 +144,6 @@ object Semantic: def hasField(f: Symbol) = fields.contains(f) - /** The environment stores values for constructor parameters - * - * For performance and usability, we restrict parameters to be either `Cold` - * or `Hot`. - * - * Despite that we have environment for evaluating expressions in secondary - * constructors, we don't need to put environment as the cache key. The - * reason is that constructor parameters are determined by the value of - * `this` --- it suffices to make the value of `this` as part of the cache - * key. - * - * This crucially depends on the fact that in the initialization process - * there can be exactly one call to a specific constructor for a given - * receiver. However, once we relax the design to allow non-hot values to - * methods and functions, we have to put the environment as part of the cache - * key. The reason is that given the same receiver, a method or function may - * be called with different arguments -- they are not decided by the receiver - * anymore. - * - * TODO: remove Env as it is only used to pass value from `callConstructor` -> `eval` -> `init`. - * It goes through `eval` for caching (termination) purposes. - */ - object Env: - opaque type Env = Map[Symbol, Value] - - val empty: Env = Map.empty - - def apply(bindings: Map[Symbol, Value]): Env = bindings - - def apply(ddef: DefDef, args: List[Value])(using Context): Env = - val params = ddef.termParamss.flatten.map(_.symbol) - assert(args.size == params.size, "arguments = " + args.size + ", params = " + params.size) - params.zip(args).toMap - - extension (env: Env) - def lookup(sym: Symbol)(using Context): Value = env(sym) - - def getOrElse(sym: Symbol, default: Value)(using Context): Value = env.getOrElse(sym, default) - - def union(other: Env): Env = env ++ other - - def isHot: Boolean = env.values.forall(_ == Hot) - end Env - - type Env = Env.Env - inline def env(using env: Env) = env - inline def withEnv[T](env: Env)(op: Env ?=> T): T = op(using env) - - import Env.* - object Promoted: class PromotionInfo: var isCurrentObjectPromoted: Boolean = false @@ -399,7 +349,7 @@ object Semantic: // ----- Checker State ----------------------------------- /** The state that threads through the interpreter */ - type Contextual[T] = (Env, Context, Trace, Promoted, Cache, Reporter) ?=> T + type Contextual[T] = (Context, Trace, Promoted, Cache, Reporter) ?=> T // ----- Error Handling ----------------------------------- @@ -692,10 +642,8 @@ object Semantic: outer.instantiate(klass, klass.primaryConstructor, args) else reporter.reportAll(argErrors) - withEnv(if isLocal then env else Env.empty) { - extendTrace(ddef) { - eval(ddef.rhs, ref, cls, cacheResult = true) - } + extendTrace(ddef) { + eval(ddef.rhs, ref, cls, cacheResult = true) } else if ref.canIgnoreMethodCall(target) then Hot @@ -726,15 +674,14 @@ object Semantic: } def callConstructor(ctor: Symbol, args: List[ArgInfo]): Contextual[Value] = log("call " + ctor.show + ", args = " + args.map(_.value.show), printer, (_: Value).show) { - // init "fake" param fields for the secondary constructor - def addParamsAsFields(env: Env, ref: Ref, ctorDef: DefDef) = { - val paramSyms = ctorDef.termParamss.flatten.map(_.symbol) - paramSyms.map { acc => - val value = env.lookup(acc) - ref.updateField(acc, value) - printer.println(acc.show + " initialized with " + value) - } - } + // init "fake" param fields for parameters of primary and secondary constructors + def addParamsAsFields(args: List[Value], ref: Ref, ctorDef: DefDef) = + val params = ctorDef.termParamss.flatten.map(_.symbol) + assert(args.size == params.size, "arguments = " + args.size + ", params = " + params.size) + for (param, value) <- params.zip(args) do + ref.updateField(param, value) + printer.println(param.show + " initialized with " + value) + value match { case Hot | Cold | _: RefSet | _: Fun => report.error("unexpected constructor call, meth = " + ctor + ", value = " + value, trace.toVector.last) @@ -744,13 +691,12 @@ object Semantic: if ctor.hasSource then val cls = ctor.owner.enclosingClass.asClass val ddef = ctor.defTree.asInstanceOf[DefDef] - val env2 = Env(ddef, args.map(_.value).widenArgs) + val args2 = args.map(_.value).widenArgs + addParamsAsFields(args2, ref, ddef) if ctor.isPrimaryConstructor then - given Env = env2 val tpl = cls.defTree.asInstanceOf[TypeDef].rhs.asInstanceOf[Template] extendTrace(cls.defTree) { init(tpl, ref, cls) } else - addParamsAsFields(env2, ref, ddef) val initCall = ddef.rhs match case Block(call :: _, _) => call case call => call @@ -763,14 +709,13 @@ object Semantic: if ctor.hasSource then val cls = ctor.owner.enclosingClass.asClass val ddef = ctor.defTree.asInstanceOf[DefDef] - val env2 = Env(ddef, args.map(_.value).widenArgs) + val args2 = args.map(_.value).widenArgs + addParamsAsFields(args2, ref, ddef) if ctor.isPrimaryConstructor then - given Env = env2 val tpl = cls.defTree.asInstanceOf[TypeDef].rhs.asInstanceOf[Template] extendTrace(cls.defTree) { eval(tpl, ref, cls, cacheResult = true) } ref else - addParamsAsFields(env2, ref, ddef) extendTrace(ddef) { eval(ddef.rhs, ref, cls, cacheResult = true) } else if ref.canIgnoreMethodCall(ctor) then Hot @@ -1057,16 +1002,18 @@ object Semantic: val thisRef = task.value val tpl = thisRef.klass.defTree.asInstanceOf[TypeDef].rhs.asInstanceOf[Template] - val paramValues = tpl.constr.termParamss.flatten.map(param => param.symbol -> Hot).toMap - @tailrec def iterate(): Unit = { given Promoted = Promoted.empty given Trace = Trace.empty.add(thisRef.klass.defTree) - given Env = Env(paramValues) given reporter: Reporter.BufferedReporter = new Reporter.BufferedReporter thisRef.ensureFresh() + + // set up constructor parameters + for param <- tpl.constr.termParamss.flatten do + thisRef.updateField(param.symbol, Hot) + log("checking " + task) { eval(tpl, thisRef, thisRef.klass) } reporter.errors.foreach(_.issue) @@ -1433,7 +1380,7 @@ object Semantic: /** Initialize part of an abstract object in `klass` of the inheritance chain */ def init(tpl: Template, thisV: Ref, klass: ClassSymbol): Contextual[Value] = log("init " + klass.show, printer, (_: Value).show) { val paramsMap = tpl.constr.termParamss.flatten.map { vdef => - vdef.name -> env.lookup(vdef.symbol) + vdef.name -> thisV.objekt.field(vdef.symbol) }.toMap // init param fields @@ -1446,7 +1393,7 @@ object Semantic: // Tasks is used to schedule super constructor calls. // Super constructor calls are delayed until all outers are set. type Tasks = mutable.ArrayBuffer[() => Unit] - def superCall(tref: TypeRef, ctor: Symbol, args: List[ArgInfo], tasks: Tasks)(using Env): Unit = + def superCall(tref: TypeRef, ctor: Symbol, args: List[ArgInfo], tasks: Tasks): Unit = val cls = tref.classSymbol.asClass // update outer for super class val res = outerValue(tref, thisV, klass) @@ -1461,7 +1408,7 @@ object Semantic: } // parents - def initParent(parent: Tree, tasks: Tasks)(using Env) = + def initParent(parent: Tree, tasks: Tasks) = parent match case tree @ Block(stats, NewExpr(tref, New(tpt), ctor, argss)) => // can happen eval(stats, thisV, klass) @@ -1479,8 +1426,6 @@ object Semantic: // see spec 5.1 about "Template Evaluation". // https://www.scala-lang.org/files/archive/spec/2.13/05-classes-and-objects.html if !klass.is(Flags.Trait) then - given Env = Env.empty - // outers are set first val tasks = new mutable.ArrayBuffer[() => Unit] @@ -1526,7 +1471,6 @@ object Semantic: // class body if thisV.isThisRef || !thisV.asInstanceOf[Warm].isPopulatingParams then tpl.body.foreach { case vdef : ValDef if !vdef.symbol.is(Flags.Lazy) && !vdef.rhs.isEmpty => - given Env = Env.empty val res = eval(vdef.rhs, thisV, klass) thisV.updateField(vdef.symbol, res) fieldsChanged = true @@ -1534,10 +1478,9 @@ object Semantic: case _: MemberDef => case tree => - if fieldsChanged && thisV.isThisRef then thisV.asInstanceOf[ThisRef].tryPromoteCurrentObject() + if fieldsChanged && thisV.isThisRef then + thisV.asInstanceOf[ThisRef].tryPromoteCurrentObject() fieldsChanged = false - - given Env = Env.empty eval(tree, thisV, klass) } From 6b49b26cd2077b766149ed31f48188a660747e95 Mon Sep 17 00:00:00 2001 From: Fengyun Liu Date: Wed, 15 Jun 2022 13:50:57 +0200 Subject: [PATCH 02/10] Refactor cache to use immutable maps --- .../tools/dotc/transform/init/Semantic.scala | 105 +++++++++++++----- 1 file changed, 76 insertions(+), 29 deletions(-) diff --git a/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala b/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala index e2c1154d9cca..d41591850aa3 100644 --- a/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala +++ b/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala @@ -10,7 +10,6 @@ import StdNames.* import NameKinds.OuterSelectName import ast.tpd.* -import util.EqHashMap import config.Printers.init as printer import reporting.trace as log @@ -198,17 +197,51 @@ object Semantic: * Note: It's tempting to use location of trees as key. That should * be avoided as a template may have the same location as its single * statement body. Macros may also create incorrect locations. - * */ object Cache: - opaque type CacheStore = mutable.Map[Value, EqHashMap[Tree, Value]] + /** Cache for expressions + * + * Ref -> Tree -> Value + * + * The first key is the value of `this` for the expression. We do not need + * environment, because the environment is always hot. + */ + private type ExprValueCache = Map[Value, Map[TreeWrapper, Value]] + + /** The heap for abstract objects + * + * The heap objects are immutable. + */ private type Heap = Map[Ref, Objekt] + /** A wrapper for trees for storage in maps based on referential equality of trees. */ + private abstract class TreeWrapper: + def tree: Tree + + override final def equals(other: Any): Boolean = + other match + case that: TreeWrapper => this.tree eq that.tree + case _ => false + + override final def hashCode = tree.hashCode + + /** The immutable wrapper is intended to be stored as key in the heap. */ + private class ImmutableTreeWrapper(val tree: Tree) extends TreeWrapper + + /** For queries on the heap, reuse the same wrapper to avoid unnecessary allocation. */ + private class MutableTreeWrapper extends TreeWrapper: + var queryTree: Tree | Null = null + def tree: Tree = queryTree match + case tree: Tree => tree + case null => ??? + + private val queryTreeMapper: MutableTreeWrapper = new MutableTreeWrapper + class Cache: - private var last: CacheStore = mutable.Map.empty - private var current: CacheStore = mutable.Map.empty - private val stable: CacheStore = mutable.Map.empty + private var last: ExprValueCache = Map.empty + private var current: ExprValueCache = Map.empty + private var stable: ExprValueCache = Map.empty private var changed: Boolean = false /** Abstract heap stores abstract objects @@ -243,8 +276,8 @@ object Semantic: current.contains(value, expr) || stable.contains(value, expr) def apply(value: Value, expr: Tree) = - if current.contains(value, expr) then current(value)(expr) - else stable(value)(expr) + if current.contains(value, expr) then current.get(value, expr) + else stable.get(value, expr) /** Copy the value of `(value, expr)` from the last cache to the current cache * (assuming it's `Hot` if it doesn't exist in the cache). @@ -256,16 +289,16 @@ object Semantic: if last.contains(value, expr) then last.get(value, expr) else - last.put(value, expr, Hot) + this.last = last.updatedNested(value, expr, Hot) Hot end if - current.put(value, expr, assumeValue) + this.current = current.updatedNested(value, expr, assumeValue) val actual = fun if actual != assumeValue then this.changed = true - last.put(value, expr, actual) - current.put(value, expr, actual) + this.last = this.last.updatedNested(value, expr, actual) + this.current = this.current.updatedNested(value, expr, actual) else // It's tempting to cache the value in stable, but it's unsound. // The reason is that the current value may depend on other values @@ -280,12 +313,12 @@ object Semantic: /** Commit current cache to stable cache. */ private def commitToStableCache() = - current.foreach { (v, m) => - // It's useless to cache value for ThisRef. - if v.isWarm then m.iterator.foreach { (e, res) => - stable.put(v, e, res) - } - } + for + (v, m) <- current + if v.isWarm // It's useless to cache value for ThisRef. + (wrapper, res) <- m + do + this.stable = stable.updatedNestedWrapper(v, wrapper.asInstanceOf[ImmutableTreeWrapper], res) /** Prepare cache for the next iteration * @@ -298,7 +331,7 @@ object Semantic: */ def prepareForNextIteration()(using Context) = this.changed = false - this.current = mutable.Map.empty + this.current = Map.empty this.heap = this.heapStable /** Prepare for checking next class @@ -319,8 +352,8 @@ object Semantic: this.commitToStableCache() this.heapStable = this.heap - this.last = mutable.Map.empty - this.current = mutable.Map.empty + this.last = Map.empty + this.current = Map.empty def updateObject(ref: Ref, obj: Objekt) = assert(!this.heapStable.contains(ref)) @@ -331,14 +364,28 @@ object Semantic: def getObject(ref: Ref) = heap(ref) end Cache - extension (cache: CacheStore) - def contains(value: Value, expr: Tree) = cache.contains(value) && cache(value).contains(expr) - def get(value: Value, expr: Tree): Value = cache(value)(expr) - def remove(value: Value, expr: Tree) = cache(value).remove(expr) - def put(value: Value, expr: Tree, result: Value): Unit = { - val innerMap = cache.getOrElseUpdate(value, new EqHashMap[Tree, Value]) - innerMap(expr) = result - } + extension (cache: ExprValueCache) + private def contains(value: Value, expr: Tree) = + queryTreeMapper.queryTree = expr + cache.contains(value) && cache(value).contains(queryTreeMapper) + + private def get(value: Value, expr: Tree): Value = + queryTreeMapper.queryTree = expr + cache(value)(queryTreeMapper) + + private def removed(value: Value, expr: Tree) = + queryTreeMapper.queryTree = expr + val innerMap2 = cache(value).removed(queryTreeMapper) + cache.updated(value, innerMap2) + + private def updatedNested(value: Value, expr: Tree, result: Value): ExprValueCache = + val wrapper = new ImmutableTreeWrapper(expr) + updatedNestedWrapper(value, wrapper, result) + + private def updatedNestedWrapper(value: Value, wrapper: ImmutableTreeWrapper, result: Value): ExprValueCache = + val innerMap = cache.getOrElse(value, Map.empty[TreeWrapper, Value]) + val innerMap2 = innerMap.updated(wrapper, result) + cache.updated(value, innerMap2) end extension end Cache From faccf75432862dbf5dab7a0fae2dc8c33ae80963 Mon Sep 17 00:00:00 2001 From: Fengyun Liu Date: Wed, 15 Jun 2022 14:08:21 +0200 Subject: [PATCH 03/10] Add docs to code --- .../tools/dotc/transform/init/Semantic.scala | 15 +++++++++++++++ 1 file changed, 15 insertions(+) diff --git a/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala b/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala index d41591850aa3..a9d283f88738 100644 --- a/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala +++ b/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala @@ -239,9 +239,24 @@ object Semantic: private val queryTreeMapper: MutableTreeWrapper = new MutableTreeWrapper class Cache: + /** The cache for expression values from last iteration */ private var last: ExprValueCache = Map.empty + + /** The updated cache for expression values based on the cache values from the last iteration */ private var current: ExprValueCache = Map.empty + + /** Global cached values for expressions + * + * The values are only added when a fixed point is reached. + * + * It is intended to improve performance for computation related to warm values. + */ private var stable: ExprValueCache = Map.empty + + /** Whether the current heap is different from the last heap? + * + * `changed == true` implies that the fixed point has been reached. + */ private var changed: Boolean = false /** Abstract heap stores abstract objects From a5d2281211f680746684a6e7938c6a4995abfc53 Mon Sep 17 00:00:00 2001 From: Fengyun Liu Date: Wed, 15 Jun 2022 14:47:51 +0200 Subject: [PATCH 04/10] Try fix assertion errors --- .../tools/dotc/transform/init/Semantic.scala | 51 +++++++++++++++---- 1 file changed, 41 insertions(+), 10 deletions(-) diff --git a/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala b/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala index a9d283f88738..769e55e8ea88 100644 --- a/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala +++ b/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala @@ -242,7 +242,10 @@ object Semantic: /** The cache for expression values from last iteration */ private var last: ExprValueCache = Map.empty - /** The updated cache for expression values based on the cache values from the last iteration */ + /** The updated cache for expression values based on the cache values from the last iteration + * + * Both `last` and `current` are required to make sure an expression is evaluated once in each iteration. + */ private var current: ExprValueCache = Map.empty /** Global cached values for expressions @@ -294,10 +297,36 @@ object Semantic: if current.contains(value, expr) then current.get(value, expr) else stable.get(value, expr) + /** Conditionally perform an operation + * + * If the operation returns true, the changes are commited. Otherwise, the changes are reverted. + */ + def conditionally[T](fn: => (Boolean, T)): T = + val last2 = this.last + val current2 = this.current + val stable2 = this.stable + val heap2 = this.heap + val heapStable2 = this.heapStable + val changed2 = this.changed + val (commit, value) = fn + + if commit then + this.last = last2 + this.current = current2 + this.stable = stable2 + this.heap = heap2 + this.heapStable = heapStable2 + this.changed = changed2 + + value + /** Copy the value of `(value, expr)` from the last cache to the current cache - * (assuming it's `Hot` if it doesn't exist in the cache). * - * Then, runs `fun` and update the caches if the values change. + * It assumes the value is `Hot` if it doesn't exist in the last cache. + * + * It update the current caches if the values change. + * + * The two caches are required because we want to make sure in a new iteration, an expression is evaluated once. */ def assume(value: Value, expr: Tree, cacheResult: Boolean)(fun: => Value): Contextual[Value] = val assumeValue: Value = @@ -312,7 +341,6 @@ object Semantic: val actual = fun if actual != assumeValue then this.changed = true - this.last = this.last.updatedNested(value, expr, actual) this.current = this.current.updatedNested(value, expr, actual) else // It's tempting to cache the value in stable, but it's unsound. @@ -339,13 +367,13 @@ object Semantic: * * 1. Reset changed flag. * - * 2. Reset current cache (last cache already synced in `assume`). - * - * 3. Revert heap if instable. + * 2. Use current cache as last cache and set current cache to be empty. * + * 3. Revert heap to stable. */ def prepareForNextIteration()(using Context) = this.changed = false + this.last = this.current this.current = Map.empty this.heap = this.heapStable @@ -542,12 +570,15 @@ object Semantic: // We may reset the outers or params of a populated warm object. // This is the case if we need access the field of a warm object, which // requires population of parameters and outers; and later create an - // instance of the exact warm object, which requires initialization check. + // instance of the exact warm object, whose initialization will reset + // the outer and constructor parameters. // // See tests/init/neg/unsound1.scala - assert(!obj.hasField(field) || field.is(Flags.ParamAccessor) && obj.field(field) == value, field.show + " already init, new = " + value + ", old = " + obj.field(field) + ", ref = " + ref) + val changed = !obj.hasField(field) || obj.field(field) != value + def isParamUpdate = field.isOneOf(Flags.ParamAccessor | Flags.Param) && obj.field(field) == value + assert(!obj.hasField(field) || isParamUpdate, field.show + " already init, new = " + value + ", old = " + obj.field(field) + ", ref = " + ref) val obj2 = obj.copy(fields = obj.fields.updated(field, value)) - cache.updateObject(ref, obj2) + if changed then cache.updateObject(ref, obj2) } /** Update the immediate outer of the given `klass` of the abstract object From f088428f372867db52f1549c3d3211fdc32e675f Mon Sep 17 00:00:00 2001 From: Fengyun Liu Date: Fri, 17 Jun 2022 23:18:04 +0200 Subject: [PATCH 05/10] Avoid concurrency issue --- .../tools/dotc/transform/init/Semantic.scala | 47 +++++++++---------- 1 file changed, 23 insertions(+), 24 deletions(-) diff --git a/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala b/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala index 769e55e8ea88..dfcb706c8bca 100644 --- a/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala +++ b/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala @@ -236,8 +236,6 @@ object Semantic: case tree: Tree => tree case null => ??? - private val queryTreeMapper: MutableTreeWrapper = new MutableTreeWrapper - class Cache: /** The cache for expression values from last iteration */ private var last: ExprValueCache = Map.empty @@ -288,14 +286,15 @@ object Semantic: /** Used to revert heap to last stable heap. */ private var heapStable: Heap = Map.empty - def hasChanged = changed + /** Used to avoid allocation, its state does not matter */ + private given MutableTreeWrapper = new MutableTreeWrapper - def contains(value: Value, expr: Tree) = - current.contains(value, expr) || stable.contains(value, expr) + def hasChanged = changed - def apply(value: Value, expr: Tree) = - if current.contains(value, expr) then current.get(value, expr) - else stable.get(value, expr) + def get(value: Value, expr: Tree): Option[Value] = + current.get(value, expr) match + case None => stable.get(value, expr) + case res => res /** Conditionally perform an operation * @@ -330,12 +329,12 @@ object Semantic: */ def assume(value: Value, expr: Tree, cacheResult: Boolean)(fun: => Value): Contextual[Value] = val assumeValue: Value = - if last.contains(value, expr) then - last.get(value, expr) - else + last.get(value, expr) match + case Some(value) => value + case None => this.last = last.updatedNested(value, expr, Hot) Hot - end if + this.current = current.updatedNested(value, expr, assumeValue) val actual = fun @@ -408,17 +407,13 @@ object Semantic: end Cache extension (cache: ExprValueCache) - private def contains(value: Value, expr: Tree) = - queryTreeMapper.queryTree = expr - cache.contains(value) && cache(value).contains(queryTreeMapper) + private def get(value: Value, expr: Tree)(using queryWrapper: MutableTreeWrapper): Option[Value] = + queryWrapper.queryTree = expr + cache.get(value).flatMap(_.get(queryWrapper)) - private def get(value: Value, expr: Tree): Value = - queryTreeMapper.queryTree = expr - cache(value)(queryTreeMapper) - - private def removed(value: Value, expr: Tree) = - queryTreeMapper.queryTree = expr - val innerMap2 = cache(value).removed(queryTreeMapper) + private def removed(value: Value, expr: Tree)(using queryWrapper: MutableTreeWrapper) = + queryWrapper.queryTree = expr + val innerMap2 = cache(value).removed(queryWrapper) cache.updated(value, innerMap2) private def updatedNested(value: Value, expr: Tree, result: Value): ExprValueCache = @@ -1167,10 +1162,14 @@ object Semantic: * it is located. * * This method only handles cache logic and delegates the work to `cases`. + * + * The parameter `cacheResult` is used to reduce the size of the cache. */ def eval(expr: Tree, thisV: Ref, klass: ClassSymbol, cacheResult: Boolean = false): Contextual[Value] = log("evaluating " + expr.show + ", this = " + thisV.show + " in " + klass.show, printer, (_: Value).show) { - if (cache.contains(thisV, expr)) cache(thisV, expr) - else cache.assume(thisV, expr, cacheResult) { cases(expr, thisV, klass) } + cache.get(thisV, expr) match + case Some(value) => value + case None => + cache.assume(thisV, expr, cacheResult) { cases(expr, thisV, klass) } } /** Evaluate a list of expressions */ From 1736fb91de72a2ce10c90494c70dd3499d0ea3c4 Mon Sep 17 00:00:00 2001 From: Fengyun Liu Date: Sat, 18 Jun 2022 00:21:31 +0200 Subject: [PATCH 06/10] Restore state if errors are thrown away --- .../tools/dotc/transform/init/Semantic.scala | 110 +++++++++++------- 1 file changed, 68 insertions(+), 42 deletions(-) diff --git a/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala b/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala index dfcb706c8bca..461175772d8a 100644 --- a/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala +++ b/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala @@ -296,28 +296,28 @@ object Semantic: case None => stable.get(value, expr) case res => res - /** Conditionally perform an operation + /** Backup the state of the cache * - * If the operation returns true, the changes are commited. Otherwise, the changes are reverted. + * All the shared data structures must be immutable. */ - def conditionally[T](fn: => (Boolean, T)): T = - val last2 = this.last - val current2 = this.current - val stable2 = this.stable - val heap2 = this.heap - val heapStable2 = this.heapStable - val changed2 = this.changed - val (commit, value) = fn - - if commit then - this.last = last2 - this.current = current2 - this.stable = stable2 - this.heap = heap2 - this.heapStable = heapStable2 - this.changed = changed2 - - value + def backup(): Cache = + val cache = new Cache + cache.last = this.last + cache.current = this.current + cache.stable = this.stable + cache.heap = this.heap + cache.heapStable = this.heapStable + cache.changed = this.changed + cache + + /** Restore state from a backup */ + def restore(cache: Cache) = + this.last = cache.last + this.current = cache.current + this.stable = cache.stable + this.heap = cache.heap + this.heapStable = cache.heapStable + this.changed = cache.changed /** Copy the value of `(value, expr)` from the last cache to the current cache * @@ -459,21 +459,36 @@ object Semantic: def report(err: Error): Unit def reportAll(errs: Seq[Error]): Unit = for err <- errs do report(err) + /** A TryReporter cannot be simply thrown away + * + * Either `abort` should be called or the errors be reported. + */ + trait TryReporter extends Reporter: + def abort()(using Cache): Unit + def errors: List[Error] + object Reporter: class BufferedReporter extends Reporter: private val buf = new mutable.ArrayBuffer[Error] def errors = buf.toList def report(err: Error) = buf += err + class TryBufferedReporter(backup: Cache) extends BufferedReporter with TryReporter: + def abort()(using Cache): Unit = cache.restore(backup) + class ErrorFound(val error: Error) extends Exception class StopEarlyReporter extends Reporter: def report(err: Error) = throw new ErrorFound(err) - /** Capture all errors and return as a list */ - def errorsIn(fn: Reporter ?=> Unit): List[Error] = - val reporter = new BufferedReporter + /** Capture all errors with a TryReporter + * + * The TryReporter cannot be thrown away: either `abort` must be called or + * the errors must be reported. + */ + def errorsIn(fn: Reporter ?=> Unit)(using Cache): TryReporter = + val reporter = new TryBufferedReporter(cache.backup()) fn(using reporter) - reporter.errors.toList + reporter /** Stop on first error */ def stopEarly(fn: Reporter ?=> Unit): List[Error] = @@ -485,6 +500,11 @@ object Semantic: catch case ex: ErrorFound => ex.error :: Nil + def hasErrors(fn: Reporter ?=> Unit)(using Cache): Boolean = + val backup = cache.backup() + val errors = stopEarly(fn) + cache.restore(backup) + errors.nonEmpty inline def reporter(using r: Reporter): Reporter = r @@ -517,9 +537,8 @@ object Semantic: def widenArg: Contextual[Value] = a match case _: Ref | _: Fun => - val errors = Reporter.stopEarly { a.promote("Argument cannot be promoted to hot") } - if errors.isEmpty then Hot - else Cold + val hasError = Reporter.hasErrors { a.promote("Argument cannot be promoted to hot") } + if hasError then Cold else Hot case RefSet(refs) => refs.map(_.widenArg).join @@ -662,9 +681,11 @@ object Semantic: var allArgsHot = true val allParamTypes = methodType.paramInfoss.flatten.map(_.repeatedToSingle) val errors = allParamTypes.zip(args).flatMap { (info, arg) => - val errors = Reporter.errorsIn { arg.promote } - allArgsHot = allArgsHot && errors.isEmpty - info match + val tryReporter = Reporter.errorsIn { arg.promote } + allArgsHot = allArgsHot && tryReporter.errors.isEmpty + if tryReporter.errors.isEmpty then tryReporter.errors + else + info match case typeParamRef: TypeParamRef => val bounds = typeParamRef.underlying.bounds val isWithinBounds = bounds.lo <:< defn.NothingType && defn.AnyType <:< bounds.hi @@ -673,8 +694,12 @@ object Semantic: // type parameter T with Any as its upper bound and Nothing as its lower bound. // the other arguments should either correspond to a parameter type that is T // or that does not contain T as a component. - if isWithinBounds && !otherParamContains then Nil else errors - case _ => errors + if isWithinBounds && !otherParamContains then + tryReporter.abort() + Nil + else + tryReporter.errors + case _ => tryReporter.errors } (errors, allArgsHot) @@ -721,15 +746,16 @@ object Semantic: if target.hasSource then val cls = target.owner.enclosingClass.asClass val ddef = target.defTree.asInstanceOf[DefDef] - val argErrors = Reporter.errorsIn { promoteArgs() } + val tryReporter = Reporter.errorsIn { promoteArgs() } // normal method call - if argErrors.nonEmpty && isSyntheticApply(meth) then + if tryReporter.errors.nonEmpty && isSyntheticApply(meth) then + tryReporter.abort() val klass = meth.owner.companionClass.asClass val outerCls = klass.owner.lexicallyEnclosingClass.asClass val outer = resolveOuterSelect(outerCls, ref, 1) outer.instantiate(klass, klass.primaryConstructor, args) else - reporter.reportAll(argErrors) + reporter.reportAll(tryReporter.errors) extendTrace(ddef) { eval(ddef.rhs, ref, cls, cacheResult = true) } @@ -841,15 +867,15 @@ object Semantic: if promoted.isCurrentObjectPromoted then Hot else value match { case Hot => - val buffer = new mutable.ArrayBuffer[Error] + var allHot = true val args2 = args.map { arg => - val errors = Reporter.errorsIn { arg.promote } - buffer ++= errors - if errors.isEmpty then Hot - else arg.value.widenArg + val hasErrors = Reporter.hasErrors { arg.promote } + allHot = allHot && !hasErrors + if hasErrors then arg.value.widenArg + else Hot } - if buffer.isEmpty then + if allHot then Hot else val outer = Hot @@ -998,7 +1024,7 @@ object Semantic: given Trace = Trace.empty.add(body) res.promote("The function return value is not fully initialized.") } - if (errors.nonEmpty) + if errors.nonEmpty then reporter.report(UnsafePromotion(msg, trace.toVector, errors.head)) else promoted.add(fun) From b5c2ffbd7784b84e3aa3bcd1f1be1c06a7e79e94 Mon Sep 17 00:00:00 2001 From: Fengyun Liu Date: Sat, 18 Jun 2022 00:55:44 +0200 Subject: [PATCH 07/10] More docs --- .../tools/dotc/transform/init/Semantic.scala | 68 +++++++++++-------- 1 file changed, 40 insertions(+), 28 deletions(-) diff --git a/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala b/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala index 461175772d8a..d98f9b9b0c85 100644 --- a/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala +++ b/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala @@ -168,44 +168,56 @@ object Semantic: import Promoted.* inline def promoted(using p: Promoted): Promoted = p - /** Interpreter configuration + /** Cache used in fixed point computation * - * The (abstract) interpreter can be seen as a push-down automaton - * that transits between the configurations where the stack is the - * implicit call stack of the meta-language. + * The analysis computes the least fixed point for the cache (see doc for + * `ExprValueCache`). * - * It's important that the configuration is finite for the analysis - * to terminate. + * For the fixed point computation to terminate, we need to make sure that + * the domain of the cache, i.e. the key pair (Ref, Tree) is finite. As the + * code is finite, we only need to carefully design the abstract domain to + * be finitary. * - * For soundness, we need to compute fixed point of the cache, which - * maps configuration to evaluation result. + * We also need to make sure that the computing function (i.e. the abstract + * interpreter) is monotone. Error handling breaks monotonicity of the + * abstract interpreter, because when an error happens, we always return + * the bottom value `Hot` for an expression. It is not a threat for + * termination because when an error happens, we stop the fixed point + * computation at the end of the iteration where the error happens. * - * Thanks to heap monotonicity, heap is not part of the configuration. - * - * This class is only used for the purpose of documentation. - */ - case class Config(thisV: Value, expr: Tree) - - /** Cache used to terminate the analysis - * - * A finitary configuration is not enough for the analysis to - * terminate. We need to use cache to let the interpreter "know" - * that it can terminate. - * - * For performance reasons we use curried key. - * - * Note: It's tempting to use location of trees as key. That should - * be avoided as a template may have the same location as its single - * statement body. Macros may also create incorrect locations. + * Note: It's tempting to use location of trees as key. That should + * be avoided as a template may have the same location as its single + * statement body. Macros may also create incorrect locations. */ - object Cache: /** Cache for expressions * * Ref -> Tree -> Value * * The first key is the value of `this` for the expression. We do not need - * environment, because the environment is always hot. + * environment in the key, because the environment is always hot. + * + * We do not need the heap in the key, because the value of an expression + * is only determined by the value of `this`. The heap is immutable: the + * abstract values for object fields never change within one iteration. + * The initial abstraction of a field is always a safe over-approximation + * thanks to monotonicity of initialization states. + * + * If the heap is unstable in an iteration, the cache should also be + * unstable. This is because all values stored in the heap are also present + * in the cache. Therefore, we only need to track whether the cache is + * stable between two iterations. + * + * The heap is not part of the fixed point computation -- we throw the + * unstable heap from last iteration away. In contrast, we use the unstable + * output cache from the last iteration as input for the next iteration. + * This is safe because the heap is determined by the cache -- it is a + * "local" data to the computing function, conceptually. Local data is + * always safe be discarded. + * + * Now, if a fixed point is reached, the local data contains stable data + * that could be reused to check other classes. We employ this trick to + * improve performance of the analysis. */ private type ExprValueCache = Map[Value, Map[TreeWrapper, Value]] @@ -323,7 +335,7 @@ object Semantic: * * It assumes the value is `Hot` if it doesn't exist in the last cache. * - * It update the current caches if the values change. + * It updates the current caches if the values change. * * The two caches are required because we want to make sure in a new iteration, an expression is evaluated once. */ From 5e0afd8cd84d9b4dc5091266b9134a9b96ed12bc Mon Sep 17 00:00:00 2001 From: Fengyun Liu Date: Mon, 20 Jun 2022 21:12:56 +0200 Subject: [PATCH 08/10] Apply suggestions from code review MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Co-authored-by: Ondřej Lhoták --- compiler/src/dotty/tools/dotc/transform/init/Semantic.scala | 5 ++--- 1 file changed, 2 insertions(+), 3 deletions(-) diff --git a/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala b/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala index d98f9b9b0c85..69a8cffdf3eb 100644 --- a/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala +++ b/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala @@ -194,8 +194,7 @@ object Semantic: * * Ref -> Tree -> Value * - * The first key is the value of `this` for the expression. We do not need - * environment in the key, because the environment is always hot. + * The first key is the value of `this` for the expression. * * We do not need the heap in the key, because the value of an expression * is only determined by the value of `this`. The heap is immutable: the @@ -268,7 +267,7 @@ object Semantic: /** Whether the current heap is different from the last heap? * - * `changed == true` implies that the fixed point has been reached. + * `changed == false` implies that the fixed point has been reached. */ private var changed: Boolean = false From e351630d6e64774057a278f8e468032618e45270 Mon Sep 17 00:00:00 2001 From: Fengyun Liu Date: Mon, 20 Jun 2022 21:23:07 +0200 Subject: [PATCH 09/10] Address review --- .../tools/dotc/transform/init/Semantic.scala | 25 ++++++++++++++++--- 1 file changed, 21 insertions(+), 4 deletions(-) diff --git a/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala b/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala index 69a8cffdf3eb..0b4bafb10124 100644 --- a/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala +++ b/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala @@ -183,7 +183,9 @@ object Semantic: * abstract interpreter, because when an error happens, we always return * the bottom value `Hot` for an expression. It is not a threat for * termination because when an error happens, we stop the fixed point - * computation at the end of the iteration where the error happens. + * computation at the end of the iteration where the error happens. Care + * must be paid to tests of errors, monotonicity will be broken if we simply + * ignore the test errors (See `TryReporter`). * * Note: It's tempting to use location of trees as key. That should * be avoided as a template may have the same location as its single @@ -240,7 +242,11 @@ object Semantic: /** The immutable wrapper is intended to be stored as key in the heap. */ private class ImmutableTreeWrapper(val tree: Tree) extends TreeWrapper - /** For queries on the heap, reuse the same wrapper to avoid unnecessary allocation. */ + /** For queries on the heap, reuse the same wrapper to avoid unnecessary allocation. + * + * A `MutableTreeWrapper` is only ever used temporarily for querying a map, + * and is never inserted to the map. + */ private class MutableTreeWrapper extends TreeWrapper: var queryTree: Tree | Null = null def tree: Tree = queryTree match @@ -251,9 +257,13 @@ object Semantic: /** The cache for expression values from last iteration */ private var last: ExprValueCache = Map.empty - /** The updated cache for expression values based on the cache values from the last iteration + /** The output cache for expression values + * + * The output cache is computed based on the cache values `last` from the + * last iteration. * - * Both `last` and `current` are required to make sure an expression is evaluated once in each iteration. + * Both `last` and `current` are required to make sure an encountered + * expression is evaluated once in each iteration. */ private var current: ExprValueCache = Map.empty @@ -473,8 +483,15 @@ object Semantic: /** A TryReporter cannot be simply thrown away * * Either `abort` should be called or the errors be reported. + * + * If errors are ignored and `abort` is not called, the monotonicity of the + * computation function is not guaranteed, thus termination of fixed-point + * computation becomes a problem. */ trait TryReporter extends Reporter: + /** + * Revert the cache to previous state. + */ def abort()(using Cache): Unit def errors: List[Error] From 227616c5e161f3152ff3aaace1bcde1b1c1281ba Mon Sep 17 00:00:00 2001 From: Fengyun Liu Date: Mon, 20 Jun 2022 22:07:08 +0200 Subject: [PATCH 10/10] Fix #15459: Display uninitialized fields in promotion error --- .../tools/dotc/transform/init/Semantic.scala | 21 +++++++++++++++++-- tests/init/neg/closureLeak.check | 3 ++- tests/init/neg/default-this.check | 19 +++++++++-------- tests/init/neg/i15459.check | 11 ++++++++++ tests/init/neg/i15459.scala | 8 +++++++ tests/init/neg/inlined-method.check | 15 ++++++------- tests/init/neg/promotion-loop.check | 1 + 7 files changed, 59 insertions(+), 19 deletions(-) create mode 100644 tests/init/neg/i15459.check create mode 100644 tests/init/neg/i15459.scala diff --git a/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala b/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala index 0b4bafb10124..33edf79b2f1a 100644 --- a/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala +++ b/compiler/src/dotty/tools/dotc/transform/init/Semantic.scala @@ -1006,6 +1006,19 @@ object Semantic: } } + def nonInitFields(): Contextual[List[Symbol]] = + val obj = ref.objekt + ref.klass.baseClasses.flatMap { klass => + if klass.hasSource then + klass.info.decls.filter { member => + !member.isOneOf(Flags.Method | Flags.Lazy | Flags.Deferred) + && !member.isType + && !obj.hasField(member) + } + else + Nil + } + end extension extension (thisRef: ThisRef) @@ -1032,8 +1045,12 @@ object Semantic: reporter.report(PromoteError(msg, trace.toVector)) case thisRef: ThisRef => - if !thisRef.tryPromoteCurrentObject() then - reporter.report(PromoteError(msg, trace.toVector)) + val emptyFields = thisRef.nonInitFields() + if emptyFields.isEmpty then + promoted.promoteCurrent(thisRef) + else + val fields = "Non initialized field(s): " + emptyFields.map(_.show).mkString(", ") + "." + reporter.report(PromoteError(msg + "\n" + fields, trace.toVector)) case warm: Warm => if !promoted.contains(warm) then diff --git a/tests/init/neg/closureLeak.check b/tests/init/neg/closureLeak.check index a90355fce1d4..b25130a9ee64 100644 --- a/tests/init/neg/closureLeak.check +++ b/tests/init/neg/closureLeak.check @@ -8,6 +8,7 @@ | ^^^^^^^^^^^^^^^^^ | | Promoting the value to fully initialized failed due to the following problem: - | Cannot prove the argument is fully initialized. Only fully initialized values are safe to leak. Calling trace: + | Cannot prove the argument is fully initialized. Only fully initialized values are safe to leak. + | Non initialized field(s): value p. Calling trace: | -> l.foreach(a => a.addX(this)) // error [ closureLeak.scala:11 ] | ^^^^ diff --git a/tests/init/neg/default-this.check b/tests/init/neg/default-this.check index cccfa47a1fe7..25054c8360d3 100644 --- a/tests/init/neg/default-this.check +++ b/tests/init/neg/default-this.check @@ -1,12 +1,13 @@ -- Error: tests/init/neg/default-this.scala:9:8 ------------------------------------------------------------------------ 9 | compare() // error | ^^^^^^^ - | Cannot prove the argument is fully initialized. Only fully initialized values are safe to leak. Calling trace: - | -> class B extends A { [ default-this.scala:6 ] - | ^ - | -> val result = updateThenCompare(5) [ default-this.scala:11 ] - | ^^^^^^^^^^^^^^^^^^^^ - | -> def updateThenCompare(c: Int): Boolean = { [ default-this.scala:7 ] - | ^ - | -> compare() // error [ default-this.scala:9 ] - | ^^^^^^^ + | Cannot prove the argument is fully initialized. Only fully initialized values are safe to leak. + | Non initialized field(s): value result. Calling trace: + | -> class B extends A { [ default-this.scala:6 ] + | ^ + | -> val result = updateThenCompare(5) [ default-this.scala:11 ] + | ^^^^^^^^^^^^^^^^^^^^ + | -> def updateThenCompare(c: Int): Boolean = { [ default-this.scala:7 ] + | ^ + | -> compare() // error [ default-this.scala:9 ] + | ^^^^^^^ diff --git a/tests/init/neg/i15459.check b/tests/init/neg/i15459.check new file mode 100644 index 000000000000..f9f08c488605 --- /dev/null +++ b/tests/init/neg/i15459.check @@ -0,0 +1,11 @@ +-- Error: tests/init/neg/i15459.scala:3:10 ----------------------------------------------------------------------------- +3 | println(this) // error + | ^^^^ + | Cannot prove the argument is fully initialized. Only fully initialized values are safe to leak. + | Non initialized field(s): value b. Calling trace: + | -> class Sub extends Sup: [ i15459.scala:5 ] + | ^ + | -> class Sup: [ i15459.scala:1 ] + | ^ + | -> println(this) // error [ i15459.scala:3 ] + | ^^^^ diff --git a/tests/init/neg/i15459.scala b/tests/init/neg/i15459.scala new file mode 100644 index 000000000000..4d54f31f7af8 --- /dev/null +++ b/tests/init/neg/i15459.scala @@ -0,0 +1,8 @@ +class Sup: + val a = 10 + println(this) // error + +class Sub extends Sup: + val b = 20 + + override def toString() = "a = " + a + ", b = " + b diff --git a/tests/init/neg/inlined-method.check b/tests/init/neg/inlined-method.check index 72637948ceb9..627623f315a3 100644 --- a/tests/init/neg/inlined-method.check +++ b/tests/init/neg/inlined-method.check @@ -1,10 +1,11 @@ -- Error: tests/init/neg/inlined-method.scala:8:45 --------------------------------------------------------------------- 8 | scala.runtime.Scala3RunTime.assertFailed(message) // error | ^^^^^^^ - | Cannot prove the argument is fully initialized. Only fully initialized values are safe to leak. Calling trace: - | -> class InlineError { [ inlined-method.scala:1 ] - | ^ - | -> Assertion.failAssert(this) [ inlined-method.scala:2 ] - | ^^^^^^^^^^^^^^^^^^^^^^^^^^ - | -> scala.runtime.Scala3RunTime.assertFailed(message) // error [ inlined-method.scala:8 ] - | ^^^^^^^ + | Cannot prove the argument is fully initialized. Only fully initialized values are safe to leak. + | Non initialized field(s): value v. Calling trace: + | -> class InlineError { [ inlined-method.scala:1 ] + | ^ + | -> Assertion.failAssert(this) [ inlined-method.scala:2 ] + | ^^^^^^^^^^^^^^^^^^^^^^^^^^ + | -> scala.runtime.Scala3RunTime.assertFailed(message) // error [ inlined-method.scala:8 ] + | ^^^^^^^ diff --git a/tests/init/neg/promotion-loop.check b/tests/init/neg/promotion-loop.check index 5fae90f0ebfa..48eb763a7296 100644 --- a/tests/init/neg/promotion-loop.check +++ b/tests/init/neg/promotion-loop.check @@ -9,3 +9,4 @@ | | Promoting the value to fully initialized failed due to the following problem: | Cannot prove that the field val outer is fully initialized. + | Non initialized field(s): value n.