From 0277cd3c64d8e12701c7fdec41179c72f24c8a08 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Fri, 16 Feb 2024 05:56:48 +0100
Subject: [PATCH 001/169] don't emit header includes for unused imported
 globals (#1191)

## Summary

Imported globals are now only included in the build if they're used
anywhere in alive code, fixing C headers being unnecessarily pulled in
for them.

Closes https://github.com/nim-works/nimskull/issues/1190.
Closes https://github.com/nim-works/nimskull/issues/1125.

## Details

An imported 'let' or 'var' was so far added to the (logical) struct of
the module the global is part of, but this is wrong! The definition of
an imported global doesn't imply the definition of a location owned by
the NimSkull program, rather it makes an external name available with
the given name and type.

**Changes:**
- don't add globals to the module struct if they're marked with
  `sfImportc`
- introduce `symbolToPmir` for querying the PMIR/MIR kind of a symbol
  without adding it to the MIR environment (`nameNode` does this)
- change `mirgen.genLocDef` to only use `nameNode` (which registers the
  symbol with the environment) if the statement constitutes an
  assignment
- add a specification test for the new behaviour

Imported globals are now only registered with the MIR environment (and
subsequently have their definition/include emitted) when they're part
of the alive program.
---
 compiler/mir/mirgen.nim                       |  8 ++--
 compiler/mir/proto_mir.nim                    | 38 ++++++++++---------
 compiler/sem/modulelowering.nim               |  4 +-
 .../s01_interop/t05_unused_importc.nim        | 18 +++++++++
 4 files changed, 44 insertions(+), 24 deletions(-)
 create mode 100644 tests/lang/s05_pragmas/s01_interop/t05_unused_importc.nim

diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index c5cda9354e6..e7cfd342fdd 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -1243,10 +1243,10 @@ proc genLocDef(c: var TCtx, n: PNode, val: PNode) =
     s = n.sym
     hasInitializer = val.kind != nkEmpty
     sink = sfCursor notin s.flags
-    node = nameNode(c, s)
+    kind = symbolToPmir(s)
 
   c.builder.useSource(c.sp, n)
-  if node.kind == mnkGlobal and c.scopeDepth == 1:
+  if kind == pirGlobal and c.scopeDepth == 1:
     # no 'def' statement is emitted for top-level globals
     if hasInitializer:
       genAsgn(c, true, sink, n, val)
@@ -1257,7 +1257,7 @@ proc genLocDef(c: var TCtx, n: PNode, val: PNode) =
       # the location doesn't have an explicit starting value. Initialize
       # it to the type's default value.
       c.buildStmt mnkInit:
-        c.add node
+        c.add nameNode(c, s)
         c.buildMagicCall mDefault, s.typ:
           discard
     else:
@@ -1265,7 +1265,7 @@ proc genLocDef(c: var TCtx, n: PNode, val: PNode) =
       discard
   else:
     c.buildStmt (if sfCursor in s.flags: mnkDefCursor else: mnkDef):
-      c.add node
+      c.add nameNode(c, s)
       if hasInitializer:
         genAsgnSource(c, val, sink)
       else:
diff --git a/compiler/mir/proto_mir.nim b/compiler/mir/proto_mir.nim
index 2c6f30f23e2..620287bc0ef 100644
--- a/compiler/mir/proto_mir.nim
+++ b/compiler/mir/proto_mir.nim
@@ -438,6 +438,25 @@ proc wantArray(e: var seq[ProtoItem]) =
     #      without them, so we do prefer lvalue captures
     e[^1].keep = kLvalue
 
+func symbolToPmir*(s: PSym): range[pirProc..pirConst] =
+  ## Returns the proto-MIR item kind corresponding to `s`.
+  case s.kind
+  of skVar, skLet, skForVar:
+    if sfGlobal in s.flags:
+      pirGlobal
+    else:
+      pirLocal
+  of skTemp, skResult:
+    pirLocal
+  of skParam:
+    pirParam
+  of skConst:
+    pirConst
+  of skProc, skFunc, skConverter, skMethod, skIterator:
+    pirProc
+  else:
+    unreachable(s.kind)
+
 proc exprToPmir(c: TranslateCtx, result: var seq[ProtoItem], n: PNode, sink: bool) =
   ## Translates the single node `n` and recurses if it's a non-terminal. This
   ## procedure makes up the core of the AST-to-proto-MIR translation.
@@ -482,24 +501,7 @@ proc exprToPmir(c: TranslateCtx, result: var seq[ProtoItem], n: PNode, sink: boo
   of nkLambdaKinds:
     node pirProc, sym, n[namePos].sym
   of nkSym:
-    let kind: range[pirProc..pirConst] =
-      case n.sym.kind
-      of skVar, skLet, skForVar:
-        if sfGlobal in n.sym.flags:
-          pirGlobal
-        else:
-          pirLocal
-      of skTemp, skResult:
-        pirLocal
-      of skParam:
-        pirParam
-      of skConst:
-        pirConst
-      of skProc, skFunc, skConverter, skMethod, skIterator:
-        pirProc
-      else:
-        unreachable(n.sym.kind)
-
+    let kind = symbolToPmir(n.sym)
     result.add ProtoItem(orig: n, typ: n.sym.typ, kind: kind, sym: n.sym)
   of nkDerefExpr:
     wantPure(n[0])
diff --git a/compiler/sem/modulelowering.nim b/compiler/sem/modulelowering.nim
index 025c7fef8bc..694d1955586 100644
--- a/compiler/sem/modulelowering.nim
+++ b/compiler/sem/modulelowering.nim
@@ -190,8 +190,8 @@ proc registerGlobals(stmts: seq[PNode], structs: var ModuleStructs) =
   ## the module level (within the module imperative body `stmts`).
 
   proc register(structs: var ModuleStructs, s: PSym, isTopLevel: bool) {.nimcall.} =
-    if sfCompileTime in s.flags:
-      # don't register compile-time globals with the module struct
+    if {sfCompileTime, sfImportc} * s.flags != {}:
+      # don't register compile-time or imported globals with the module struct
       discard
     elif s.kind == skTemp:
       # HACK: semantic analysis sometimes produces temporaries (it does so for
diff --git a/tests/lang/s05_pragmas/s01_interop/t05_unused_importc.nim b/tests/lang/s05_pragmas/s01_interop/t05_unused_importc.nim
new file mode 100644
index 00000000000..3a830d0ba74
--- /dev/null
+++ b/tests/lang/s05_pragmas/s01_interop/t05_unused_importc.nim
@@ -0,0 +1,18 @@
+discard """
+  description: '''
+    Let and var bindings for imported entities are only included in the
+    build if they're assigned to, read from, or have their address taken,
+    within code part of the final build
+  '''
+"""
+
+var a {.importc, header: "<doesnt_exist.h>".}: int
+let b {.importc, header: "<doesnt_exist2.h>".}: int
+
+# an initial assignment (e.g.: `` = 0``) would count as a usage and result in
+# a compiler error, since the headers are non-existent
+
+proc f() =
+  # while this is a usage of `a`, `f` is not part of the final build, so
+  # `a` is not pulled in
+  a = 1

From 6a40423ffd9a8a47790b4a897382b92d0498bfe7 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sat, 17 Feb 2024 23:43:08 +0100
Subject: [PATCH 002/169] cgen: fix undefined behaviour of `openArray`
 conversions (#1197)

## Summary

When in their default empty state, both implicit and explicit
conversions from `string` and `seq` to `openArray` invoked undefined
behaviour at the C level. This is fixed now.

Fixes https://github.com/nim-works/nimskull/issues/1194.

## Details

Access of the payload pointer, which is null when the sequence is in
its default state, is now guarded by a not-null check. If the payload
pointer is null, the payload pointer is not accessed and null is used
as the data pointer value for the `openArray` tuple.

Benchmarking this change with the compiler itself showed it to have
little to no effect on execution time.
---
 compiler/backend/ccgcalls.nim | 6 ++++--
 compiler/backend/ccgexprs.nim | 4 ++--
 2 files changed, 6 insertions(+), 4 deletions(-)

diff --git a/compiler/backend/ccgcalls.nim b/compiler/backend/ccgcalls.nim
index 4a9159c9f80..1b164a61efb 100644
--- a/compiler/backend/ccgcalls.nim
+++ b/compiler/backend/ccgcalls.nim
@@ -148,10 +148,12 @@ proc genOpenArraySlice(p: BProc; q: CgNode; formalType, destType: PType): (Rope,
     if formalType.skipTypes(abstractInst).kind in {tyVar} and atyp.kind == tyString:
       linefmt(p, cpsStmts, "#nimPrepareStrMutationV2($1);$n", [byRefLoc(p, a)])
     if atyp.kind in {tyVar}:
-      result = ("($4*)(*$1)$3+($2)" % [rdLoc(a), rdLoc(b), dataField(p), dest],
+      result = ("((*$1).p != NIM_NIL ? ($4*)(*$1)$3+$2 : NIM_NIL)" %
+                  [rdLoc(a), rdLoc(b), dataField(p), dest],
                 lengthExpr)
     else:
-      result = ("($4*)$1$3+($2)" % [rdLoc(a), rdLoc(b), dataField(p), dest],
+      result = ("($1.p != NIM_NIL ? ($4*)$1$3+$2 : NIM_NIL)" %
+                  [rdLoc(a), rdLoc(b), dataField(p), dest],
                 lengthExpr)
   else:
     internalError(p.config, "openArrayLoc: " & typeToString(a.t))
diff --git a/compiler/backend/ccgexprs.nim b/compiler/backend/ccgexprs.nim
index 694fba74505..f33c570ccd1 100644
--- a/compiler/backend/ccgexprs.nim
+++ b/compiler/backend/ccgexprs.nim
@@ -129,7 +129,7 @@ proc genOpenArrayConv(p: BProc; d: TLoc; a: TLoc) =
       linefmt(p, cpsStmts, "$1.Field0 = $2; $1.Field1 = $2Len_0;$n",
         [rdLoc(d), a.rdLoc])
   of tySequence:
-    linefmt(p, cpsStmts, "$1.Field0 = $2$3; $1.Field1 = $4;$n",
+    linefmt(p, cpsStmts, "$1.Field0 = ($2.p != NIM_NIL ? $2$3 : NIM_NIL); $1.Field1 = $4;$n",
       [rdLoc(d), a.rdLoc, dataField(p), lenExpr(p, a)])
   of tyArray:
     linefmt(p, cpsStmts, "$1.Field0 = $2; $1.Field1 = $3;$n",
@@ -138,7 +138,7 @@ proc genOpenArrayConv(p: BProc; d: TLoc; a: TLoc) =
     if skipTypes(d.t, abstractInst).kind in {tyVar}:
       linefmt(p, cpsStmts, "#nimPrepareStrMutationV2($1);$n", [byRefLoc(p, a)])
 
-    linefmt(p, cpsStmts, "$1.Field0 = $2$3; $1.Field1 = $4;$n",
+    linefmt(p, cpsStmts, "$1.Field0 = ($2.p != NIM_NIL ? $2$3 : NIM_NIL); $1.Field1 = $4;$n",
       [rdLoc(d), a.rdLoc, dataField(p), lenExpr(p, a)])
   else:
     internalError(p.config, a.lode.info, "cannot handle " & $a.t.kind)

From ceab1aa75241576a52d67683be6ecc535ad374c1 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sat, 17 Feb 2024 23:43:44 +0100
Subject: [PATCH 003/169] cgen: fix undefined behaviour with object conversion 
 (#1196)

## Summary

Fix up-conversions of `nil` `ref object` or `ptr object` values
invoking undefined behaviour at the C level.

Fixes https://github.com/nim-works/nimskull/issues/1193.

## Details

Up conversions of pointers or `ref`s were translated into a
dereference + address-of sequence (e.g., `&a->Sup`), which invokes UB
if the pointer is null.

Instead, the pointer is now directly cast to the super type. According
to the C89 standard (6.5.2.1 "Structure and union specifiers"), "A
pointer to a structure object, suitably converted, points to its
initial member", so this cast is legal.
---
 compiler/backend/ccgexprs.nim | 9 +++++++--
 1 file changed, 7 insertions(+), 2 deletions(-)

diff --git a/compiler/backend/ccgexprs.nim b/compiler/backend/ccgexprs.nim
index f33c570ccd1..628bc3b1262 100644
--- a/compiler/backend/ccgexprs.nim
+++ b/compiler/backend/ccgexprs.nim
@@ -1943,10 +1943,15 @@ proc upConv(p: BProc, n: CgNode, d: var TLoc) =
                 a.storage)
     # an indirection is used:
     d.flags.incl lfIndirect
+  elif isRef:
+    # using ``&(x->Sup)`` is undefined behaviour when x is null, so the
+    # pointer has to be cast instead
+    putIntoDest(p, d, n,
+                "(($1) ($2))" % [getTypeDesc(p.module, n.typ), rdLoc(a)])
   else:
-    var r = rdLoc(a) & (if isRef: "->Sup" else: ".Sup")
+    var r = rdLoc(a) & ".Sup"
     for i in 2..inheritanceDiff(src, dest): r.add(".Sup")
-    putIntoDest(p, d, n, if isRef: "&" & r else: r, a.storage)
+    putIntoDest(p, d, n, r, a.storage)
 
 proc useConst*(m: BModule; id: ConstId) =
   let sym = m.g.env[id]

From ee40a2f816400a3aea164f6e57cf3ca1f9fffbc7 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sun, 18 Feb 2024 18:28:11 +0100
Subject: [PATCH 004/169] fix constant expressions sometimes having the wrong
 value (#1198)

## Summary

Fix a critical bug with the constant-data table, which led to, in rare
cases, constant aggregate construction expressions evaluating to the
wrong value at run-time. All backends were affected.

## Details

The `MirNode` comparison procedure of `DataTable` didn't take all
relevant fields into account, meaning that unequal `mnkObjConstr`,
`mnkConstr`, and `mnkField` were treated as equal. For example, the
comparison would result in 'true' for `Obj(a: 1)` and `Obj(b: 1)`.

This problem was hidden by the hashing procedure properly considering
all relevant `MirNode` fields; only when there were hash or bucket
collisions did the equality problem surface. All fields are taken into
account by `datatables.==` now, and the used case statement is made
exhaustive in order to prevent similar issues in the future.

Since a language-level test would be rather contrived and brittle (a
hash/bucket collision is required), a unit test for the comparison
used by `datatables` is added.
---
 compiler/mir/datatables.nim    | 11 +++--
 tests/compiler/tdatatables.nim | 87 ++++++++++++++++++++++++++++++++++
 2 files changed, 95 insertions(+), 3 deletions(-)
 create mode 100644 tests/compiler/tdatatables.nim

diff --git a/compiler/mir/datatables.nim b/compiler/mir/datatables.nim
index dc03151d1ab..e2ac06d6857 100644
--- a/compiler/mir/datatables.nim
+++ b/compiler/mir/datatables.nim
@@ -85,9 +85,14 @@ proc cmp(a, b: ConstrTree): bool =
       exprStructuralEquivalent(a.lit, b.lit)
     of mnkProc:
       a.prc == b.prc
-    else:
-      # all other nodes are equal when their kind is the same
-      true
+    of mnkConstr, mnkObjConstr:
+      a.len == b.len
+    of mnkField:
+      a.field.id == b.field.id
+    of mnkArg, mnkEnd:
+      true # same node kind -> equal nodes
+    of AllNodeKinds - ConstrTreeNodes:
+      unreachable(a.kind)
 
   if not a[0].typ.sameBackendType(b[0].typ) or a.len != b.len:
     # the (backend-)type is different -> not the same constant expressions
diff --git a/tests/compiler/tdatatables.nim b/tests/compiler/tdatatables.nim
new file mode 100644
index 00000000000..d0129b49977
--- /dev/null
+++ b/tests/compiler/tdatatables.nim
@@ -0,0 +1,87 @@
+discard """
+  description: "Tests for the compiler/mir/datatables module"
+  targets: native
+"""
+
+import compiler/ast/ast
+include compiler/mir/datatables
+
+# some placeholder types to assing to the nodes. For object types, a different
+# ID means that it's a different type
+let
+  t1 = PType(itemId: ItemId(item: 1), kind: tyObject, sons: @[PType nil])
+  t2 = PType(itemId: ItemId(item: 2), kind: tyObject, sons: @[PType nil])
+  t3 = PType(itemId: ItemId(item: 3), kind: tyObject, sons: @[PType nil])
+  field1 = PSym(itemId: ItemId(item: 1))
+  field2 = PSym(itemId: ItemId(item: 2))
+
+# node constructor
+template node(k: MirNodeKind, t: PType, field, val: untyped): MirNode =
+  MirNode(kind: k, typ: t, field: val)
+template node(k: MirNodeKind, field, val: untyped): MirNode =
+  MirNode(kind: k, field: val)
+template node(k: MirNodeKind): MirNode =
+  MirNode(kind: k)
+template literal(val: PNode): MirNode =
+  MirNode(kind: mnkLiteral, lit: val)
+
+block tree_equality:
+  # the type is only relevant for the head of the tree (the first node)
+
+  # setup a list of structurally valid and unique (in terms of equality) trees
+  let trees = @[
+    # --- literals
+    @[node(mnkLiteral, t1, lit, newIntNode(nkIntLit, 0))],
+    @[node(mnkLiteral, t2, lit, newIntNode(nkIntLit, 0))],
+    @[node(mnkLiteral, t1, lit, newStrNode(nkStrLit, ""))],
+    @[node(mnkLiteral, t1, lit, newStrNode(nkStrLit, "a"))],
+    @[node(mnkLiteral, t1, lit, newFloatNode(nkFloatLit, 0.0))],
+    # 0.0 and -0.0 are different float values
+    # FIXME: doesn't work yet
+    #@[node(mnkLiteral, t1, lit, newFloatNode(nkFloatLit, -0.0))],
+
+    # --- ordered aggregates
+    @[node(mnkConstr, t1, len, 0), node(mnkEnd)],
+    @[node(mnkConstr, t2, len, 0), node(mnkEnd)],
+    @[node(mnkConstr, t1, len, 1),
+        node(mnkArg), literal(newIntNode(nkIntLit, 0)),
+      node(mnkEnd)],
+    @[node(mnkConstr, t1, len, 2),
+        node(mnkArg), literal(newIntNode(nkIntLit, 0)), node(mnkEnd),
+        node(mnkArg), literal(newIntNode(nkIntLit, 0)), node(mnkEnd),
+      node(mnkEnd)],
+
+    # --- aggregates with fields
+    @[node(mnkObjConstr, t1, len, 0), node(mnkEnd)],
+    @[node(mnkObjConstr, t2, len, 0), node(mnkEnd)],
+    @[node(mnkObjConstr, t1, len, 1),
+        node(mnkField, field, field1),
+        node(mnkArg), literal(newIntNode(nkIntLit, 0)), node(mnkEnd),
+      node(mnkEnd)],
+    # same field value, different field:
+    @[node(mnkObjConstr, t1, len, 1),
+        node(mnkField, field, field2),
+        node(mnkArg), literal(newIntNode(nkIntLit, 0)), node(mnkEnd),
+      node(mnkEnd)],
+    @[node(mnkObjConstr, t1, len, 1),
+        node(mnkField, field, field1),
+        node(mnkArg), literal(newIntNode(nkIntLit, 0)), node(mnkEnd),
+        node(mnkField, field, field2),
+        node(mnkArg), literal(newIntNode(nkIntLit, 0)), node(mnkEnd),
+      node(mnkEnd)],
+    # swapped fields
+    @[node(mnkObjConstr, t1, len, 1),
+        node(mnkField, field, field2),
+        node(mnkArg), literal(newIntNode(nkIntLit, 0)), node(mnkEnd),
+        node(mnkField, field, field1),
+        node(mnkArg), literal(newIntNode(nkIntLit, 0)), node(mnkEnd),
+      node(mnkEnd)]
+  ]
+
+  # compare all trees with each other
+  for i in 0..<trees.len:
+    doAssert cmp(trees[i], trees[i]) # tree must be equal to itself
+    for j in (i+1)..<trees.len:
+      if cmp(trees[i], trees[j]):
+        echo "compared equal, but shouldn't: ", i, " vs. ", j
+        doAssert false

From 94837f4ca9c6b01c12ba4ae57986390b95fe887d Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Mon, 19 Feb 2024 00:01:49 +0100
Subject: [PATCH 005/169] rework the MIR (part 2) (#1195)

## Summary

This introduces the `copy`, `move`, and `sink` *assignment modifiers*,
which make it explicit where and how ownership is transferred with
assignments. An assignment with an lvalue expression as the source
operand and no modifier is a *shallow copy*, replacing the need for
`fastAsgn`. Previously, the exact semantics of an assignment were an
implicit property of every assignment.

Besides slightly simplifying the `injectdestructors` pass and data-flow
graph construction, the semantics of assignments being properly encoded
in the MIR is a pre-requisite for many MIR-based optimization passes.
More generally, it's a significant step towards decoupling value
ownership semantics from lifetime hooks.

Semantics of existing code don't (intentionally) change, this is an
internal-only rework.

## Details

### MIR

* the `mnkCopy`, `mnkMove`, and `mnkSink` nodes are added, representing
  the modifiers. Syntax-wise, they may only appear directly in
  assignment source slots
* the `mnkFastAsgn` node is obsolete and removed
* `copy` and `move` assignments are *final*. That is, a `copy`
  assignment cannot become a `move` assignment, and the inverse is also
  not possible
* only `sink` assignments are non-final. Collapsing them into either a
  `copy` or `move` assignment is the focus of the move analyzer

### AST-to-MIR Translation

`mirgen` performs the initial placement of assignment modifiers, using a
proto-MIR-based analysis. The decision-making works as follows:
1. when the destination is owning (i.e., all non-`.cursor` locals/
   globals/fields):
	1. if a non-destructive move is definitely possible, `move` is used
	2. if a move is never possible (e.g., because the source is a
     cursor), `copy` is used
	3. if whether a move is possible depends on a data-flow analysis,
     `sink` is used
	4. if a destructive move is possible, `sink` is used
	5. if the source expression is an rvalue expression returning an
     owning value (e.g., a call, a construction, etc.), and the
     assignment is an initial assignment, an in-place assignment is
     used
	6. for types with custom copy/sink/destroy behaviour, and non-initial
     assignments, the rvalue is first assigned to a temporary and then
     `move`d into the destination
2. when the destination is non-owning, no modifier is used

Except for rule 1.6, placement of the modifiers is independent of
whether lifetime hooks are involved.

In addition, all rvalue expressions (except for `cast`) are now treated
as returning *owning* values. What this means, in effect, is that
temporaries now properly use `def` instead of `def_cursor`. At the
moment, whether `def` or `def_cursor` is used for non-lifetime-hook
using types has no practical effect, but the new behaviour is
technically correct, while the previous one was not.

### Move Analyzer

Operation of the move analyzer changes slightly: instead of looking for
all `opConsume` data-flow instructions, it only looks for those
corresponding to `sink` assignments. Since whether a move or copy is
used is only relevant for lifetime-hook-using types, the `isLastRead`
analysis continues to only be performed for assignments of those types.

Compared to before, the DFG is now updated with the move analyzer
results, removing the need to pass them to each of the following
analysis routines.

### Assignment Rewriting

Rewriting of assignments now only looks for assignments with modifiers,
all assignments without a modifier are ignored. `move`s are exclusively
turned into `=sink` calls (never destructive moves), `copy`s into
`=copy`. `sink` is either turned into a copy, move, or destructive
move. Only the implementation is different, effective program behaviour
doesn't change.

### MIR-to-CGIR Translation

* `move` assignments and *shallow copy* assignments are translated to
  `cnkFastAsgn`
* all other assignments translate to `cnkAsgn`
* the small optimization preventing definitions being moved to the
  start of their scope is expanded to also apply to `def`s of
  temporaries without lifetime hooks, now that `def` is used for
  temporaries more often

---------

Co-authored-by: Saem Ghani <saemghani+github@gmail.com>
---
 compiler/backend/backends.nim              |  16 +-
 compiler/backend/cgirgen.nim               |  36 ++-
 compiler/mir/analysis.nim                  |  44 ++--
 compiler/mir/mirconstr.nim                 |  18 +-
 compiler/mir/mirgen.nim                    | 123 +++++++---
 compiler/mir/mirpasses.nim                 |  12 +-
 compiler/mir/mirtrees.nim                  |  25 +-
 compiler/mir/proto_mir.nim                 | 154 ++++++++++---
 compiler/mir/utils.nim                     |  15 +-
 compiler/sem/injectdestructors.nim         | 253 ++++++++++-----------
 compiler/sem/mirexec.nim                   |  48 ++--
 doc/mir.rst                                |  23 +-
 tests/arc/topt_cursor.nim                  |   8 +-
 tests/arc/topt_no_cursor.nim               |  80 +++----
 tests/arc/topt_refcursors.nim              |  16 +-
 tests/arc/topt_wasmoved_destroy_pairs.nim  |  25 +-
 tests/lang_objects/destructor/tv2_cast.nim |  20 +-
 tests/misc/tdont_fold_procedure_cast.nim   |   7 +-
 18 files changed, 559 insertions(+), 364 deletions(-)

diff --git a/compiler/backend/backends.nim b/compiler/backend/backends.nim
index 58e79f8143e..a2e48ec4b28 100644
--- a/compiler/backend/backends.nim
+++ b/compiler/backend/backends.nim
@@ -401,21 +401,7 @@ proc produceFragmentsForGlobals(
       let global = env.globals.add(s)
       # generate the MIR code for an initializing assignment:
       prepare(init, result.init.source, graph.emptyNode)
-      init.setSource(result.init.source.add(it))
-      init.buildStmt mnkInit:
-        init.setSource(result.init.source.add(it[0]))
-        init.use toValue(global, s.typ)
-        init.setSource(result.init.source.add(it[2]))
-        if it[2].kind == nkEmpty:
-          # no explicit initializer expression means that the default value
-          # should be used
-          # XXX: ^^ it'd make sense to instead let semantic analysis ensure
-          #      this (i.e. by placing a ``default(T)`` in the initializer
-          #      slot)
-          init.buildMagicCall mDefault, s.typ:
-            discard
-        else:
-          generateCode(graph, env, config, it[2], init, result.init.source)
+      generateAssignment(graph, env, config, it, init, result.init.source)
 
       # if the global requires one, emit a destructor call into the deinit
       # fragment:
diff --git a/compiler/backend/cgirgen.nim b/compiler/backend/cgirgen.nim
index ac01da15cae..96b31615263 100644
--- a/compiler/backend/cgirgen.nim
+++ b/compiler/backend/cgirgen.nim
@@ -473,6 +473,29 @@ proc callToIr(tree: MirBody, cl: var TranslateCl, n: MirNode,
 
 proc exprToIr(tree: MirBody, cl: var TranslateCl, cr: var TreeCursor): CgNode
 
+proc sourceExprToIr(tree: MirBody, cl: var TranslateCl,
+                    cr: var TreeCursor): tuple[n: CgNode, useFast: bool] =
+  ## Translates the MIR expression appearing in an assignment's source
+  ## slot. Assignment modifiers are dropped, and whether a fast assignment or
+  ## normal assignment should be used is computed and returned.
+  case tree[cr].kind
+  of mnkCopy, mnkSink:
+    # requires a full assignment
+    discard enter(tree, cr)
+    result = (valueToIr(tree, cl, cr), false)
+    leave(tree, cr)
+  of mnkMove:
+    # an ``x = move y`` assignment can be turned into a fast assignment
+    discard enter(tree, cr)
+    result = (valueToIr(tree, cl, cr), true)
+    leave(tree, cr)
+  of LvalueExprKinds:
+    # a fast assignment is correct for all raw lvalues
+    result = (lvalueToIr(tree, cl, cr), true)
+  else:
+    # rvalue expressions require a full assignment
+    result = (exprToIr(tree, cl, cr), false)
+
 proc defToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
            n: MirNode, cr: var TreeCursor): CgNode =
   ## Translates a 'def'-like construct
@@ -531,13 +554,14 @@ proc defToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
       # don't use the field interperation for variant access
       lvalueToIr(tree, cl, cr, preferField=false)
     else:
-      exprToIr(tree, cl, cr)
+      sourceExprToIr(tree, cl, cr)[0]
   leave(tree, cr)
   if n.kind in {mnkBind, mnkBindMut} and arg.typ.kind notin {tyVar, tyLent}:
     # wrap the operand in an address-of operation
     arg = newOp(cnkHiddenAddr, info, def.typ, arg)
 
   let isLet = (entity.kind == mnkTemp and n.kind == mnkDefCursor) or
+              (entity.kind == mnkTemp and not hasDestructor(def.typ)) or
               (entity.kind == mnkAlias)
   # to reduce the pressure on the code generator, locals that never cross
   # structured control-flow boundaries are not lifted. As a temporary
@@ -634,9 +658,10 @@ proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
   of DefNodes:
     defToIr(tree, env, cl, n, cr)
   of mnkAsgn, mnkInit, mnkSwitch:
-    to cnkAsgn, lvalueToIr(tree, cl, cr), exprToIr(tree, cl, cr)
-  of mnkFastAsgn:
-    to cnkFastAsgn, lvalueToIr(tree, cl, cr), exprToIr(tree, cl, cr)
+    let
+      dst = lvalueToIr(tree, cl, cr)
+      (src, useFast) = sourceExprToIr(tree, cl, cr)
+    to (if useFast: cnkFastAsgn else: cnkAsgn), dst, src
   of mnkRepeat:
     to cnkRepeatStmt, body()
   of mnkBlock:
@@ -810,6 +835,9 @@ proc exprToIr(tree: MirBody, cl: var TranslateCl,
                  mnkMul: cnkMul, mnkDiv: cnkDiv, mnkModI: cnkModI]
     treeOp Map[n.kind]:
       res.kids = @[valueToIr(tree, cl, cr), valueToIr(tree, cl, cr)]
+  of mnkCopy, mnkMove, mnkSink:
+    # translation of assignments needs to handle all modifiers
+    unreachable("loose assignment modifier")
   of AllNodeKinds - ExprKinds - {mnkNone}:
     unreachable(n.kind)
 
diff --git a/compiler/mir/analysis.nim b/compiler/mir/analysis.nim
index 4b32ff61d4d..eec14495a53 100644
--- a/compiler/mir/analysis.nim
+++ b/compiler/mir/analysis.nim
@@ -9,10 +9,6 @@
 ## not. This means that run-time aliasing (e.g., through pointers) is **not**
 ## considered.
 ##
-## Analysis routine related to liveness take an additional ``Values``
-## instance as input, for knowing about what operation to collapse an
-## ``opConsume`` to.
-##
 ## When a "before" or "after" relationship is mentioned in the context of
 ## operations, it doesn't refer to the relative memory location of the
 ## nodes representing the operations, but rather to the operations'
@@ -53,7 +49,7 @@ type
     alive
 
   ComputeAliveProc[T] =
-    proc(tree: MirTree, values: Values, loc: T, op: Opcode,
+    proc(tree: MirTree, loc: T, op: Opcode,
          n: OpValue): AliveState {.nimcall, noSideEffect.}
 
 func skipConversions*(tree: MirTree, val: OpValue): OpValue =
@@ -68,7 +64,7 @@ func isOwned*(v: Values, val: OpValue): bool {.inline.} =
 func markOwned*(v: var Values, val: OpValue) {.inline.} =
   v.owned.incl val
 
-func isAlive*(tree: MirTree, cfg: DataFlowGraph, v: Values,
+func isAlive*(tree: MirTree, cfg: DataFlowGraph,
              span: Subgraph, loc: Path, start: InstrPos): bool =
   ## Computes whether the location named by `loc` does contain a value (i.e.,
   ## is alive) when the data-flow operation at `start` is reached (but not
@@ -99,10 +95,16 @@ func isAlive*(tree: MirTree, cfg: DataFlowGraph, v: Values,
         # return already
         return true
 
-    of opKill:
+    of opKill, opConsume:
       if isPartOf(tree, loc, path n) == yes:
+        # the location's value is consumed or the location is killed. No
+        # operation coming before the current one can change that, so we can
+        # stop traversing the current path
         exit = true
 
+      # partially consuming the value, or killing the location, does *not*
+      # change the alive state
+
     of opInvalidate:
       discard
 
@@ -112,16 +114,6 @@ func isAlive*(tree: MirTree, cfg: DataFlowGraph, v: Values,
         # derived from a global -> assume the analysed global is mutated
         return true
 
-    of opConsume:
-      if v.isOwned(n):
-        if isPartOf(tree, loc, path n) == yes:
-          # the location's value is consumed and it becomes empty. No operation
-          # coming before the current one can change that, so we can stop
-          # traversing the current path
-          exit = true
-
-        # partially consuming the location does *not* change the alive state
-
     of opUse:
       discard "not relevant"
 
@@ -226,7 +218,7 @@ func isLastWrite*(tree: MirTree, cfg: DataFlowGraph, span: Subgraph, loc: Path,
   result = (true, state.exit, state.escapes)
 
 func computeAliveOp*[T: PSym | GlobalId | TempId](
-  tree: MirTree, values: Values, loc: T, op: Opcode, n: OpValue): AliveState =
+  tree: MirTree, loc: T, op: Opcode, n: OpValue): AliveState =
   ## Computes the state of `loc` at the *end* of the given operation. The
   ## operands are expected to *not* alias with each other. The analysis
   ## result will be wrong if they do
@@ -253,9 +245,10 @@ func computeAliveOp*[T: PSym | GlobalId | TempId](
       # the analysed location or one derived from it is mutated
       return alive
 
-  of opKill:
+  of opKill, opConsume:
     if sameLocation(n):
-      # the location is killed
+      # the location is killed or its value is consumed (i.e., moved somewhere
+      # else)
       return dead
 
   of opInvalidate:
@@ -266,15 +259,10 @@ func computeAliveOp*[T: PSym | GlobalId | TempId](
       # the operation mutates global state and we're analysing a global
       result = alive
 
-  of opConsume:
-    if values.isOwned(n) and sameLocation(n):
-      # the location's value is consumed
-      result = dead
-
   else:
     discard
 
-func computeAlive*[T](tree: MirTree, cfg: DataFlowGraph, values: Values,
+func computeAlive*[T](tree: MirTree, cfg: DataFlowGraph,
                       span: Subgraph, loc: T, op: static ComputeAliveProc[T]
                      ): tuple[alive, escapes: bool] =
   ## Computes whether the location is alive when `span` is exited via either
@@ -287,7 +275,7 @@ func computeAlive*[T](tree: MirTree, cfg: DataFlowGraph, values: Values,
 
   var exit = false
   for opc, n in traverseFromExits(cfg, span, exit):
-    case op(tree, values, loc, opc, n)
+    case op(tree, loc, opc, n)
     of dead:
       exit = true
     of alive:
@@ -299,7 +287,7 @@ func computeAlive*[T](tree: MirTree, cfg: DataFlowGraph, values: Values,
 
   # check if the location is alive at the structured exit of the span
   for opc, n in traverseReverse(cfg, span, span.b + 1, exit):
-    case op(tree, values, loc, opc, n)
+    case op(tree, loc, opc, n)
     of dead:
       exit = true
     of alive:
diff --git a/compiler/mir/mirconstr.nim b/compiler/mir/mirconstr.nim
index 5b00531336d..e7db1ec85fa 100644
--- a/compiler/mir/mirconstr.nim
+++ b/compiler/mir/mirconstr.nim
@@ -357,12 +357,23 @@ func emitByName*(bu: var MirBuilder, val: Value, e: EffectKind) =
     bu.subTree MirNode(kind: mnkTag, effect: e):
       bu.use val
 
+func move*(bu: var MirBuilder, val: Value) =
+  ## Emits ``move val``.
+  bu.subTree MirNode(kind: mnkMove, typ: val.typ):
+    bu.use val
+
 func asgn*(buf: var MirBuilder, a, b: Value) =
-  ## Emits an assignment of `b` to `a`.
+  ## Emits a shallow assignment: ``a = b``.
   buf.subTree MirNode(kind: mnkAsgn):
     buf.use a
     buf.use b
 
+func asgnMove*(bu: var MirBuilder, a, b: Value) =
+  ## Emits a move assignment: ``a = move b``.
+  bu.subTree mnkAsgn:
+    bu.use a
+    bu.move b
+
 func inline*(bu: var MirBuilder, tree: MirTree, fr: NodePosition): Value =
   ## Inlines the operand for non-mutating use. This is meant to be used for
   ## materialzing immutable arguments when inlining calls / expanding
@@ -415,6 +426,11 @@ func materialize*(bu: var MirBuilder, loc: Value): Value =
     bu.use result
     bu.use loc
 
+func materializeMove*(bu: var MirBuilder, loc: Value): Value =
+  ## Emits a new owning temporary that's initialized with the moved-from `loc`.
+  bu.wrapTemp loc.typ:
+    bu.move loc
+
 func finish*(bu: sink MirBuilder): MirTree =
   ## Consumes `bu` and returns the finished tree.
   if bu.swapped:
diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index e7cfd342fdd..3a1666de2e4 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -833,7 +833,7 @@ proc genMagic(c: var TCtx, n: PNode; m: TMagic) =
   of mAnd, mOr:
     let tmp = getTemp(c, n.typ)
     withFront c.builder:
-      genAndOr(c, n, Destination(isSome: true, val: tmp))
+      genAndOr(c, n, Destination(isSome: true, val: tmp, flags: {dfOwns}))
     c.use tmp
   of mDefault:
     # use the canonical form:
@@ -1134,8 +1134,11 @@ proc genObjConstr(c: var TCtx, n: PNode, isConsume: bool) =
 proc genRaise(c: var TCtx, n: PNode) =
   assert n.kind == nkRaiseStmt
   if n[0].kind != nkEmpty:
-    let tmp = c.wrapTemp n[0].typ:
-      genx(c, n[0], consume=true)
+    # the raise operand slot is a sink context, and it behaves much like a
+    # ``sink`` parameter
+    var e = exprToPmir(c, n[0], true, false)
+    wantConsumeable(e)
+    let tmp = toValue(c, e, e.high)
 
     # emit the preparation code:
     let
@@ -1166,26 +1169,35 @@ proc genReturn(c: var TCtx, n: PNode) =
 
   c.add MirNode(kind: mnkReturn)
 
-proc genAsgnSource(c: var TCtx, e: PNode, sink: bool) =
+proc genAsgnSource(c: var TCtx, e: PNode, status: set[DestFlag]) =
   ## Generates the MIR code for the right-hand side of an assignment.
-  ## The value is captured in a temporary if necessary for proper
-  ## destruction.
-  var e = exprToPmir(c, e, sink, false)
-  if not sink:
+  ## `status` provides the information necessary to decide what assignment
+  ## modifiers to use and whether a temporary is required.
+  ##
+  ## If not an initial assignment, and lifetime hooks are present, a temporary
+  ## is introduced for rvalue expressions that return owning values:
+  ##
+  ##   def _1 = get()
+  ##   dest = move _1
+  ##
+  ## This is necessary for the later hook injection, which triggers on
+  ## assignment modifiers, to work.
+  var e = exprToPmir(c, e, dfOwns in status, false)
+  if dfOwns in status:
+    wantOwning(e, dfEmpty notin status and hasDestructor(e.typ))
+  else:
     wantShallow(e)
+
   genx(c, e, e.high)
 
 proc genAsgn(c: var TCtx, dest: Destination, rhs: PNode) =
   assert dest.isSome
-  let owns = dfOwns in dest.flags
   let kind =
-    if owns:
-      if dfEmpty in dest.flags: mnkInit
-      else:                     mnkAsgn
-    else:                       mnkFastAsgn
+    if dfEmpty in dest.flags: mnkInit
+    else:                     mnkAsgn
   c.buildStmt kind:
     c.use dest.val
-    c.genAsgnSource(rhs, sink = owns)
+    c.genAsgnSource(rhs, dest.flags)
 
 proc unwrap(c: var TCtx, n: PNode): PNode =
   ## If `n` is a statement-list expression, generates the code for all
@@ -1215,7 +1227,7 @@ proc genAsgn(c: var TCtx, isFirst, sink: bool, lhs, rhs: PNode) =
     sink = sink and not isCursor(lhs)
 
   case rhs.kind
-  of ComplexExprs, nkStmtListExpr:
+  of ComplexExprs:
     # optimization: forward the destination. For example:
     #   x = if cond: a else: b
     # becomes:
@@ -1225,16 +1237,20 @@ proc genAsgn(c: var TCtx, isFirst, sink: bool, lhs, rhs: PNode) =
     genWithDest(c, rhs, initDestination(dest, isFirst, sink))
   else:
     let kind =
-      if sink:
-        if isFirst: mnkInit
-        else:       mnkAsgn
-      else:         mnkFastAsgn
+      if isFirst: mnkInit
+      else:       mnkAsgn
+
+    var status: set[DestFlag]
+    if sink:
+      status.incl dfOwns
+    if isFirst:
+      status.incl dfEmpty
 
     c.buildStmt kind:
       # ``genLvalueOperand`` ensures that unstable lvalue
       # expressions are captured
       genLvalueOperand(c, lhs, true)
-      genAsgnSource(c, rhs, sink)
+      genAsgnSource(c, rhs, status)
 
 proc genLocDef(c: var TCtx, n: PNode, val: PNode) =
   ## Generates the 'def' construct for the entity provided by the symbol node
@@ -1267,7 +1283,9 @@ proc genLocDef(c: var TCtx, n: PNode, val: PNode) =
     c.buildStmt (if sfCursor in s.flags: mnkDefCursor else: mnkDef):
       c.add nameNode(c, s)
       if hasInitializer:
-        genAsgnSource(c, val, sink)
+        genAsgnSource(c, val):
+          if sink: {dfEmpty, dfOwns}
+          else:    {dfEmpty}
       else:
         c.add MirNode(kind: mnkNone)
 
@@ -1319,7 +1337,8 @@ proc genVarTuple(c: var TCtx, n: PNode) =
     let val = c.allocTemp(initExpr.typ)
     c.buildStmt mnkDefUnpack:
       c.use val
-      genx(c, initExpr, consume = true)
+      # ensure that the temporary owns the tuple value:
+      genAsgnSource(c, initExpr, {dfEmpty, dfOwns})
 
     # generate the unpack logic:
     for i in 0..<numDefs:
@@ -1331,9 +1350,14 @@ proc genVarTuple(c: var TCtx, n: PNode) =
       # generate the assignment:
       c.buildStmt (if isInit: mnkInit else: mnkAsgn):
         genOperand(c, lhs)
-        c.subTree MirNode(kind: mnkPathPos, typ: lhs.typ,
-                          position: i.uint32):
-          c.use val
+        # the temporary tuple is ensured to own (see the emission of the
+        # definition above), and it's only used for unpacking; it can always be
+        # moved out of. The temporary tuple is not destroyed, so no
+        # destructive move is required
+        c.buildTree mnkMove, lhs.typ:
+          c.subTree MirNode(kind: mnkPathPos, typ: lhs.typ,
+                            position: i.uint32):
+            c.use val
 
 proc genVarSection(c: var TCtx, n: PNode) =
   for a in n:
@@ -1352,12 +1376,21 @@ proc genVarSection(c: var TCtx, n: PNode) =
         let isInit = c.inLoop == 0
         if a[2].kind != nkEmpty:
           genAsgn(c, isInit, true, a[0], a[2])
-        else:
-          # no intializer expression -> assign the default value
-          c.buildStmt (if isInit: mnkInit else: mnkAsgn):
+        elif isInit or not hasDestructor(a[0].typ):
+          # the default value can be assigned in-place
+          c.buildStmt mnkInit:
             genOperand(c, a[0])
             c.buildMagicCall mDefault, a[0].typ:
               discard
+        else:
+          # a 'move' modifier is required for the assignment to later be
+          # rewritten
+          c.buildStmt mnkAsgn:
+            genOperand(c, a[0])
+            c.buildTree mnkMove, a[0].typ:
+              c.wrapAndUse a[0].typ:
+                c.buildMagicCall mDefault, a[0].typ:
+                  discard
       else:
         unreachable()
 
@@ -1778,6 +1811,18 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
         Destination(isSome: true, val: tmp, flags: {dfOwns, dfEmpty})
 
     c.use tmp
+  of pirCopy:
+    c.buildOp mnkCopy, n.typ:
+      recurse()
+  of pirMove:
+    c.buildOp mnkMove, n.typ:
+      recurse()
+  of pirSink, pirDestructiveMove:
+    # a destructive move is currently not translated into a move + wasMoved,
+    # but rather into a sink, which is then, if necessary, later turned into
+    # a destructive move
+    c.buildOp mnkSink, n.typ:
+      recurse()
   of pirMat, pirMatCursor:
     let f = c.builder.push: recurse()
     # only materialize a temporary if the expression is not already a
@@ -1858,7 +1903,7 @@ proc gen(c: var TCtx, n: PNode) =
                           field: dest[^1].field):
           genx(c, dest, dest.len - 2)
 
-        genAsgnSource(c, n[1], false) # the source operand
+        genAsgnSource(c, n[1], {dfOwns}) # the source operand
     else:
       # a normal assignment
       genAsgn(c, false, true, n[0], n[1])
@@ -1958,6 +2003,26 @@ proc genWithDest(c: var TCtx, n: PNode; dest: Destination) =
   else:
     gen(c, n)
 
+proc generateAssignment*(graph: ModuleGraph, env: var MirEnv,
+                   config: TranslationConfig, n: PNode,
+                   builder: var MirBuilder, source: var SourceMap) =
+  ## Translates an `nkIdentDefs` AST into MIR and emits the result into
+  ## `builder`'s currently selected buffer.
+  assert n.kind == nkIdentDefs and n.len == 3
+  var c = TCtx(context: skUnknown, graph: graph, config: config)
+  # treat the code as top-level code so that no 'def' is generated for
+  # assignments to globals
+  c.scopeDepth = 1
+
+  template swapState() =
+    swap(c.sp.map, source)
+    swap(c.builder, builder)
+    swap(c.env, env)
+
+  swapState()
+  genLocInit(c, n[0], n[2])
+  swapState()
+
 proc generateCode*(graph: ModuleGraph, env: var MirEnv,
                    config: TranslationConfig, n: PNode,
                    builder: var MirBuilder, source: var SourceMap) =
diff --git a/compiler/mir/mirpasses.nim b/compiler/mir/mirpasses.nim
index 95caec3a114..02c01e6e805 100644
--- a/compiler/mir/mirpasses.nim
+++ b/compiler/mir/mirpasses.nim
@@ -110,7 +110,7 @@ proc preventRvo(tree: MirTree, changes: var Changeset) =
   # we don't need to consider defs or initializing assignments (``mnkInit``)
   # here, because there it is guaranteed that the destination does not appear
   # anywhere in the source expression
-  for i in search(tree, {mnkFastAsgn, mnkAsgn}):
+  for i in search(tree, {mnkAsgn}):
     let source = tree.operand(i, 1)
     if tree[source].kind notin CallKinds or tree[source, 0].kind == mnkMagic or
        not eligibleForRvo(tree[source].typ):
@@ -159,9 +159,9 @@ proc preventRvo(tree: MirTree, changes: var Changeset) =
         tmp = bu.allocTemp(tree[source].typ)
         bu.use tmp
       changes.insert(tree, tree.sibling(i), i, bu):
-        bu.subTree tree[i].kind:
+        bu.subTree mnkAsgn:
           bu.emitFrom(tree, pos)
-          bu.use tmp
+          bu.move tmp
 
 proc lowerSwap(tree: MirTree, changes: var Changeset) =
   ## Lowers a ``swap(a, b)`` call into:
@@ -180,10 +180,10 @@ proc lowerSwap(tree: MirTree, changes: var Changeset) =
       let
         a = bu.bindMut(tree, NodePosition tree.argument(i, 0))
         b = bu.bindMut(tree, NodePosition tree.argument(i, 1))
-        temp = bu.materialize(a)
+        temp = bu.materializeMove(a)
       # we're just swapping the values, no full copy is needed
-      bu.asgn a, b
-      bu.asgn b, temp
+      bu.asgnMove a, b
+      bu.asgnMove b, temp
 
 proc eliminateTemporaries(tree: MirTree, changes: var Changeset) =
   ## Where safe (i.e., observable program behaviour does not change), elides
diff --git a/compiler/mir/mirtrees.nim b/compiler/mir/mirtrees.nim
index dafa8dd0078..d29892ae298 100644
--- a/compiler/mir/mirtrees.nim
+++ b/compiler/mir/mirtrees.nim
@@ -97,9 +97,6 @@ type
     mnkBindMut   ## introduces an alias that may be used for read/write access
                  ## and assignments. The source expression must not be empty
 
-    mnkFastAsgn ## assignment that cannot be rewritten into copy, move, or
-                ## hook call
-    # future direction: same as with DefCursor, remove FastAsgn
     mnkAsgn     ## normal assignment; the destination might store a value
                 ## already. Whether the source is copied or moved depends
                 ## on the expression
@@ -185,6 +182,17 @@ type
                   ## ``ref`` to it, or or constructs a new aggregate value
                   ## with named fields
 
+    mnkCopy   ## denotes the assignment as copying the source value
+    mnkMove   ## denotes the assignment as moving the value. This does
+              ## not imply a physical change to the source location
+    mnkSink   ## collapses into one of the following:
+              ## - a copy (`mnkCopy`)
+              ## - a non-destructive move (`mnkMove`)
+              ## - a destructive move
+              ##
+              ## Collapsing ``mnkSink`` is the responsibility of the move
+              ## analyzer.
+
     mnkArg    ## when used in a call: denotes an argument that may either be
               ## passed by value or by name. Evaluation order is unspecified
               ## when used in a construction: denotes a value that is copied
@@ -330,12 +338,17 @@ const
   SingleOperandNodes* = {mnkPathNamed, mnkPathPos, mnkPathVariant, mnkPathConv,
                          mnkAddr, mnkDeref, mnkView, mnkDerefView, mnkStdConv,
                          mnkConv, mnkCast, mnkRaise, mnkTag, mnkArg,
-                         mnkName, mnkConsume, mnkVoid}
+                         mnkName, mnkConsume, mnkVoid, mnkCopy, mnkMove,
+                         mnkSink}
     ## Nodes that start sub-trees but that always have a single sub node.
 
   ArgumentNodes* = {mnkArg, mnkName, mnkConsume}
     ## Nodes only allowed in argument contexts.
 
+  ModifierNodes* = {mnkCopy, mnkMove, mnkSink}
+    ## Assignment modifiers. Nodes that can only appear directly in the source
+    ## slot of assignments.
+
   SymbolLike* = {mnkParam, mnkLocal}
     ## Nodes for which the `sym` field is available
 
@@ -350,7 +363,7 @@ const
 
   StmtNodes* = {mnkScope, mnkStmtList, mnkIf, mnkCase, mnkRepeat, mnkTry,
                 mnkBlock, mnkBreak, mnkReturn, mnkRaise, mnkPNode, mnkInit,
-                mnkAsgn, mnkSwitch, mnkFastAsgn, mnkVoid, mnkRaise, mnkEmit,
+                mnkAsgn, mnkSwitch, mnkVoid, mnkRaise, mnkEmit,
                 mnkAsm} + DefNodes
 
   UnaryOps*  = {mnkNeg}
@@ -365,7 +378,7 @@ const
                       mnkCast, mnkAddr, mnkView, mnkToSlice} + UnaryOps +
                      BinaryOps
   ExprKinds* =       {mnkCall, mnkCheckedCall, mnkConstr, mnkObjConstr} +
-                     LvalueExprKinds + RvalueExprKinds
+                     LvalueExprKinds + RvalueExprKinds + ModifierNodes
 
   CallKinds* = {mnkCall, mnkCheckedCall}
 
diff --git a/compiler/mir/proto_mir.nim b/compiler/mir/proto_mir.nim
index 620287bc0ef..43337a79b23 100644
--- a/compiler/mir/proto_mir.nim
+++ b/compiler/mir/proto_mir.nim
@@ -70,6 +70,13 @@ type
 
     pirStmtList # usually skipped
 
+    # --- ownership operations
+
+    pirCopy
+    pirMove
+    pirDestructiveMove # move + wasMoved
+    pirSink
+
     # --- constructors
 
     pirClosureConstr
@@ -180,9 +187,6 @@ func typ*(n: seq[ProtoItem]): PType {.inline.} =
 
 func classify*(e: seq[ProtoItem], i: int): ExprKind =
   ## Returns the kind of the given proto-MIR expression.
-  # XXX: ownership is unrelated to whether a type has custom copy/sink/
-  #      destruction logic. Taking the latter into consideration is an
-  #      optimization that needs to eventually be removed
   case e[i].kind
   of pirLiteral, pirProc:
     Literal
@@ -191,22 +195,20 @@ func classify*(e: seq[ProtoItem], i: int): ExprKind =
     # constant expression are later turned into anonymous constants, so
     # they're lvalues too
     Lvalue
-  of pirCall, pirComplex, pirStringToCString, pirCStringToString:
-    if hasDestructor(e[i].typ):
-      OwnedRvalue
-    else:
-      Rvalue
+  of pirCall, pirComplex, pirSetConstr, pirAddr, pirView, pirToSlice,
+     pirToSubSlice, pirStringToCString, pirCStringToString,
+     pirConv, pirStdConv, pirChckRange:
+    OwnedRvalue
   of pirObjConstr, pirTupleConstr, pirClosureConstr, pirArrayConstr:
-    if e[i].owning and hasDestructor(e[i].typ):
+    if e[i].owning:
       OwnedRvalue
     else:
       Rvalue
   of pirRefConstr:
     OwnedRvalue
-  of pirSetConstr, pirAddr, pirView, pirCast, pirConv, pirStdConv,
-     pirChckRange, pirToSlice, pirToSubSlice:
+  of pirCast:
     Rvalue
-  of pirMat:
+  of pirMat, pirCopy, pirMove, pirDestructiveMove, pirSink:
     OwnedRvalue
   of pirMatCursor:
     Rvalue
@@ -247,6 +249,9 @@ func isPure(e: seq[ProtoItem], n: int): bool =
   of pirMat, pirMatCursor:
     # the materialized-into temporary is never assigned to
     true
+  of pirCopy, pirMove, pirDestructiveMove, pirSink:
+    # always produce an owning value
+    true
   of pirDeref, pirViewDeref:
     # the pointer destination could change (unless it's an immutable view)
     false
@@ -286,15 +291,107 @@ func isStable(e: seq[ProtoItem], n: int): bool =
   else:
     unreachable(e[n].kind)
 
+func ownershipOp(e: seq[ProtoItem], i: int): ProtoItemKind =
+  ## Infers and returns the best fitting operation to retrieve an owning
+  ## value from the given *lvalue*.
+  func decayMove(kind: ProtoItemKind): ProtoItemKind {.inline.} =
+    # moving from a projection requires a destructive move, since the source
+    # location needs to be destroyed after (in order to free the non-moved
+    # parts)
+    case kind
+    of pirMove: pirDestructiveMove
+    else:       kind
+
+  case e[i].kind
+  of pirParam:
+    if e[i].typ.kind == tySink:
+      pirSink
+    else:
+      pirCopy
+  of pirLocal, pirGlobal:
+    if sfCursor in e[i].sym.flags:
+      pirCopy # cursors can only be copied from
+    else:
+      pirSink # moveability depends on data flow
+  of pirConst, pirConstExpr, pirLiteral:
+    pirCopy
+  of pirFieldAccess:
+    if sfCursor in e[i].field.flags:
+      pirCopy # non-owning fields can only be copied from
+    else:
+      decayMove ownershipOp(e, i - 1)
+  of pirTupleAccess, pirArrayAccess, pirVariantAccess, pirSeqAccess:
+    decayMove ownershipOp(e, i - 1)
+  of pirLvalueConv:
+    # it's still the whole location that would be consumed, so no destructive
+    # move is required
+    ownershipOp(e, i - 1)
+  of pirCheckedArrayAccess, pirCheckedSeqAccess, pirCheckedVariantAccess,
+     pirCheckedObjConv:
+    decayMove ownershipOp(e, i - 1)
+  of pirDeref, pirViewDeref:
+    # pointers and views are currently not tracked, so their targets can only
+    # be copied from
+    pirCopy
+  of pirMat:
+    pirMove
+  of pirMatCursor:
+    pirCopy
+  of pirStmtList, pirMatLvalue:
+    ownershipOp(e, i - 1)
+  else:
+    # cannot be part of an lvalue expression sequence
+    unreachable(e[i].kind)
+
+func wantOwning*(e: var seq[ProtoItem], forceTemp: bool) =
+  ## Makes sure `e` produces an owning value. If `forceTemp` is true, a
+  ## temporary is materialized even if the expression would already produce
+  ## an owning value.
+  case classify(e, e.high)
+  of Rvalue:
+    # rvalue expressions cannot be copied from directly
+    if e[^1].kind != pirMatCursor:
+      e.add pirMatCursor
+    e.add pirCopy
+  of OwnedRvalue:
+    var i = e.high
+    while e[i].kind == pirStmtList:
+      dec i
+    case e[i].kind
+    of pirMat:
+      e.add pirMove
+    of pirComplex:
+      # watch out! try-finally expressions can have exceptional control-flow
+      # that forces the destination temporary to have to be destroyed in a
+      # finalizer. A destructive move is required
+      e.add pirMat
+      e.add pirDestructiveMove
+    elif forceTemp:
+      e.add pirMat
+      e.add pirMove
+  of Lvalue:
+    e.add ownershipOp(e, e.high)
+  of Literal:
+    if forceTemp:
+      e.add pirMat
+      e.add pirMove
+
 func wantConsumeable*(e: var seq[ProtoItem]) =
   ## Makes sure `e` is an expression that can be used in a context requiring a
-  ## certainly-consumeable value.
+  ## certainly-consumeable value (either a materialized temporary or a literal
+  ## value).
   case classify(e, e.high)
-  of Rvalue, OwnedRvalue:
+  of Rvalue:
+    if e[^1].kind != pirMatCursor:
+      e.add pirMatCursor
+    e.add pirCopy
+    e.add pirMat
+  of OwnedRvalue:
     if e[^1].kind != pirMat:
       # requires an owning temporary
       e.add pirMat
   of Lvalue:
+    e.add ownershipOp(e, e.high)
     e.add pirMat
   of Literal:
     discard "okay, can be used as is"
@@ -351,13 +448,14 @@ func selectWhenBranch*(n: PNode, isNimvm: bool): PNode =
   else:       n[1][0]
 
 func handleConstExpr(result: var seq[ProtoItem], n: PNode, kind: ProtoItemKind,
-                     sink: bool) =
-  ## If eligible, translates `n` to a constant expression. To a construction of
-  ## kind `kind` otherwise.
+                     sink, lift: bool) =
+  ## If `lift` is true and the expression is eligible, translates `n` to a
+  ## constant expression; otherwise, to a construction of kind `kind`.
   ##
   ## Only fully constant, non-empty aggregate or set constructions are
   ## treated as constant expressions.
-  if not sink and n.len > ord(n.kind == nkObjConstr) and isDeepConstExpr(n):
+  if lift and n.len > ord(n.kind == nkObjConstr) and
+     isDeepConstExpr(n):
     result.add ProtoItem(orig: n, typ: n.typ, kind: pirConstExpr)
   elif kind == pirSetConstr:
     result.add ProtoItem(orig: n, typ: n.typ, kind: kind)
@@ -671,24 +769,24 @@ proc exprToPmir(c: TranslateCtx, result: var seq[ProtoItem], n: PNode, sink: boo
 
   of nkBracket:
     # if the construction is of seq type, then it's a constant seq value,
-    # which we prefer to lift into a constant (again)
-    let consume =
-      n.typ.skipTypes(IrrelevantTypes).kind != tySequence and sink
-    handleConstExpr(result, n, pirArrayConstr, consume)
+    # which we prefer to lift into a constant (again), even in sink contexts
+    let lift =
+      n.typ.skipTypes(IrrelevantTypes).kind == tySequence or not(sink)
+    handleConstExpr(result, n, pirArrayConstr, sink, lift)
   of nkCurly:
-    # never treat set constructions as appearing in a sink context, so that
-    # they're always turned into constants, if possible
-    handleConstExpr(result, n, pirSetConstr, false)
+    # always attempt to turn set constructions into constants, regardless of
+    # whether they're used in a sink context
+    handleConstExpr(result, n, pirSetConstr, false, true)
   of nkObjConstr:
     if n.typ.skipTypes(IrrelevantTypes).kind == tyRef:
       # ref constructions are never constant
       result.add n, pirRefConstr
     else:
-      handleConstExpr(result, n, pirObjConstr, sink)
+      handleConstExpr(result, n, pirObjConstr, sink, not sink)
   of nkTupleConstr:
-    handleConstExpr(result, n, pirTupleConstr, sink)
+    handleConstExpr(result, n, pirTupleConstr, sink, not sink)
   of nkClosure:
-    handleConstExpr(result, n, pirClosureConstr, sink)
+    handleConstExpr(result, n, pirClosureConstr, sink, not sink)
 
   of nkWhenStmt:
     # a ``when nimvm`` expression
diff --git a/compiler/mir/utils.nim b/compiler/mir/utils.nim
index a2fcb55ab79..4bbf962cc2f 100644
--- a/compiler/mir/utils.nim
+++ b/compiler/mir/utils.nim
@@ -332,6 +332,15 @@ proc exprToStr(nodes: MirTree, i: var int, result: var string, env: EnvPtr) =
                    mnkMul: " * ", mnkDiv: " div ", mnkModI: " mod "]
       result.add Map[kind]
       valueToStr() # second operand
+  of mnkCopy:
+    tree "copy ":
+      valueToStr()
+  of mnkMove:
+    tree "move ":
+      valueToStr()
+  of mnkSink:
+    tree "sink ":
+      valueToStr()
   else:
     # TODO: make this branch exhaustive
     result.add "<error: " & $nodes[i].kind & ">"
@@ -413,12 +422,6 @@ proc stmtToStr(nodes: MirTree, i: var int, indent: int, result: var string,
       result.add " := "
       exprToStr()
     result.add "\n"
-  of mnkFastAsgn:
-    tree "":
-      valueToStr()
-      result.add " =fast "
-      exprToStr()
-    result.add "\n"
   of mnkStmtList:
     renderList(indent)
   of mnkTry:
diff --git a/compiler/sem/injectdestructors.nim b/compiler/sem/injectdestructors.nim
index 049d340db1d..fb8471c3f07 100644
--- a/compiler/sem/injectdestructors.nim
+++ b/compiler/sem/injectdestructors.nim
@@ -28,20 +28,19 @@
 ##          Except for thread-local variables, the others are destroyed at the
 ##          end of the program.
 ##
-## ``solveOwnership`` then computes for all lvalue expression appearing in
-## consume (e.g., argument to ``sink`` parameter) or sink contexts (source
-## lvalue in an assignment).
+## ``collapseSink`` then computes, for each lvalue expression appearing as
+## source operand to a sink assignment, whether it's the last use of the
+## value currently stored in the location identified by the lvalue. All sinks
+## where this is the case are remembered, and their corresponding data-flow
+## operation is turned from a 'use' into a 'consume'.
 ##
-## Using the now resolved ownership status of all expressions, the next
-## analysis step computes which locations need to be destroyed via a destructor
-## call (see ``computeDestructors``).
+## With all sink assignments either collapsed into copy or move assignments,
+## the next analysis step computes which locations need to be destroyed via a
+## destructor call (see ``computeDestructors``).
 ##
 ## As the last step, the assignment rewriting and destructor injection is
 ## performed, using the previously gathered data.
 ##
-## For the assignment rewriting, if the source operand of an assignment is
-## owned, a move is used instead of a copy.
-##
 ## Ownership analysis
 ## ==================
 ##
@@ -339,13 +338,6 @@ func computeOwnership(tree: MirTree, cfg: DataFlowGraph, entities: EntityDict,
   ## Computes for `lval` whether it can be moved from (i.e., ownership of the
   ## value transferred) at the program position `start`.
   case tree[lval.root].kind
-  of mnkDeref, mnkDerefView, mnkConst:
-    # * derefs reaching here means that they couldn't be resolved
-    # * handles to constant locations are never owning
-    false
-  of mnkLiteral:
-    # literals can be moved (although not destructively)
-    true
   of mnkLocal, mnkParam, mnkGlobal, mnkTemp:
     # only entities that are relevant for destructor injection have an entry in
     # `entities`. Those that don't also can't be consumed (because we either
@@ -364,19 +356,34 @@ func computeOwnership(tree: MirTree, cfg: DataFlowGraph, entities: EntityDict,
   else:
     unreachable()
 
-func solveOwnership(tree: MirTree, cfg: DataFlowGraph,
-                    entities: EntityDict): Values =
-  ## Computes for all lvalues used in consume context whether they're owning
-  ## or not. Returns a ``Values`` instance with the results.
-  # search for 'consume' instructions and compute for their operands whether
-  # it's a handle that owns the location's value
+func collapseSink(tree: MirTree, cfg: var DataFlowGraph,
+                  entities: EntityDict): Values =
+  ## Computes for every ``mnkSink`` node what operation (copy or move) it has
+  ## to collapse to, returning the result(s) as a ``Values`` instance.
+  ##
+  ## In addition, the DFG instructions in `cfg` for sinks-turned-into-moves
+  ## are updated to ``opConsume`` instructions.
+  var update: seq[InstrPos]
+    ## tracks the DFG instructions that need to be updated
+
+  # search for all 'use' instructions representing sinks, and compute whether
+  # they have to be turned into a move or copy
   for i, op, opr in cfg.instructions:
-    if op == opConsume and hasDestructor(tree[opr].typ) and
-       computeOwnership(tree, cfg, entities,
-                        computePath(tree, NodePosition opr), i + 1):
-      result.markOwned(opr)
-    else:
-      discard "nothing to do"
+    if op == opUse and tree[tree.parent(NodePosition opr)].kind == mnkSink:
+      # it's the DFG instruction for a sink
+      if hasDestructor(tree[opr].typ) and
+         computeOwnership(tree, cfg, entities,
+                          computePath(tree, NodePosition opr), i + 1):
+        update.add i
+        result.markOwned(opr)
+
+      # for the moment, sinks are always turned into copies for values without
+      # custom destroy/copy/sink behaviour
+
+  # change all 'use' instructions corresponding to sinks to 'consume'
+  # instructions. This is more efficient than changing the node kinds and then
+  # recomputing the graph
+  cfg.change(update, opConsume)
 
 type DestructionMode = enum
   demNone    ## location doesn't need to be destroyed because it contains no
@@ -386,11 +393,11 @@ type DestructionMode = enum
   demFinally ## the location contains a value when the scope is exited via
              ## unstructured control-flow
 
-func requiresDestruction(tree: MirTree, cfg: DataFlowGraph, values: Values,
+func requiresDestruction(tree: MirTree, cfg: DataFlowGraph,
                          span: Subgraph, def: NodePosition, entity: MirNode
                         ): DestructionMode =
   template computeAlive(loc, op: untyped): untyped =
-    computeAlive(tree, cfg, values, span, loc, op)
+    computeAlive(tree, cfg, span, loc, op)
 
   let r =
     case entity.kind
@@ -413,7 +420,7 @@ func requiresDestruction(tree: MirTree, cfg: DataFlowGraph, values: Values,
     elif r.alive: demNormal
     else:         demNone
 
-func computeDestructors(tree: MirTree, cfg: DataFlowGraph, values: Values,
+func computeDestructors(tree: MirTree, cfg: DataFlowGraph,
                         entities: EntityDict): seq[DestroyEntry] =
   ## Computes and collects which locations present in `entities` need to be
   ## destroyed at the exit of their enclosing scope in order to prevent the
@@ -441,7 +448,7 @@ func computeDestructors(tree: MirTree, cfg: DataFlowGraph, values: Values,
       #       defer destruction of the global to the end of the program
       discard
 
-    case requiresDestruction(tree, cfg, values, info.scope, def, entity)
+    case requiresDestruction(tree, cfg, info.scope, def, entity)
     of demNormal:
       result.add (scopeStart, def, false)
     of demFinally:
@@ -458,7 +465,7 @@ func computeDestructors(tree: MirTree, cfg: DataFlowGraph, values: Values,
 
 # --------- analysis routines --------------
 
-func isAlive(tree: MirTree, cfg: DataFlowGraph, v: Values,
+func isAlive(tree: MirTree, cfg: DataFlowGraph,
              entities: EntityDict, val: Path, at: InstrPos): bool =
   ## Computes if `val` refers to a location that contains a value when
   ## `at` in the DFG is reached.
@@ -482,7 +489,7 @@ func isAlive(tree: MirTree, cfg: DataFlowGraph, v: Values,
     if at <= scope.a:
       false # the location cannot be alive
     else:
-      isAlive(tree, cfg, v, scope, val, at)
+      isAlive(tree, cfg, scope, val, at)
   else:
     # something that we can't analyse (e.g. a dereferenced pointer). We have
     # to be conservative and assume that the location the lvalue names already
@@ -546,23 +553,14 @@ func needsReset(tree: MirTree, cfg: DataFlowGraph, ar: AnalysisResults,
     # the presence of the value is observed -> a reset is required
     result = true
 
-func isMoveable(tree: MirTree, v: Values, n: NodePosition): bool =
-  ## Returns whether the value of the expression `n` can be moved.
+func isMove(tree: MirTree, v: Values, n: NodePosition): bool =
+  ## Returns whether the assignment modifier at `n` acts as a move. A sink
+  ## modifier is collapsed into a move if its operand is owned, else a copy.
   case tree[n].kind:
-  of LvalueExprKinds - {mnkDeref, mnkDerefView}:
-    v.isOwned(OpValue n)
-  of mnkDeref, mnkDerefView:
-    false
-  of mnkLiteral, mnkProc, mnkType:
-    true
-  of mnkConv, mnkStdConv, mnkCast, mnkAddr, mnkView, mnkToSlice, UnaryOps,
-     BinaryOps:
-    # the result of these operations is not an owned value
-    false
-  of mnkCall, mnkCheckedCall, mnkObjConstr, mnkConstr:
-    true
-  of AllNodeKinds - ExprKinds:
-    unreachable(tree[n].kind)
+  of mnkCopy: false
+  of mnkMove: true
+  of mnkSink: v.isOwned(tree.operand(n))
+  else:       unreachable(tree[n].kind)
 
 # ------- code generation routines --------
 
@@ -605,13 +603,13 @@ proc genInjectedSink(bu: var MirBuilder, graph: ModuleGraph, env: var MirEnv,
   else:
     # without a sink hook, a ``=destroy`` + blit-copy is used
     genDestroy(bu, graph, env, dest)
-    bu.asgn dest, source
+    bu.asgnMove dest, source
 
 proc genSinkFromTemporary(bu: var MirBuilder, graph: ModuleGraph,
                           env: var MirEnv, dest, source: Value) =
   ## Similar to ``genInjectedSink`` but generates code for destructively
   ## moving the source operand into a temporary first.
-  let tmp = bu.materialize(source)
+  let tmp = bu.materializeMove(source)
   genWasMoved(bu, graph, source)
   genInjectedSink(bu, graph, env, dest, tmp)
 
@@ -650,12 +648,13 @@ func destructiveMoveOperands(bu: var MirBuilder, tree: MirTree,
 proc expandAsgn(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
                 env: var MirEnv, stmt: NodePosition, pos: InstrPos,
                 c: var Changeset) =
-  ## Expands an assignment into either a copy, move, or destructive move.
-  ## `stmt` is the assignment statement node and `pos` is the 'def' data-flow
-  ## instruction corresponding to it.
+  ## Rewrites the assignment at `stmt` into either a ``=copy`` hook call,
+  ## ``=sink`` hook call, move, or destructive move.
+  ## `pos` is the 'def' data-flow instruction corresponding to the assignment.
   let
     dest       = tree.child(stmt, 0)
-    source     = tree.child(stmt, 1)
+    operator   = tree.child(stmt, 1)
+    source     = tree.child(operator, 0)
     sourcePath = computePath(tree, source)
     destPath   = computePath(tree, dest)
     relation   = compare(tree, sourcePath, destPath)
@@ -663,77 +662,60 @@ proc expandAsgn(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
   if relation.isSame:
     # a self-assignment -> elide
     c.remove(tree, stmt)
-  elif isMoveable(tree, ar.v[], source):
+  elif isMove(tree, ar.v[], operator):
     # a move is possible -> sink
     if true:
-      let fromLvalue = isNamed(tree, OpValue source)
+      template needsReset(): bool =
+        # only a ``sink`` modifier allows for the injection of resets
+        (tree[operator].kind == mnkSink and
+         needsReset(tree, ctx.cfg, ar, sourcePath, pos))
 
       if tree[stmt].kind != mnkInit and
-         isAlive(tree, ctx.cfg, ar.v[], ar.entities[], destPath, pos):
+         isAlive(tree, ctx.cfg, ar.entities[], destPath, pos):
         # there already exists a value in the destination location -> use the
         # sink operation
-        if fromLvalue:
+        if true:
           c.replaceMulti(tree, stmt, bu):
             let a = bu.bindMut(tree, dest)
             if isAPartOfB(relation) != no:
-              # this is a potential part-to-whole assignment, e.g.: ``x = x.y``.
-              # We need to move the source value into a temporary first, as
-              # ``=sink`` would otherwise destroy ``x`` first, also destroying
-              # ``x.y`` in the process
-              let b = bu.bindImmutable(tree, source)
+              # this is a potential part-to-whole assignment, e.g.:
+              # ``x = move x.y``. We need to move the source value into a
+              # temporary first, as ``=sink`` would otherwise destroy ``x``
+              # first, also destroying ``x.y`` in the process
+              let b = bu.bindMut(tree, source)
               genSinkFromTemporary(bu, ctx.graph, env, a, b)
-            elif needsReset(tree, ctx.cfg, ar, sourcePath, pos):
+            elif needsReset():
               # a sink from a location that needs to be reset after the move
               # (i.e., a destructive move)
               let (b, clear) = bu.destructiveMoveOperands(tree, source)
               genInjectedSink(bu, ctx.graph, env, a, b)
               genWasMoved(bu, ctx.graph, clear)
             else:
-              # a sink from a location that doesn't need to be cleared after
+              # a sink from a location that doesn't need to be reset afterwards
               let b = bu.bindImmutable(tree, source)
               genInjectedSink(bu, ctx.graph, env, a, b)
 
-        else:
-          # this is a bit hack-y, but in order to support changes within the
-          # second operand's tree, the assignment is not replaced as a whole
-          # but rather turned into a def statement. ``a.x = f(arg 1)`` becomes:
-          #   def _1 = f(arg 1)
-          #   bind_mut _2 = a.x
-          #   =sink(name _2, arg _1)
-          # XXX: this is going to become cleaner once `mirgen` handles most of
-          #      the sink-related transformations
-          var tmp: Value
-          c.changeTree(tree, stmt, MirNode(kind: mnkDef))
-          c.replaceMulti(tree, dest, bu):
-            # replace the destination operand with the name of a newly
-            # allocated temporary
-            tmp = bu.allocTemp(tree[source].typ)
-            bu.use tmp
-
-          c.insert(tree, tree.sibling(stmt), stmt, bu):
-            # the value is only accessible through the source expression, a
-            # destructive move is not required
-            let a = bu.bindMut(tree, dest)
-            genInjectedSink(bu, ctx.graph, env, a, tmp)
-
-      else:
+      elif needsReset():
         # the destination location doesn't contain a value yet (which would
         # need to be destroyed first otherwise) -> a bitwise copy can be used
-        if fromLvalue and needsReset(tree, ctx.cfg, ar, sourcePath, pos):
-          # we don't need to check for part-to-whole assignments here, because
-          # if the destination location has no value, so don't locations derived
-          # from it, in which case it doesn't matter when the reset happens
-          # XXX: the reset could be omitted for part-to-whole assignments
-          c.replaceMulti(tree, stmt, bu):
-            let
-              a          = bu.bindMut(tree, dest)
-              (b, clear) = bu.destructiveMoveOperands(tree, source)
-            bu.asgn a, b
-            genWasMoved(bu, ctx.graph, clear)
-
-        else:
-          # no hook call nor destructive move is required
-          discard
+        # we don't need to check for part-to-whole assignments here: if the
+        # destination location has no value, neither do locations derived
+        # from it, in which case it doesn't matter when the reset happens
+        # XXX: the reset could be omitted for part-to-whole assignments
+        c.replaceMulti(tree, stmt, bu):
+          let
+            a          = bu.bindMut(tree, dest)
+            (b, clear) = bu.destructiveMoveOperands(tree, source)
+          bu.asgnMove a, b
+          genWasMoved(bu, ctx.graph, clear)
+
+      elif tree[operator].kind == mnkSink:
+        # no reset and/or hook call needs to be injected, simply replace the
+        # sink modifier with a move
+        c.changeTree(tree, operator): MirNode(kind: mnkMove)
+      else:
+        # no hook call nor destructive move is required
+        discard "nothing to do"
 
   else:
     # a move is not possible -> copy
@@ -753,18 +735,18 @@ proc expandDef(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
                c: var Changeset) =
   ## Depending on whether the source can be moved out of, either rewrites the
   ## 'def' at `at` into a call to the ``=copy`` hook call or into a
-  ## destructive move. If the source can be moved out of non-destructively,
-  ## nothing is changed. `pos` is the data-flow instruction
+  ## destructive or non-destructive move. `pos` is the data-flow instruction.
   let
-    dest   = tree.child(at, 0)
-    source = tree.child(at, 1)
-  case isMoveable(tree, ar.v[], source)
+    dest     = tree.child(at, 0)
+    operator = tree.child(at, 1)
+    source   = tree.child(operator, 0)
+  case isMove(tree, ar.v[], operator)
   of false:
-    # a copy is required. Transform ``def x = a.b`` into:
+    # a copy is required. Transform ``def x = copy a.b`` into:
     #   def x
     #   bind _1 = a.b
     #   =copy(name x, arg _1)
-    c.replace(tree, source): MirNode(kind: mnkNone)
+    c.replace(tree, operator): MirNode(kind: mnkNone)
     c.insert(tree, tree.sibling(at), source, bu):
       let
         a = bu.bindMut(tree, dest)
@@ -773,20 +755,25 @@ proc expandDef(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
       # etc.), no cycle can possibly be introduced
       genCopy(bu, ctx.graph, env, a, b, false)
   of true:
-    if isNamed(tree, OpValue source) and
-       needsReset(tree, ctx.cfg, ar, computePath(tree, source), pos):
+    assert tree[operator].kind == mnkSink
+    if needsReset(tree, ctx.cfg, ar, computePath(tree, source), pos):
       # the value can be moved, but the location needs to be reset. Transform
-      # ``def x = a.b`` into:
+      # ``def x = sink a.b`` into:
       #   bind_mut _1 = a.b
-      #   def x = _1
+      #   def x = move _1
       #   wasMoved(name x)
       var tmp, clear: Value
       c.insert(tree, at, source, bu):
         (tmp, clear) = bu.destructiveMoveOperands(tree, source)
-      c.replaceMulti(tree, source, bu):
-        bu.use tmp
+      c.replaceMulti(tree, operator, bu):
+        bu.move tmp
       c.insert(tree, tree.sibling(at), source, bu):
         genWasMoved(bu, ctx.graph, clear)
+    else:
+      # turn into a ``Move`` operation
+      c.changeTree(tree, operator):
+        MirNode(kind: mnkMove, typ: tree[operator].typ)
+
 
 proc consumeArg(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
                 expr: NodePosition, src: OpValue, pos: InstrPos,
@@ -812,7 +799,7 @@ proc consumeArg(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
       var tmp: Value
       c.insert(tree, stmt, NodePosition src, bu):
         let v = bu.bindMut(tree, NodePosition src)
-        tmp = bu.materialize(v)
+        tmp = bu.materializeMove(v)
         genWasMoved(bu, ctx.graph, v)
 
       # replace the argument with the injected temporary:
@@ -876,8 +863,7 @@ proc rewriteAssignments(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
                         env: var MirEnv, diags: var seq[LocalDiag],
                         c: var Changeset) =
   ## Rewrites assignments to locations into calls to either the ``=copy``
-  ## or ``=sink`` hook (see ``expandAsgn`` for more details), using the
-  ## previously computed ownership information to decide.
+  ## or ``=sink`` hook (see ``expandAsgn`` for more details).
   ##
   ## Also injects the necessary location reset logic for lvalues passed to
   ## 'consume' argument sinks.
@@ -893,7 +879,7 @@ proc rewriteAssignments(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
         consumeArg(tree, ctx, ar, tree.parent(parent), val, i, c)
       of mnkRaise:
         consumeArg(tree, ctx, ar, NodePosition val, val, i, c)
-      of mnkAsgn, mnkInit, mnkDef, mnkDefUnpack:
+      of mnkMove, mnkSink:
         # assignments are handled separately
         discard
       else:
@@ -906,9 +892,10 @@ proc rewriteAssignments(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
       case tree[stmt].kind
       of mnkDef, mnkDefUnpack:
         let src = tree.child(stmt, 1)
-        # ignore definitions with no initializer
-        if tree[src].kind != mnkNone:
-          if not isMoveable(tree, ar.v[], src):
+        # only rewrite definitions with modifiers. The ``move`` modifier
+        # is ignored since there's nothing to be rewritten for it
+        if tree[src].kind in ModifierNodes - {mnkMove}:
+          if not isMove(tree, ar.v[], src):
             checkCopy(ctx.graph, tree, src, diags)
             # emit a warning for copies-to-sink
             if isUsedForSink(tree, stmt):
@@ -917,9 +904,11 @@ proc rewriteAssignments(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
           expandDef(tree, ctx, ar, env, stmt, i, c)
       of mnkAsgn, mnkInit:
         let src = tree.child(stmt, 1)
-        if not isMoveable(tree, ar.v[], src):
-          checkCopy(ctx.graph, tree, src, diags)
-        expandAsgn(tree, ctx, ar, env, stmt, i, c)
+        # only rewrite assignments with modifiers
+        if tree[src].kind in ModifierNodes:
+          if not isMove(tree, ar.v[], src):
+            checkCopy(ctx.graph, tree, src, diags)
+          expandAsgn(tree, ctx, ar, env, stmt, i, c)
       else:
         # e.g., output arguments to procedures
         discard "ignore"
@@ -1164,13 +1153,13 @@ proc injectDestructorCalls*(g: ModuleGraph, idgen: IdGenerator,
     var
       changes = initChangeset(body.code)
       diags: seq[LocalDiag]
+      actx = AnalyseCtx(graph: g, cfg: computeDfg(body.code))
 
     let
-      actx = AnalyseCtx(graph: g, cfg: computeDfg(body.code))
       entities = initEntityDict(body.code, actx.cfg)
-      values = solveOwnership(body.code, actx.cfg, entities)
+      values = collapseSink(body.code, actx.cfg, entities)
 
-    let destructors = computeDestructors(body.code, actx.cfg, values, entities)
+    let destructors = computeDestructors(body.code, actx.cfg, entities)
 
     rewriteAssignments(
       body.code, actx,
diff --git a/compiler/sem/mirexec.nim b/compiler/sem/mirexec.nim
index 02309eda105..c9b51c3fbeb 100644
--- a/compiler/sem/mirexec.nim
+++ b/compiler/sem/mirexec.nim
@@ -48,11 +48,7 @@ type
     opInvalidate  ## all information gathered about a value becomes invalid
     opMutate      ## mutation of a value. Can be viewed as a combined 'use' +
                   ## 'def'
-    opConsume     ## a value is consumed. Counts as either a 'use' or a 'use'
-                  ## + 'kill', depending on the context
-    # future direction: change ``opConsume`` to always mean 'use' + 'kill'.
-    # The callsite should be fully responsible for handling sinks, rather
-    # than this being partially pushed into the DFG
+    opConsume     ## a value is consumed. This is effectively a 'use' + 'kill'
 
     opMutateGlobal ## an unspecified global is mutated
 
@@ -233,8 +229,7 @@ func emitForArgs(env: var ClosureEnv, tree: MirTree, at, source: NodePosition) =
     else:
       emitLvalueOp(env, opUse, tree, at, OpValue it)
 
-func emitForExpr(env: var ClosureEnv, tree: MirTree, at, source: NodePosition,
-                consume: bool) =
+func emitForExpr(env: var ClosureEnv, tree: MirTree, at, source: NodePosition) =
   ## Emits the data- and control-flow instructions corresponding to the
   ## expression at `source`.
   template op(o: Opcode, v: OpValue) =
@@ -273,17 +268,20 @@ func emitForExpr(env: var ClosureEnv, tree: MirTree, at, source: NodePosition,
       if tree[source].typ.kind == tyVar: opMutate
       else:                              opUse
     emitLvalueOp(env, opc, tree, at, tree.operand(source, 0))
+  of mnkCopy, mnkSink:
+    # until it's collapsed, a sink is conservatively treated as only a
+    # usage (not a consumption)
+    emitLvalueOp(env, opUse, tree, at, tree.operand(source))
+  of mnkMove:
+    emitLvalueOp(env, opConsume, tree, at, tree.operand(source))
   of UnaryOps:
     emitLvalueOp(env, opUse, tree, at, tree.operand(source, 0))
   of BinaryOps:
     emitLvalueOp(env, opUse, tree, at, tree.operand(source, 0))
     emitLvalueOp(env, opUse, tree, at, tree.operand(source, 1))
   of LvalueExprKinds:
-    # a read or consume is performed on an lvalue
-    let opc =
-      if consume: opConsume
-      else:       opUse
-    emitLvalueOp(env, opc, tree, at, OpValue source)
+    # raw usage of an lvalue
+    emitLvalueOp(env, opUse, tree, at, OpValue source)
   of mnkNone, mnkLiteral, mnkProc:
     discard "okay, ignore"
   of AllNodeKinds - ExprKinds - {mnkNone} + {mnkType}:
@@ -316,12 +314,12 @@ func emitForExpr(env: var ClosureEnv, tree: MirTree, at, source: NodePosition,
   else:
     discard
 
-func emitForDef(env: var ClosureEnv, tree: MirTree, n: NodePosition, consume: bool) =
+func emitForDef(env: var ClosureEnv, tree: MirTree, n: NodePosition) =
   let
     dest   = tree.operand(n, 0)
     source = tree.operand(n, 1)
   emitForValue(env, tree, n, dest)
-  emitForExpr(env, tree, n, NodePosition source, consume)
+  emitForExpr(env, tree, n, NodePosition source)
   # defs with an empty initializer have no data- or control-flow properties.
   # Parameter definitions are an exception.
   if tree[dest].kind == mnkParam or tree[source].kind != mnkNone:
@@ -548,10 +546,8 @@ func computeDfg*(tree: MirTree): DataFlowGraph =
         # no control-flow or other effects
         discard
 
-    of mnkAsgn, mnkInit:
-      emitForDef(env, tree, i, true)
-    of mnkFastAsgn:
-      emitForDef(env, tree, i, false)
+    of mnkDef, mnkDefCursor, mnkDefUnpack, mnkAsgn, mnkInit:
+      emitForDef(env, tree, i)
     of mnkSwitch:
       # the switch statement invalidates the destination rather than
       # reassigning it (i.e., ``opDef``)
@@ -559,16 +555,12 @@ func computeDfg*(tree: MirTree): DataFlowGraph =
         dest   = tree.operand(i, 0)
         source = tree.operand(i, 1)
       emitForValue(env, tree, i, dest)
-      emitForExpr(env, tree, i, NodePosition source, false)
+      emitForExpr(env, tree, i, NodePosition source)
       dfaOp env, opInvalidate, i, dest
-    of mnkDef, mnkDefUnpack:
-      emitForDef(env, tree, i, true)
-    of mnkDefCursor:
-      emitForDef(env, tree, i, false)
     of mnkBindMut, mnkBind:
       emitForValue(env, tree, i, tree.operand(i, 1))
     of mnkVoid:
-      emitForExpr(env, tree, i, NodePosition tree.operand(i), false)
+      emitForExpr(env, tree, i, NodePosition tree.operand(i))
     of mnkEmit, mnkAsm:
       emitForArgs(env, tree, i, i)
 
@@ -606,6 +598,14 @@ func find*(dfg: DataFlowGraph, n: NodePosition): InstrPos =
   ## attached-to node position) operation is returned.
   lowerBound(dfg, n)
 
+func change*(dfg: var DataFlowGraph, instrs: openArray[InstrPos],
+             to: Opcode) =
+  ## Changes all data-flow instructions identified by `instrs` to use the
+  ## `to` opcode.
+  for it in instrs.items:
+    assert dfg.instructions[it].op in DataFlowOps
+    dfg.instructions[it].op = to
+
 iterator instructions*(dfg: DataFlowGraph): (InstrPos, Opcode, OpValue) =
   ## Returns all data-flow operations in order of appearance together with
   ## their position.
diff --git a/doc/mir.rst b/doc/mir.rst
index c090f877aca..1a6c0514193 100644
--- a/doc/mir.rst
+++ b/doc/mir.rst
@@ -110,7 +110,14 @@ Semantics
                                          # at the upper bound (inclusive, third
                                          # parameter)
 
-  FULL_VALUE = RVALUE | VALUE
+  ASGN_SRC = RVALUE
+           | VALUE
+           | Copy VALUE
+           | Move LVALUE
+           | Sink LVALUE
+
+  SHALLOW_SRC = RVALUE
+              | VALUE
 
   STATEMENT =
             | StmtList STATEMENT ...    # a list of statements
@@ -118,10 +125,10 @@ Semantics
                                         # delimits the lifetime of all
                                         # definitions within
             | Def NAME none             # definition
-            | Def NAME FULL_VALUE       # definition + initial value assignment
+            | Def NAME ASGN_SRC         # definition + initial value assignment
             | DefCursor NAME            # definition of non-owning location
-            | DefCursor NAME FULL_VALUE # same as above, but with initial
-                                        # assignment
+            | DefCursor NAME SHALLOW_SRC# definition of non-owning location +
+                                        # initial (shallow copy) assignment
             | Bind <Alias> LVALUE       # bind the lvalue to the given alias.
                                         # May be used for mutation, but must
                                         # not be used as an assignment's
@@ -136,13 +143,11 @@ Semantics
             | Void CALL_EXPR            # represents a void call. The called
                                         # procedure or magic *must* have a
                                         # `void`` return type
-            | Asgn LVALUE FULL_VALUE    # normal assignment of the right value
+            | Asgn LVALUE ASGN_SRC      # normal assignment of the right value
                                         # to the left location
-            | Init LVALUE FULL_VALUE    # initial assignment (the destination
+            | Init LVALUE ASGN_SRC      # initial assignment (the destination
                                         # is empty)
-            | FastAsgn LVALUE FULL_VALUE# fast assignment (cannot be rewritten
-                                        # into a full copy)
-            | Switch LVALUE FULL_VALUE  # changes the active branch of a
+            | Switch LVALUE ASGN_SRC    # changes the active branch of a
                                         # variant. Unclear semantics.
             | If VALUE STATEMENT        # if the value evaluates to true
                                         # execute the statement
diff --git a/tests/arc/topt_cursor.nim b/tests/arc/topt_cursor.nim
index 76f2b9f0ddd..2085b3c17d9 100644
--- a/tests/arc/topt_cursor.nim
+++ b/tests/arc/topt_cursor.nim
@@ -9,10 +9,10 @@ scope:
     block L0:
       if cond:
         scope:
-          x =fast <D1>
+          x = <D1>
           break L0
       scope:
-        x =fast <D2>
+        x = <D2>
     def_cursor _0: (string, int) = x
     def _1: string = $(arg _0) (raises)
     echo(arg type(array[0..0, string]), arg _1) (raises)
@@ -35,8 +35,8 @@ scope:
               while true:
                 scope:
                   def_cursor _1: File = f
-                  def_cursor _2: bool = readLine(arg _1, name res) (raises)
-                  def_cursor _3: bool = not(arg _2)
+                  def _2: bool = readLine(arg _1, name res) (raises)
+                  def _3: bool = not(arg _2)
                   if _3:
                     scope:
                       break L0
diff --git a/tests/arc/topt_no_cursor.nim b/tests/arc/topt_no_cursor.nim
index 9499d20a989..3546a896f86 100644
--- a/tests/arc/topt_no_cursor.nim
+++ b/tests/arc/topt_no_cursor.nim
@@ -14,16 +14,17 @@ doing shady stuff...
 
 scope:
   def splat: tuple[dir: string, name: string, ext: string] = splitFile(arg path) (raises)
-  bind_mut _3: string = splat.0
-  def _0: string = _3
-  wasMoved(name _3)
-  bind_mut _4: string = splat.1
-  def _1: string = _4
+  bind_mut _4: string = splat.0
+  def _0: string = move _4
   wasMoved(name _4)
-  bind_mut _5: string = splat.2
-  def _2: string = _5
+  bind_mut _5: string = splat.1
+  def _1: string = move _5
   wasMoved(name _5)
-  result = construct (consume _0, consume _1, consume _2)
+  bind_mut _6: string = splat.2
+  def _2: string = move _6
+  wasMoved(name _6)
+  def _3: Target = construct (consume _0, consume _1, consume _2)
+  result = move _3
   =destroy(name splat)
 -- end of expandArc ------------------------
 --expandArc: delete
@@ -55,15 +56,16 @@ scope:
   def lresult: seq[int] = arrToSeq(consume _0)
   def lvalue: seq[int]
   def lnext: string
-  def _1: seq[int] = lresult
+  def _1: seq[int] = move lresult
   def _: (seq[int], string) = construct (consume _1, consume ";")
-  bind_mut _2: seq[int] = _.0
-  lvalue = _2
-  wasMoved(name _2)
-  bind_mut _3: string = _.1
-  lnext = _3
+  bind_mut _3: seq[int] = _.0
+  lvalue = move _3
   wasMoved(name _3)
-  result.value = move(name lvalue)
+  bind_mut _4: string = _.1
+  lnext = move _4
+  wasMoved(name _4)
+  def _2: seq[int] = move(name lvalue)
+  result.value = move _2
   =destroy(name _)
   =destroy(name lnext)
   =destroy(name lvalue)
@@ -102,8 +104,8 @@ scope:
           while true:
             scope:
               def_cursor _1: int = i
-              def_cursor _2: bool = ltI(arg _1, arg L)
-              def_cursor _3: bool = not(arg _2)
+              def _2: bool = ltI(arg _1, arg L)
+              def _3: bool = not(arg _2)
               if _3:
                 scope:
                   break L0
@@ -115,7 +117,7 @@ scope:
                     def_cursor _5: string = line[]
                     def splitted: seq[string] = split(arg _5, arg " ", arg -1) (raises)
                     def_cursor _6: string = splitted[0]
-                    def_cursor _7: bool = eqStr(arg _6, arg "opt")
+                    def _7: bool = eqStr(arg _6, arg "opt")
                     if _7:
                       scope:
                         def _10: string = splitted[1]
@@ -148,8 +150,8 @@ scope:
           while true:
             scope:
               def_cursor _2: int = i
-              def_cursor _3: bool = ltI(arg _2, arg L)
-              def_cursor _4: bool = not(arg _3)
+              def _3: bool = ltI(arg _2, arg L)
+              def _4: bool = not(arg _3)
               if _4:
                 scope:
                   break L0
@@ -171,15 +173,15 @@ scope:
   try:
     def x: sink string
     def_cursor _0: sink string = x
-    def_cursor _1: int = lengthStr(arg _0)
-    def_cursor _2: bool = eqI(arg _1, arg 2)
+    def _1: int = lengthStr(arg _0)
+    def _2: bool = eqI(arg _1, arg 2)
     if _2:
       scope:
-        result = x
+        result = move x
         wasMoved(name x)
         return
     def_cursor _3: sink string = x
-    def_cursor _4: int = lengthStr(arg _3)
+    def _4: int = lengthStr(arg _3)
     def _5: string = $(arg _4) (raises)
     echo(arg type(array[0..0, string]), arg _5) (raises)
   finally:
@@ -196,12 +198,12 @@ scope:
     def _1: tuple[dir: string, front: string]
     block L0:
       def_cursor _2: string = this[].value
-      def_cursor _3: bool = dirExists(arg _2) (raises)
+      def _3: bool = dirExists(arg _2) (raises)
       if _3:
         scope:
           def _4: string
-          def _14: string = this[].value
-          =copy(name _4, arg _14)
+          def _16: string = this[].value
+          =copy(name _4, arg _16)
           _1 := construct (consume _4, consume "")
           break L0
       scope:
@@ -209,33 +211,33 @@ scope:
           def_cursor _5: string = this[].value
           def _6: string = parentDir(arg _5) (raises)
           def _7: string
-          def _15: string = this[].value
-          =copy(name _7, arg _15)
+          def _17: string = this[].value
+          =copy(name _7, arg _17)
           def _8: tuple[head: string, tail: string] = splitPath(consume _7) (raises)
-          bind_mut _16: string = _8.1
-          def _9: string = _16
-          wasMoved(name _16)
+          bind_mut _18: string = _8.1
+          def _9: string = move _18
+          wasMoved(name _18)
           _1 := construct (consume _6, consume _9)
           wasMoved(name _6)
         finally:
           =destroy(name _8)
           =destroy(name _6)
-    def par: tuple[dir: string, front: string] = _1
+    def par: tuple[dir: string, front: string] = move _1
     block L1:
       def_cursor _10: string = par.0
-      def_cursor _11: bool = dirExists(arg _10) (raises)
+      def _11: bool = dirExists(arg _10) (raises)
       if _11:
         scope:
           def_cursor _12: string = par.0
           def_cursor _13: string = par.1
-          def _17: seq[string] = getSubDirs(arg _12, arg _13) (raises)
-          bind_mut _18: seq[string] = this[].matchDirs
-          =sink(name _18, arg _17)
+          def _14: seq[string] = getSubDirs(arg _12, arg _13) (raises)
+          bind_mut _19: seq[string] = this[].matchDirs
+          =sink(name _19, arg _14)
           break L1
       scope:
-        def _19: seq[string] = construct ()
+        def _15: seq[string] = construct ()
         bind_mut _20: seq[string] = this[].matchDirs
-        =sink(name _20, arg _19)
+        =sink(name _20, arg _15)
   finally:
     =destroy(name par)
 -- end of expandArc ------------------------'''
diff --git a/tests/arc/topt_refcursors.nim b/tests/arc/topt_refcursors.nim
index f9b62b5685d..20b5823ee66 100644
--- a/tests/arc/topt_refcursors.nim
+++ b/tests/arc/topt_refcursors.nim
@@ -10,9 +10,9 @@ scope:
       while true:
         scope:
           def_cursor _0: Node = it
-          def_cursor _1: bool = eqRef(arg _0, arg nil)
-          def_cursor _2: bool = not(arg _1)
-          def_cursor _3: bool = not(arg _2)
+          def _1: bool = eqRef(arg _0, arg nil)
+          def _2: bool = not(arg _1)
+          def _3: bool = not(arg _2)
           if _3:
             scope:
               break L0
@@ -21,16 +21,16 @@ scope:
             def_cursor _5: string = _4[].s
             echo(arg type(array[0..0, string]), arg _5) (raises)
             def_cursor _6: Node = it
-            it =fast _6[].ri
+            it = _6[].ri
   def_cursor jt: Node = root
   block L1:
     scope:
       while true:
         scope:
           def_cursor _7: Node = jt
-          def_cursor _8: bool = eqRef(arg _7, arg nil)
-          def_cursor _9: bool = not(arg _8)
-          def_cursor _10: bool = not(arg _9)
+          def _8: bool = eqRef(arg _7, arg nil)
+          def _9: bool = not(arg _8)
+          def _10: bool = not(arg _9)
           if _10:
             scope:
               break L1
@@ -40,7 +40,7 @@ scope:
             def_cursor _12: Node = jt
             def_cursor _13: string = _12[].s
             echo(arg type(array[0..0, string]), arg _13) (raises)
-            jt =fast ri
+            jt = ri
 -- end of expandArc ------------------------'''
 """
 
diff --git a/tests/arc/topt_wasmoved_destroy_pairs.nim b/tests/arc/topt_wasmoved_destroy_pairs.nim
index c549515e9b8..6ee175c65ac 100644
--- a/tests/arc/topt_wasmoved_destroy_pairs.nim
+++ b/tests/arc/topt_wasmoved_destroy_pairs.nim
@@ -10,11 +10,11 @@ scope:
   block L0:
     if cond:
       scope:
-        def _0: seq[int] = x
+        def _0: seq[int] = move x
         add(name a, consume _0)
         break L0
     scope:
-      def _1: seq[int] = x
+      def _1: seq[int] = move x
       add(name b, consume _1)
   =destroy(name b)
   =destroy(name a)
@@ -29,21 +29,21 @@ scope:
     scope:
       def a: int = 0
       def b: int = 4
-      def i: int = a
+      def i: int = sink a
       block L0:
         scope:
           while true:
             scope:
               def_cursor _0: int = i
-              def_cursor _1: bool = ltI(arg _0, arg b)
-              def_cursor _2: bool = not(arg _1)
+              def _1: bool = ltI(arg _0, arg b)
+              def _2: bool = not(arg _1)
               if _2:
                 scope:
                   break L0
               scope:
                 scope:
                   def_cursor i: int = i
-                  def_cursor _3: bool = eqI(arg i, arg 2)
+                  def _3: bool = eqI(arg i, arg 2)
                   if _3:
                     scope:
                       return
@@ -54,12 +54,12 @@ scope:
     block L1:
       if cond:
         scope:
-          def _5: seq[int] = x
+          def _5: seq[int] = move x
           wasMoved(name x)
           add(name a, consume _5)
           break L1
       scope:
-        def _6: seq[int] = x
+        def _6: seq[int] = move x
         wasMoved(name x)
         add(name b, consume _6)
   finally:
@@ -75,11 +75,12 @@ scope:
     if cond:
       scope:
         return
-    str = boolToStr(arg cond)
-    def_cursor _0: bool = not(arg cond)
-    if _0:
+    def _0: string = boolToStr(arg cond)
+    str = move _0
+    def _1: bool = not(arg cond)
+    if _1:
       scope:
-        result = str
+        result = move str
         wasMoved(name str)
         return
   finally:
diff --git a/tests/lang_objects/destructor/tv2_cast.nim b/tests/lang_objects/destructor/tv2_cast.nim
index dbb16c26ada..e0a0f43f00a 100644
--- a/tests/lang_objects/destructor/tv2_cast.nim
+++ b/tests/lang_objects/destructor/tv2_cast.nim
@@ -9,10 +9,10 @@ scope:
   try:
     def _0: string = newString(arg 100)
     def_cursor _1: seq[byte] = cast _0
-    def_cursor _2: openArray[byte] = toOpenArray _1
+    def _2: openArray[byte] = toOpenArray _1
     def _3: seq[byte] = encode(arg _2) (raises)
+    def_cursor _4: string = cast _3
     def data: string
-    def _4: string = cast _3
     =copy(name data, arg _4)
   finally:
     =destroy(name data)
@@ -24,13 +24,13 @@ scope:
   try:
     def s: string = newString(arg 100)
     def_cursor _0: string = s
-    def_cursor _1: int = lengthStr(arg _0)
-    def_cursor _2: int = subI(arg _1, arg 1) (raises)
+    def _1: int = lengthStr(arg _0)
+    def _2: int = subI(arg _1, arg 1) (raises)
     chckBounds(arg s, arg 0, arg _2) (raises)
-    def_cursor _3: openArray[byte] = toOpenArray s, 0, _2
+    def _3: openArray[byte] = toOpenArray s, 0, _2
     def _4: seq[byte] = encode(arg _3) (raises)
+    def_cursor _5: string = cast _4
     def data: string
-    def _5: string = cast _4
     =copy(name data, arg _5)
   finally:
     =destroy(name data)
@@ -41,10 +41,10 @@ scope:
 scope:
   try:
     def s: seq[byte] = newSeq(arg 100) (raises)
-    def_cursor _0: openArray[byte] = toOpenArray s
+    def _0: openArray[byte] = toOpenArray s
     def _1: seq[byte] = encode(arg _0) (raises)
+    def_cursor _2: string = cast _1
     def data: string
-    def _2: string = cast _1
     =copy(name data, arg _2)
   finally:
     =destroy(name data)
@@ -55,10 +55,10 @@ scope:
 scope:
   try:
     def _0: seq[byte] = newSeq(arg 100) (raises)
-    def_cursor _1: openArray[byte] = toOpenArray _0
+    def _1: openArray[byte] = toOpenArray _0
     def _2: seq[byte] = encode(arg _1) (raises)
+    def_cursor _3: string = cast _2
     def data: string
-    def _3: string = cast _2
     =copy(name data, arg _3)
   finally:
     =destroy(name data)
diff --git a/tests/misc/tdont_fold_procedure_cast.nim b/tests/misc/tdont_fold_procedure_cast.nim
index 56a58dc4a92..81e6ce7d4c2 100644
--- a/tests/misc/tdont_fold_procedure_cast.nim
+++ b/tests/misc/tdont_fold_procedure_cast.nim
@@ -8,9 +8,10 @@ discard """
   nimout: '''
 --expandArc: test
 scope:
-  def p: proc (x: float){.nimcall.} = cast other
-  def_cursor _0: proc (x: int){.nimcall.} = cast p
-  _0(arg 1) (raises)
+  def_cursor _0: proc (x: float){.nimcall.} = cast other
+  def p: proc (x: float){.nimcall.} = copy _0
+  def_cursor _1: proc (x: int){.nimcall.} = cast p
+  _1(arg 1) (raises)
 -- end of expandArc ------------------------
   '''
   output: "1"

From 4948ae809f7d84ef6d765111a7cd0c7cf2ae77d2 Mon Sep 17 00:00:00 2001
From: Saem Ghani <saemghani+github@gmail.com>
Date: Sun, 18 Feb 2024 15:59:14 -0800
Subject: [PATCH 006/169] sem: template `typed` param only  in using pos
 (#1199)

## Summary

Disallow substitution of `typed` template parameters in defining
positions, restricting them to substitution in using positions only.

## Details

Updated `semtempl` to only allow `untyped` parameters to be inserted
into definition positions during template parameter substitution. This
is based on lessons learned following the initial changes to template
parameter substitution rules in:
483726f957da5660268d0f72120ec234509a7b0c via the PR
https://github.com/nim-works/nimskull/pull/605

Along with this change, the substitution test has been expanded and the
manual updated.

---------

Co-authored-by: zerbina <100542850+zerbina@users.noreply.github.com>
---
 compiler/sem/semtempl.nim                     | 19 ++++++-----
 doc/manual.rst                                | 19 ++++++-----
 ...usage_substitution_nonast_typed_params.nim | 25 ---------------
 ...mplate_usage_substitution_typed_params.nim | 32 +++++++++++++++++++
 4 files changed, 50 insertions(+), 45 deletions(-)
 delete mode 100644 tests/lang_callable/template/template_usage_substitution_nonast_typed_params.nim
 create mode 100644 tests/lang_callable/template/template_usage_substitution_typed_params.nim

diff --git a/compiler/sem/semtempl.nim b/compiler/sem/semtempl.nim
index 8ddbc3061fa..be499f5cb9d 100644
--- a/compiler/sem/semtempl.nim
+++ b/compiler/sem/semtempl.nim
@@ -40,18 +40,18 @@
 ## Substitution Positions
 ## ----------------------
 ## Templates are ultimately AST level constructs regardless of output type,
-## even they follow the grammar. There are two types of positions in a template
-## body, one is `definition` and the other is `usage`. A `definition` are any
+## they must be valid syntax. There are two types of positions in a template
+## body, one is `definition` and the other is `usage`. A `definition` is any
 ## position where the grammar construct is intended to introduce a new symbol,
 ## i.e.: the name of a routine, including its parameters; names of variables
 ## (`const`, `let`, `var`), and so on. All other sites are `usage` sites, where
-## a symbol of "chunk" of AST might be used.
+## a symbol referring to a "chunk" of AST might be used.
 ## 
 ## This is a draft of subsitution rules:
-## - `untyped` template bodies accept `typed` and `untyped` params in
-##   definition or usage positions; and all other params are usage only
-## - `typed` template bodies accept `typed` and `untyped` params in definition
-##    or usage positions; and all other params are usage only
+## - `untyped` template bodies accept `untyped` params in definition or usage
+##   positions; and all other params are usage only
+## - `typed` template bodies accept `untyped` params in definition or usage
+##   positions; and all other params are usage only
 ## - non-ast template bodies only allow subsitutions within usage positions
 
 discard """
@@ -257,9 +257,8 @@ func isTemplParam(c: TemplCtx, n: PNode): bool {.inline.} =
     sfTemplateParam in n.sym.flags
 
 func definitionTemplParam(c: TemplCtx, n: PNode): bool {.inline.} =
-  ## True if `n` is an AST typed (`typed`/`untyped`) parameter symbol of the
-  ## current template
-  isTemplParam(c, n) and n.sym.typ.kind in {tyUntyped, tyTyped}
+  ## True if `n` is an `untyped` parameter symbol of the current template.
+  isTemplParam(c, n) and n.sym.typ.kind in {tyUntyped}
 
 proc semTemplBody(c: var TemplCtx, n: PNode): PNode
 
diff --git a/doc/manual.rst b/doc/manual.rst
index cc37bc7a9e6..53af501e4e9 100644
--- a/doc/manual.rst
+++ b/doc/manual.rst
@@ -5421,7 +5421,7 @@ Templates
 
 A template is a form of metaprogramming: a template call evaluates to a
 |Nimskull| abstract syntax tree that is substituted in place of the call. The
-evaluation and substitution is done during semantic pass of the compiler.
+evaluation and substitution is done during the semantic pass of the compiler.
 
 The syntax to *invoke* a template is the same as calling a procedure.
 
@@ -5441,8 +5441,8 @@ templates:
 | `a in b` is transformed into `contains(b, a)`.
 | `notin` and `isnot` have the obvious meanings.
 
-The "types" of templates can be the symbols `untyped`, `typed` or `typedesc`.
-These are "meta types", they can only be used in certain contexts. Regular
+The "types" of templates can be the symbols `untyped`, `typed` or `typedesc`,
+these are "meta types" and can only be used in certain contexts. Regular
 types can be used too; this implies that `typed` expressions are expected.
 
 **Future directions**: the output type of a template is the output type of the
@@ -5450,10 +5450,10 @@ template body, which itself can be thought of as an out parameter. Templates
 will be classified into two major categories AST output (`untyped` and `typed`)
 and expression based (other types). Along with substitution positions (see
 below) template evaluation will be revised as follows:
-- `untyped` template: allow `typed` and `untyped` params in defining or
-  using positions; and all other params only in using positions
-- `typed` template: allow `typed` and `untyped` params in defining or using
-  positions; and all other params only in using positions
+- `untyped` template: allow `untyped` parameters in defining or using
+  positions; and all other parameters only in using positions
+- `typed` template: allow `untyped` parameters in defining or using positions;
+  and all other parameters only in using positions
 - non-ast template: only allow substitution in the using positions
 The above direction describes the nuance that will be incorporated into a
 broader redesign of how templates work in |Nimskull|.
@@ -5495,9 +5495,8 @@ performed before the expression is passed to the template. This allows
 
   declareInt(x) # invalid, because x has not been declared and so it has no type
 
-`typed` and `untyped` parameters may appear in defining or using symbol
-positions, while all other parameters are only substituted for using symbol
-positions.
+`untyped` parameters may appear in defining or using symbol positions, while
+all other parameters are only substituted for using symbol positions.
 
 A template where every parameter is `untyped` is called an `immediate`:idx:
 template. For historical reasons, templates can be explicitly annotated with
diff --git a/tests/lang_callable/template/template_usage_substitution_nonast_typed_params.nim b/tests/lang_callable/template/template_usage_substitution_nonast_typed_params.nim
deleted file mode 100644
index 302fbb4b5b7..00000000000
--- a/tests/lang_callable/template/template_usage_substitution_nonast_typed_params.nim
+++ /dev/null
@@ -1,25 +0,0 @@
-discard """
-  description: '''
-Templates parameters of non-AST type do not replace identifiers in new symbol
-definition positions. Meaning a template parameter that is not `untyped` or
-`typed` will not substitute for a matching identifier if defining things like
-variables, routines, parameters, types, fields, etc.
-'''
-"""
-
-block originally_this_did_not_work_now_it_does:
-  # this was kept for historical reasons and can be replaced, when this was an
-  # error it originated from https://github.com/nim-lang/nim/issues/3158
-  type
-    MyData = object
-      x: int
-
-  template newDataWindow(data: ref MyData): untyped =
-    proc testProc(data: ref MyData): string =
-      "Hello, " & $data.x
-    testProc(data)
-
-  var d: ref MyData
-  new(d)
-  d.x = 10
-  doAssert newDataWindow(d) == "Hello, 10"
\ No newline at end of file
diff --git a/tests/lang_callable/template/template_usage_substitution_typed_params.nim b/tests/lang_callable/template/template_usage_substitution_typed_params.nim
new file mode 100644
index 00000000000..9b000e071f6
--- /dev/null
+++ b/tests/lang_callable/template/template_usage_substitution_typed_params.nim
@@ -0,0 +1,32 @@
+discard """
+  description: '''
+Except for `untyped`, template parameters do not replace identifiers in new
+symbol definition positions. Meaning a template parameter that is not `untyped`
+will not substitute for a matching identifier if defining things like
+variables, routines, parameters, types, fields, etc.
+'''
+"""
+
+block originally_this_did_not_work_now_it_does:
+  # this was kept for historical reasons and can be replaced, when this was an
+  # error, example originated from https://github.com/nim-lang/nim/issues/3158
+  type
+    MyData = object
+      x: int
+
+  template newDataWindow(data: ref MyData): untyped =
+    proc testProc(data: ref MyData): string =
+      "Hello, " & $data.x
+    testProc(data)
+
+  var d: ref MyData
+  new(d)
+  d.x = 10
+  doAssert newDataWindow(d) == "Hello, 10"
+
+block also_true_for_typed_parameters:
+  template foo(a: typed): untyped =
+    let a = a + 10
+    a
+  let x = foo(10)
+  doAssert x == 20
\ No newline at end of file

From 8e2d0faf5fa2ba0cc4c50f1ba44dbeefafd57786 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Mon, 19 Feb 2024 21:03:42 +0100
Subject: [PATCH 007/169] refactor: remove `Values` type from `analysis`
 (#1201)

## Summary

Replace the `Values` usages in `injectdestructors` with directly using
a `PackedSet`, and remove the `Values` type.
---
 compiler/mir/analysis.nim          | 11 -----------
 compiler/sem/injectdestructors.nim | 29 +++++++++++++++++------------
 2 files changed, 17 insertions(+), 23 deletions(-)

diff --git a/compiler/mir/analysis.nim b/compiler/mir/analysis.nim
index eec14495a53..f815d493586 100644
--- a/compiler/mir/analysis.nim
+++ b/compiler/mir/analysis.nim
@@ -38,11 +38,6 @@ import
   ]
 
 type
-  Values* = object
-    ## Stores information about MIR expressions.
-    owned: PackedSet[OpValue]
-      ## all lvalue expressions that can be moved from
-
   AliveState = enum
     unchanged
     dead
@@ -58,12 +53,6 @@ func skipConversions*(tree: MirTree, val: OpValue): OpValue =
   while tree[result].kind == mnkPathConv:
     result = tree.operand(result)
 
-func isOwned*(v: Values, val: OpValue): bool {.inline.} =
-  val in v.owned
-
-func markOwned*(v: var Values, val: OpValue) {.inline.} =
-  v.owned.incl val
-
 func isAlive*(tree: MirTree, cfg: DataFlowGraph,
              span: Subgraph, loc: Path, start: InstrPos): bool =
   ## Computes whether the location named by `loc` does contain a value (i.e.,
diff --git a/compiler/sem/injectdestructors.nim b/compiler/sem/injectdestructors.nim
index fb8471c3f07..07d961727c2 100644
--- a/compiler/sem/injectdestructors.nim
+++ b/compiler/sem/injectdestructors.nim
@@ -175,11 +175,15 @@ type
     needsFinally: bool  ## whether the destructor needs to be placed in a
                         ## 'finally' clause
 
+  Moves = PackedSet[OpValue]
+    ## A set storing the operands of all sinks that were collapsed into
+    ## moves.
+
   AnalysisResults = object
     ## Bundled-up immutable state needed for assignment rewriting. Since
     ## they're immutable, ``Cursor``s are used in order to not copy
     # XXX: ideally, view types (i.e. ``lent``) would be used here
-    v: Cursor[Values]
+    moves: Cursor[Moves]
     entities: Cursor[EntityDict]
     destroy: Cursor[seq[DestroyEntry]]
 
@@ -357,9 +361,10 @@ func computeOwnership(tree: MirTree, cfg: DataFlowGraph, entities: EntityDict,
     unreachable()
 
 func collapseSink(tree: MirTree, cfg: var DataFlowGraph,
-                  entities: EntityDict): Values =
+                  entities: EntityDict): Moves =
   ## Computes for every ``mnkSink`` node what operation (copy or move) it has
-  ## to collapse to, returning the result(s) as a ``Values`` instance.
+  ## to collapse to, returning a set with the operands of all sinks that are
+  ## collapsed into moves.
   ##
   ## In addition, the DFG instructions in `cfg` for sinks-turned-into-moves
   ## are updated to ``opConsume`` instructions.
@@ -375,7 +380,7 @@ func collapseSink(tree: MirTree, cfg: var DataFlowGraph,
          computeOwnership(tree, cfg, entities,
                           computePath(tree, NodePosition opr), i + 1):
         update.add i
-        result.markOwned(opr)
+        result.incl opr
 
       # for the moment, sinks are always turned into copies for values without
       # custom destroy/copy/sink behaviour
@@ -553,13 +558,13 @@ func needsReset(tree: MirTree, cfg: DataFlowGraph, ar: AnalysisResults,
     # the presence of the value is observed -> a reset is required
     result = true
 
-func isMove(tree: MirTree, v: Values, n: NodePosition): bool =
+func isMove(tree: MirTree, moves: Moves, n: NodePosition): bool =
   ## Returns whether the assignment modifier at `n` is a move modifier (after
   ## collapsing sink).
   case tree[n].kind:
   of mnkCopy: false
   of mnkMove: true
-  of mnkSink: v.isOwned(tree.operand(n))
+  of mnkSink: tree.operand(n) in moves
   else:       unreachable(tree[n].kind)
 
 # ------- code generation routines --------
@@ -662,7 +667,7 @@ proc expandAsgn(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
   if relation.isSame:
     # a self-assignment -> elide
     c.remove(tree, stmt)
-  elif isMove(tree, ar.v[], operator):
+  elif isMove(tree, ar.moves[], operator):
     # a move is possible -> sink
     if true:
       template needsReset(): bool =
@@ -740,7 +745,7 @@ proc expandDef(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
     dest     = tree.child(at, 0)
     operator = tree.child(at, 1)
     source   = tree.child(operator, 0)
-  case isMove(tree, ar.v[], operator)
+  case isMove(tree, ar.moves[], operator)
   of false:
     # a copy is required. Transform ``def x = copy a.b`` into:
     #   def x
@@ -895,7 +900,7 @@ proc rewriteAssignments(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
         # only rewrite definitions with modifiers. The ``move`` modifier
         # is ignored since there's nothing to be rewritten for it
         if tree[src].kind in ModifierNodes - {mnkMove}:
-          if not isMove(tree, ar.v[], src):
+          if not isMove(tree, ar.moves[], src):
             checkCopy(ctx.graph, tree, src, diags)
             # emit a warning for copies-to-sink
             if isUsedForSink(tree, stmt):
@@ -906,7 +911,7 @@ proc rewriteAssignments(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
         let src = tree.child(stmt, 1)
         # only rewrite assignments with modifiers
         if tree[src].kind in ModifierNodes:
-          if not isMove(tree, ar.v[], src):
+          if not isMove(tree, ar.moves[], src):
             checkCopy(ctx.graph, tree, src, diags)
           expandAsgn(tree, ctx, ar, env, stmt, i, c)
       else:
@@ -1157,13 +1162,13 @@ proc injectDestructorCalls*(g: ModuleGraph, idgen: IdGenerator,
 
     let
       entities = initEntityDict(body.code, actx.cfg)
-      values = collapseSink(body.code, actx.cfg, entities)
+      moves = collapseSink(body.code, actx.cfg, entities)
 
     let destructors = computeDestructors(body.code, actx.cfg, entities)
 
     rewriteAssignments(
       body.code, actx,
-      AnalysisResults(v: cursor(values),
+      AnalysisResults(moves: cursor(moves),
                       entities: cursor(entities),
                       destroy: cursor(destructors)),
       env, diags, changes)

From 8969bf2ef5996b51f3417c466865baf1f2b71a1b Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Mon, 19 Feb 2024 22:19:56 +0100
Subject: [PATCH 008/169] fix wrong signed-ness for floats in constants (#1202)

## Summary

Fix the sign of `0.0` float values being inverted in implicit or
explicit constant expressions. All backends were affected, but the
issue only surfaced seemingly at random.

## Details

`datatables` used `exprStructuralEquivalent`, which treats `0.0` as
being equal to `-0.0`, for comparing nodes storing literal values.
Since the hashing procedure for nodes hashed the float values' bit-
representation, the problem only surfaced in case of hash or bucket
collision.

A dedicated comparison procedure that compares the bit-representations
of float values is now used, fixing the issue.
---
 compiler/mir/datatables.nim    | 23 +++++++++++++++++++++--
 tests/compiler/tdatatables.nim |  3 +--
 2 files changed, 22 insertions(+), 4 deletions(-)

diff --git a/compiler/mir/datatables.nim b/compiler/mir/datatables.nim
index e2ac06d6857..cefb94ba452 100644
--- a/compiler/mir/datatables.nim
+++ b/compiler/mir/datatables.nim
@@ -8,7 +8,6 @@ import
   compiler/ast/[
     ast_query,
     ast_types,
-    trees,
     types
   ],
   compiler/mir/[
@@ -74,6 +73,26 @@ func hashTree(tree: ConstrTree): Hash =
   result = result !& hash(tree[0].typ.kind)
   result = !$(result)
 
+func cmp(a, b: PNode): bool =
+  ## Compares for equality two nodes storing literal values. For float values,
+  ## their bit-representation is compared.
+  if a.kind != b.kind:
+    return false
+
+  case a.kind
+  of nkIntLiterals:
+    a.intVal == b.intVal
+  of nkFloatLiterals:
+    cast[BiggestUInt](a.floatVal) == cast[BiggestUInt](b.floatVal)
+  of nkStrLiterals:
+    a.strVal == b.strVal
+  of nkNilLit:
+    true
+  of nkRange:
+    cmp(a[0], b[0]) and cmp(a[1], b[1])
+  else:
+    unreachable(a.kind)
+
 proc cmp(a, b: ConstrTree): bool =
   ## Compares two MIR constant expressions for structural equality.
   proc `==`(a, b: MirNode): bool {.nimcall.} =
@@ -82,7 +101,7 @@ proc cmp(a, b: ConstrTree): bool =
 
     case a.kind
     of mnkLiteral:
-      exprStructuralEquivalent(a.lit, b.lit)
+      cmp(a.lit, b.lit)
     of mnkProc:
       a.prc == b.prc
     of mnkConstr, mnkObjConstr:
diff --git a/tests/compiler/tdatatables.nim b/tests/compiler/tdatatables.nim
index d0129b49977..9485607bdb8 100644
--- a/tests/compiler/tdatatables.nim
+++ b/tests/compiler/tdatatables.nim
@@ -37,8 +37,7 @@ block tree_equality:
     @[node(mnkLiteral, t1, lit, newStrNode(nkStrLit, "a"))],
     @[node(mnkLiteral, t1, lit, newFloatNode(nkFloatLit, 0.0))],
     # 0.0 and -0.0 are different float values
-    # FIXME: doesn't work yet
-    #@[node(mnkLiteral, t1, lit, newFloatNode(nkFloatLit, -0.0))],
+    @[node(mnkLiteral, t1, lit, newFloatNode(nkFloatLit, -0.0))],
 
     # --- ordered aggregates
     @[node(mnkConstr, t1, len, 0), node(mnkEnd)],

From 4f591b377fbbcaff7571387feb4680175fcac0b5 Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Tue, 20 Feb 2024 03:20:37 +0000
Subject: [PATCH 009/169] build(deps): Bump dawidd6/action-download-artifact
 from 3.0.0 to 3.1.1 (#1203)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bumps

[dawidd6/action-download-artifact](https://github.com/dawidd6/action-download-artifact)
from 3.0.0 to 3.1.1.
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a

href="https://github.com/dawidd6/action-download-artifact/releases">dawidd6/action-download-artifact's
releases</a>.</em></p>
<blockquote>
<h2>v3.1.1</h2>
<h2>What's Changed</h2>
<ul>
<li>Head sha revert by <a
href="https://github.com/romangg"><code>@​romangg</code></a> in <a

href="https://redirect.github.com/dawidd6/action-download-artifact/pull/271">dawidd6/action-download-artifact#271</a></li>
<li>build(deps): bump undici from 5.28.2 to 5.28.3 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/dawidd6/action-download-artifact/pull/272">dawidd6/action-download-artifact#272</a></li>
</ul>
<p><strong>Full Changelog</strong>: <a

href="https://github.com/dawidd6/action-download-artifact/compare/v3...v3.1.1">https://github.com/dawidd6/action-download-artifact/compare/v3...v3.1.1</a></p>
<h2>v3.1.0</h2>
<h2>What's Changed</h2>
<ul>
<li>build(deps): bump <code>@​actions/artifact</code> from 2.0.0 to
2.0.1 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/dawidd6/action-download-artifact/pull/267">dawidd6/action-download-artifact#267</a></li>
<li>build(deps): bump actions/upload-artifact from 3 to 4 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/dawidd6/action-download-artifact/pull/264">dawidd6/action-download-artifact#264</a></li>
<li>build(deps): bump <code>@​actions/artifact</code> from 2.0.1 to
2.1.1 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/dawidd6/action-download-artifact/pull/269">dawidd6/action-download-artifact#269</a></li>
<li>Optionally search for workflows by <a
href="https://github.com/romangg"><code>@​romangg</code></a> in <a

href="https://redirect.github.com/dawidd6/action-download-artifact/pull/270">dawidd6/action-download-artifact#270</a></li>
</ul>
<h2>New Contributors</h2>
<ul>
<li><a href="https://github.com/romangg"><code>@​romangg</code></a> made
their first contribution in <a

href="https://redirect.github.com/dawidd6/action-download-artifact/pull/270">dawidd6/action-download-artifact#270</a></li>
</ul>
<p><strong>Full Changelog</strong>: <a

href="https://github.com/dawidd6/action-download-artifact/compare/v3...v3.1.0">https://github.com/dawidd6/action-download-artifact/compare/v3...v3.1.0</a></p>
</blockquote>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a

href="https://github.com/dawidd6/action-download-artifact/commit/72aaadce3bc708349fc665eee3785cbb1b6e51d0"><code>72aaadc</code></a>
build(deps): bump undici from 5.28.2 to 5.28.3 (<a

href="https://redirect.github.com/dawidd6/action-download-artifact/issues/272">#272</a>)</li>
<li><a

href="https://github.com/dawidd6/action-download-artifact/commit/e454ec2044fbb6b77c4c69ad26c5e5c2427458c5"><code>e454ec2</code></a>
Head sha revert (<a

href="https://redirect.github.com/dawidd6/action-download-artifact/issues/271">#271</a>)</li>
<li><a

href="https://github.com/dawidd6/action-download-artifact/commit/f6b0bace624032e30a85a8fd9c1a7f8f611f5737"><code>f6b0bac</code></a>
Optionally search for workflows (<a

href="https://redirect.github.com/dawidd6/action-download-artifact/issues/270">#270</a>)</li>
<li><a

href="https://github.com/dawidd6/action-download-artifact/commit/a07e1dd02259003cd866ea4e16c903f1459e46a4"><code>a07e1dd</code></a>
build(deps): bump <code>@​actions/artifact</code> from 2.0.1 to 2.1.1
(<a

href="https://redirect.github.com/dawidd6/action-download-artifact/issues/269">#269</a>)</li>
<li><a

href="https://github.com/dawidd6/action-download-artifact/commit/2a4aebd3cbaad4fd177bb9819f3553fa8e2b8cd0"><code>2a4aebd</code></a>
build(deps): bump actions/upload-artifact from 3 to 4 (<a

href="https://redirect.github.com/dawidd6/action-download-artifact/issues/264">#264</a>)</li>
<li><a

href="https://github.com/dawidd6/action-download-artifact/commit/919731637237edfee1503d8a42b0e0caa49a4c63"><code>9197316</code></a>
build(deps): bump <code>@​actions/artifact</code> from 2.0.0 to 2.0.1
(<a

href="https://redirect.github.com/dawidd6/action-download-artifact/issues/267">#267</a>)</li>
<li><a

href="https://github.com/dawidd6/action-download-artifact/commit/e73ee10c7552966e58bde25ecb4a0033cd13a843"><code>e73ee10</code></a>
README: fix</li>
<li><a

href="https://github.com/dawidd6/action-download-artifact/commit/5a9d5a89d110d4559c2f3e29fe323d1789397d7c"><code>5a9d5a8</code></a>
README: update</li>
<li>See full diff in <a

href="https://github.com/dawidd6/action-download-artifact/compare/v3.0.0...v3.1.1">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility

score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=dawidd6/action-download-artifact&package-manager=github_actions&previous-version=3.0.0&new-version=3.1.1)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase` .

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 .github/workflows/publisher.yml | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/.github/workflows/publisher.yml b/.github/workflows/publisher.yml
index 694f51c37ae..9bc6c6939ed 100644
--- a/.github/workflows/publisher.yml
+++ b/.github/workflows/publisher.yml
@@ -30,7 +30,7 @@ jobs:
 
       # Download the latest instance of artifacts from a build done previously
       - name: Download generated docs
-        uses: dawidd6/action-download-artifact@v3.0.0
+        uses: dawidd6/action-download-artifact@v3.1.1
         with:
           workflow: ci.yml
           workflow_conclusion: success
@@ -40,7 +40,7 @@ jobs:
           path: doc/html
 
       - name: Download generated source archive
-        uses: dawidd6/action-download-artifact@v3.0.0
+        uses: dawidd6/action-download-artifact@v3.1.1
         with:
           workflow: ci.yml
           workflow_conclusion: success
@@ -50,7 +50,7 @@ jobs:
           path: release-staging
 
       - name: Download generated release binaries
-        uses: dawidd6/action-download-artifact@v3.0.0
+        uses: dawidd6/action-download-artifact@v3.1.1
         with:
           workflow: ci.yml
           workflow_conclusion: success
@@ -61,7 +61,7 @@ jobs:
           path: release-staging
 
       - name: Download release manifest tool
-        uses: dawidd6/action-download-artifact@v3.0.0
+        uses: dawidd6/action-download-artifact@v3.1.1
         with:
           workflow: ci.yml
           workflow_conclusion: success

From 4c2ff3c4f9f8e1b16e7f0504a16d14acf8cc4b28 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Tue, 20 Feb 2024 21:36:54 +0100
Subject: [PATCH 010/169] mir: separate hook injection from move analyzer
 (#1204)

## Summary

Make turning copy and move assignments into `=copy` and `=sink` calls a
standalone MIR pass; semantics don't change, but higher quality MIR
code is produced. This is progress towards fully decoupling lifetime
hooks from the move analyzer / destructor injection.

## Details

### General architecture

* the `injectdestructors` pass/module only collapses `sink` assignments
  and updates the MIR tree accordingly
* turning copy assignments into `=copy` and sink assignments into
  `=sink` calls is done by the new `injecthooks` pass/module
* reporting errors and warnings regarding hooks is also made part of
  the `injecthooks` pass
* the `injecthooks` pass is run after the `injectdestructors` pass
* handling of `--expandArc` is moved to `backends.process`, so that it
  can happen after hook injection

### `injectdestructors` Pass

* assignments are not replaced with `=copy` or `=sink` calls
* `expandAsgn` is renamed to `specializeAsgn`
* `sink` assignments are turned into either `copy`, `move`, or
  destructive `move` assignments (same as before)
* assignments to locations that don't yet store a value are turned into
  *initializing* assignments (this is necessary for the later `=sink`
  injection to work)
* compared to before, *all* assignments are processed by
  `specializeAsgn`, not only those for locations with lifetime hooks
* `=destroy` hooks are still injected

### `injecthooks` Pass

* the pass looks for `move` and `copy` assignment modifiers
  * if the involved type has lifetime hooks, the assignment is
     replaced with a call to the appropriate hook
  * the same injection rules as used previously apply
* the error detection and reporting logic is moved over - without
  change - from `injectdestructors`
* an adapter procedure for the legacy pass management is provided
  (needed by `backends`)

With less surrounding complexity, more effort is spent on using fewer
temporaries for the hook call injection:
* no temporary is used for the destination operand
* no temporary is used for the source operand when it's guaranteed to
  not alias the destination. This is the case for:
  * `move` assignments
  * define with `copy` (e.g., `def x = copy y`)
  * initial assignments with `copy` (e.g., `x := copy y`)

Fewer temporaries mean less work for the pass eliminating unnecessary
temporaries.

### Technical Correctness

* `mirconstr.inline` is only usable with lvalue expressions and always
  creates a non-owning temporary (instead of an owning temporary)
* the remaining usage of `mirconstr.inline` in
  `injectdestructors.lowerBranchSwitch`, where an owning temporary is
  required, is replaced with using `wrapTemp`

---------

Co-authored-by: Saem Ghani <saemghani+github@gmail.com>
---
 compiler/backend/backends.nim             |  12 +-
 compiler/mir/injecthooks.nim              | 259 +++++++++++++++
 compiler/mir/mirconstr.nim                |  18 +-
 compiler/sem/injectdestructors.nim        | 369 +++++-----------------
 tests/arc/topt_no_cursor.nim              |  56 ++--
 tests/arc/topt_wasmoved_destroy_pairs.nim |   6 +-
 6 files changed, 378 insertions(+), 342 deletions(-)
 create mode 100644 compiler/mir/injecthooks.nim

diff --git a/compiler/backend/backends.nim b/compiler/backend/backends.nim
index a2e48ec4b28..5fe5bd5fe03 100644
--- a/compiler/backend/backends.nim
+++ b/compiler/backend/backends.nim
@@ -4,6 +4,7 @@ import
   std/[
     deques,
     dynlib, # for computing possible candidate names
+    strtabs,
     tables
   ],
   compiler/ast/[
@@ -17,10 +18,12 @@ import
     cgirgen
   ],
   compiler/front/[
+    msgs,
     options
   ],
   compiler/mir/[
     datatables,
+    injecthooks,
     mirbodies,
     mirbridge,
     mirconstr,
@@ -28,7 +31,8 @@ import
     mirgen,
     mirpasses,
     mirtrees,
-    sourcemaps
+    sourcemaps,
+    utils
   ],
   compiler/modules/[
     modulegraphs,
@@ -324,6 +328,12 @@ proc process(body: var MirBody, prc: PSym, graph: ModuleGraph,
   ## procedure.
   if shouldInjectDestructorCalls(prc):
     injectDestructorCalls(graph, idgen, env, prc, body)
+    injectHooks(body, graph, env, prc)
+
+    if graph.config.arcToExpand.hasKey(prc.name.s):
+      graph.config.msgWrite("--expandArc: " & prc.name.s & "\n")
+      graph.config.msgWrite(render(body.code, addr env))
+      graph.config.msgWrite("\n-- end of expandArc ------------------------\n")
 
   let target =
     case graph.config.backend
diff --git a/compiler/mir/injecthooks.nim b/compiler/mir/injecthooks.nim
new file mode 100644
index 00000000000..d7d4cad67a3
--- /dev/null
+++ b/compiler/mir/injecthooks.nim
@@ -0,0 +1,259 @@
+## Implements the MIR pass for replacing copy and move assignments with the
+## ``=copy`` or ``=sink`` hook (if available for the type).
+##
+## Future direction: injection of ``=destroy`` hooks also needs to happen
+## here.
+
+import
+  compiler/ast/[
+    ast_query,
+    ast_types,
+    lineinfos
+  ],
+  compiler/front/[
+    msgs,
+    options
+  ],
+  compiler/mir/[
+    mirbodies,
+    mirchangesets,
+    mirconstr,
+    mirenv,
+    mirtrees
+  ],
+  compiler/modules/[
+    modulegraphs
+  ],
+  compiler/utils/[
+    idioms
+  ]
+
+# XXX: reports are a code smell meaning data types are misplaced
+from compiler/ast/reports_sem import SemReport
+from compiler/ast/report_enums import ReportKind
+
+# XXX: temporary dependency until destroy hooks are injected here
+from compiler/sem/injectdestructors import getOp, genDestroy, buildVoidCall
+
+from compiler/sem/liftdestructors import boolLit, cyclicType
+
+type
+  LocalDiagKind = enum
+    ldkPassCopyToSink       ## a copy is introduced in a consume context
+    ldkUnavailableTypeBound ## a type-bound operator is requested but not
+                            ## available
+
+  LocalDiag = object
+    ## A temporary diagnostic representation that is later turned into a
+    ## ``SemReport``
+    pos: NodePosition ## the location of the report
+    case kind: LocalDiagKind
+    of ldkUnavailableTypeBound:
+      op: TTypeAttachedOp
+    of ldkPassCopyToSink:
+      discard
+
+const
+  skipAliases = {tyGenericInst, tyAlias, tySink}
+
+proc isUsedForSink(tree: MirTree, stmt: NodePosition): bool =
+  ## Computes whether the definition statement is something produced for
+  ## sink parameter handling.
+  assert tree[stmt].kind in {mnkDef, mnkDefUnpack}
+  let def = tree.operand(stmt, 0)
+  if tree[def].kind != mnkTemp:
+    # only temporaries are used for sink handling
+    return
+
+  # look for whether the temporary is used as a 'consume' node's operand,
+  # but do reduce the amount of work by not searching beyond the
+  # temporary's lifetime
+  # HACK: this detection relies on the code shapes ``mirgen`` currently
+  #       emits for sink parameters and is thus very brittle. The proper
+  #       solution is to mark through a side channel the statement as being
+  #       generated for a sink parameter
+  var
+    n = tree.sibling(stmt)
+    depth = 0
+  while n < NodePosition tree.len:
+    case tree[n].kind
+    of mnkConsume:
+      let x = tree.operand(n)
+      if tree[x].kind == mnkTemp and tree[x].temp == tree[def].temp:
+        # the temporary is used for sink parameter passing
+        result = true
+        break
+    of mnkScope:
+      inc depth
+    of mnkEnd:
+      if tree[n].kind == mnkScope:
+        dec depth
+        if depth < 0:
+          # the end of the temporary's surrounding scope is reached
+          break
+    else:
+      discard
+
+    inc n
+
+proc reportDiagnostics(g: ModuleGraph, body: MirBody,
+                       owner: PSym, diags: var seq[LocalDiag]) =
+  ## Reports all diagnostics in `diags` as ``SemReport``s and clear the list
+  for diag in diags.items:
+    let ast = body.sourceFor(diag.pos)
+    let rep =
+      case diag.kind
+      of ldkUnavailableTypeBound:
+        SemReport(kind: rsemUnavailableTypeBound,
+                  typ: body[diag.pos].typ,
+                  str: AttachedOpToStr[diag.op],
+                  ast: ast,
+                  sym: owner)
+      of ldkPassCopyToSink:
+        SemReport(kind: rsemCopiesToSink, ast: ast)
+
+    localReport(g.config, ast.info, rep)
+
+func couldIntroduceCycle(tree: MirTree, dest: NodePosition): bool =
+  # copies to locals or globals can't introduce cyclic structures, as
+  # both are standlone and not part of any other structure
+  tree[dest].kind notin {mnkLocal, mnkTemp, mnkParam, mnkGlobal}
+
+template genCopy(bu: var MirBuilder, graph: ModuleGraph, env: var MirEnv,
+             op: PSym, tree: MirTree, dst: NodePosition,
+             maybeCyclic: bool, src: untyped) =
+  ## Emits a ``=copy`` hook call with `dst` and `src` as the arguments. If ORC
+  ## is enabled, an additional bool value is passed to the hook, informing
+  ## whether a reference cycle might be created at run-time.
+  bu.buildVoidCall(env, op):
+    bu.emitByName ekMutate:
+      bu.emitFrom(tree, dst)
+    bu.subTree mnkArg:
+      src
+
+    if graph.config.selectedGC == gcOrc and
+       cyclicType(tree[dst].typ.skipTypes(skipAliases + {tyDistinct}), graph):
+      # pass whether the copy can potentially introduce cycles as the third
+      # parameter:
+      let c = maybeCyclic and couldIntroduceCycle(tree, dest)
+      bu.emitByVal literal(boolLit(graph, unknownLineInfo, c))
+
+proc injectHooks*(body: MirBody, graph: ModuleGraph, env: var MirEnv,
+                  owner: PSym, changes: var Changeset) =
+  ## Replaces all copy and move assignments for locations with lifetime hooks
+  ## to the types' respective hook.
+  var diags: seq[LocalDiag]
+  template tree: MirTree = body.code
+
+  for i, n in tree.pairs:
+    case n.kind
+    of mnkCopy:
+      let
+        stmt = tree.parent(i)
+        typ  = tree[stmt, 0].typ
+
+      if not hasDestructor(typ):
+        # nothing to insert
+        continue
+
+      let
+        dest = tree.child(stmt, 0)
+        src  = tree.child(i, 0)
+        op   = getOp(graph, typ, attachedAsgn)
+
+      if sfError in op.flags:
+        # emit an error if the hook is not available, but still continue
+        diags.add LocalDiag(pos: src, kind: ldkUnavailableTypeBound,
+                            op: attachedAsgn)
+
+      if tree[stmt].kind == mnkDef and isUsedForSink(tree, stmt):
+        # emit a warning for copies-to-sink:
+        diags.add LocalDiag(pos: src, kind: ldkPassCopyToSink)
+
+      case tree[stmt].kind
+      of mnkDef, mnkDefUnpack:
+        # turn a ``def x = copy a.b`` into:
+        #   def x
+        #   =copy(name x, arg a.b)
+        changes.replace(tree, i): MirNode(kind: mnkNone)
+        changes.insert(tree, tree.sibling(stmt), i, bu):
+          # the destination is a local; the assignment thus cannot introduce a
+          # cycle
+          genCopy(bu, graph, env, op, tree, dest, false):
+            bu.emitFrom(tree, src)
+      of mnkInit:
+        # we know the destination cannot overlap with the source. Replace
+        # ``x := copy a.b`` with:
+        #   =copy(name x, arg a.b)
+        changes.replaceMulti(tree, stmt, bu):
+          genCopy(bu, graph, env, op, tree, dest, true):
+            bu.emitFrom(tree, src)
+      of mnkAsgn:
+        # the source and destination could overlap. Replace ``x = copy a.b``
+        # with:
+        #   def_cursor _1 = a.b
+        #   =copy(name x, arg _1)
+        # XXX: the temporary could be omitted in more cases by using proper
+        #      alias analysis
+        changes.replaceMulti(tree, stmt, bu):
+          let tmp = bu.inline(tree, src)
+          genCopy(bu, graph, env, op, tree, dest, true):
+            bu.use(tmp)
+      else:
+        unreachable(tree[stmt].kind)
+
+    of mnkMove:
+      let
+        stmt = tree.parent(i)
+        typ  = tree[stmt, 0].typ
+
+      if not hasDestructor(typ) or
+         tree[stmt].kind in {mnkDef, mnkDefUnpack, mnkInit}:
+        # nothing to do if:
+        # * the type has no hooks
+        # * it's guaranteed that there's no value in the destination
+        continue
+
+      let
+        dest = tree.child(stmt, 0)
+        src  = tree.child(i, 0)
+        op   = getOp(graph, typ, attachedSink)
+
+      # note: the move analyzer has to make sure that the source operand
+      # doesn't overlap with the destination, so no temporary for the source is
+      # needed
+      if op != nil:
+        # replace ``x = move a.b`` with:
+        #   =sink(name x, arg a.b)
+        changes.replaceMulti(tree, stmt, bu):
+          bu.buildVoidCall(env, op):
+            bu.subTree mnkName:
+              bu.subTree MirNode(kind: mnkTag, effect: ekMutate):
+                bu.emitFrom(tree, dest)
+            bu.subTree mnkArg:
+              bu.emitFrom(tree, src)
+      else:
+        # no sink hook exists, rewrite ``x.y = move a.b`` into:
+        #   bind_mut _1 = x.y
+        #   =destroy(name _1)
+        #   _1 = move a.b
+        var loc: Value
+        changes.insert(tree, stmt, dest, bu):
+          loc = bu.bindMut(tree, dest)
+          genDestroy(bu, graph, env, loc)
+        changes.replaceMulti(tree, dest, bu):
+          bu.use loc
+
+    else:
+      discard "nothing to do"
+
+  # turn the collected diagnostics into reports and report them:
+  reportDiagnostics(graph, body, owner, diags)
+
+proc injectHooks*(body: var MirBody, graph: ModuleGraph, env: var MirEnv,
+                  owner: PSym) =
+  ## Adapter for the legacy pass-application pipeline. Once possible, the pass
+  ## needs to be treated as just another MIR pass.
+  var c = initChangeset(body.code)
+  injectHooks(body, graph, env, owner, c)
+  apply(body.code, prepare(c))
diff --git a/compiler/mir/mirconstr.nim b/compiler/mir/mirconstr.nim
index e7db1ec85fa..32500e74733 100644
--- a/compiler/mir/mirconstr.nim
+++ b/compiler/mir/mirconstr.nim
@@ -352,10 +352,14 @@ func emitByVal*(bu: var MirBuilder, y: Value) =
   bu.subTree mnkArg:
     bu.use y
 
-func emitByName*(bu: var MirBuilder, val: Value, e: EffectKind) =
+template emitByName*(bu: var MirBuilder, e: EffectKind, body: untyped) =
   bu.subTree mnkName:
     bu.subTree MirNode(kind: mnkTag, effect: e):
-      bu.use val
+      body
+
+func emitByName*(bu: var MirBuilder, val: Value, e: EffectKind) =
+  bu.emitByName e:
+    bu.use val
 
 func move*(bu: var MirBuilder, val: Value) =
   ## Emits ``move val``.
@@ -375,17 +379,19 @@ func asgnMove*(bu: var MirBuilder, a, b: Value) =
     bu.move b
 
 func inline*(bu: var MirBuilder, tree: MirTree, fr: NodePosition): Value =
-  ## Inlines the operand for non-mutating use. This is meant to be used for
-  ## materialzing immutable arguments when inlining calls / expanding
+  ## Inlines the lvalue operand for non-mutating use. This is meant to be used
+  ## for materialzing immutable arguments when inlining calls / expanding
   ## assignments.
   case tree[fr].kind
   of Atoms:
     result = Value(node: tree[fr])
-  else:
+  of LvalueExprKinds - Atoms:
     result = allocTemp(bu, tree[fr].typ)
-    bu.subTree mnkDef:
+    bu.subTree mnkDefCursor:
       bu.use result
       bu.emitFrom(tree, fr)
+  else:
+    unreachable("can only inline lvalue-expression arguments")
 
 func bindImmutable*(bu: var MirBuilder, tree: MirTree,
                     lval: NodePosition): Value =
diff --git a/compiler/sem/injectdestructors.nim b/compiler/sem/injectdestructors.nim
index 07d961727c2..48e4335fc04 100644
--- a/compiler/sem/injectdestructors.nim
+++ b/compiler/sem/injectdestructors.nim
@@ -9,8 +9,8 @@
 
 ## This module implements the following MIR passes:
 ## - the 'switch' operation lowering (``lowerBranchSwitch``)
-## - the pass for rewriting assignments into calls to the respective
-##   lifetime-tracking hooks
+## - the pass for collapsing sink assignments into copies, moves, and
+##   destrutive moves
 ## - the pass for injected ``wasMoved`` calls for consumed lvalues
 ## - the destructor (i.e. ``=destroy`` hook) injection
 ##
@@ -102,7 +102,6 @@ import
     algorithm,
     hashes,
     packedsets,
-    strtabs,
     tables
   ],
   compiler/ast/[
@@ -117,16 +116,14 @@ import
     mirconstr,
     mirenv,
     mirtrees,
-    sourcemaps,
-    utils
+    sourcemaps
   ],
   compiler/modules/[
     magicsys,
     modulegraphs
   ],
   compiler/front/[
-    options,
-    msgs
+    options
   ],
   compiler/sem/[
     aliasanalysis,
@@ -139,10 +136,6 @@ import
     idioms
   ]
 
-# xxx: reports are a code smell meaning data types are misplaced
-from compiler/ast/reports_sem import SemReport
-from compiler/ast/report_enums import ReportKind
-
 type
   AnalyseCtx = object
     cfg: DataFlowGraph
@@ -187,25 +180,6 @@ type
     entities: Cursor[EntityDict]
     destroy: Cursor[seq[DestroyEntry]]
 
-  LocalDiagKind = enum
-    ldkPassCopyToSink       ## a copy is introduced in a consume context
-    ldkUnavailableTypeBound ## a type-bound operator is requested but not
-                            ## available
-
-  LocalDiag = object
-    ## A temporary diagnostic representation that is later turned into a
-    ## ``SemReport``
-    pos: NodePosition ## the location of the report
-    case kind: LocalDiagKind
-    of ldkUnavailableTypeBound:
-      op: TTypeAttachedOp
-    of ldkPassCopyToSink:
-      discard
-
-const
-  skipAliases = {tyGenericInst, tyAlias, tySink}
-    ## the set of types to not consider when looking up a type-bound operator
-
 iterator ritems[T](x: openArray[T]): lent T =
   ## Iterates and yields the items from the container `x` in reverse
   var i = x.high
@@ -558,18 +532,9 @@ func needsReset(tree: MirTree, cfg: DataFlowGraph, ar: AnalysisResults,
     # the presence of the value is observed -> a reset is required
     result = true
 
-func isMove(tree: MirTree, moves: Moves, n: NodePosition): bool =
-  ## Returns whether the assignment modifier at `n` is a move modifier (after
-  ## collapsing sink).
-  case tree[n].kind:
-  of mnkCopy: false
-  of mnkMove: true
-  of mnkSink: tree.operand(n) in moves
-  else:       unreachable(tree[n].kind)
-
 # ------- code generation routines --------
 
-template buildVoidCall(bu: var MirBuilder, env: var MirEnv, p: PSym,
+template buildVoidCall*(bu: var MirBuilder, env: var MirEnv, p: PSym,
                        body: untyped) =
   let prc = p # prevent multi evaluation
   bu.subTree mnkVoid:
@@ -596,46 +561,6 @@ proc genDestroy*(bu: var MirBuilder, graph: ModuleGraph, env: var MirEnv,
   bu.buildVoidCall(env, destr):
     bu.emitByName(target, ekMutate)
 
-proc genInjectedSink(bu: var MirBuilder, graph: ModuleGraph, env: var MirEnv,
-                     dest, source: Value) =
-  ## Generates and emits either a call to the ``=sink`` hook, or (if none
-  ## exists), a sink emulated via a destructor-call + bitwise-copy.
-  let op = getOp(graph, dest.typ, attachedSink)
-  if op != nil:
-    bu.buildVoidCall(env, op):
-      bu.emitByName(dest, ekMutate)
-      bu.emitByVal source
-  else:
-    # without a sink hook, a ``=destroy`` + blit-copy is used
-    genDestroy(bu, graph, env, dest)
-    bu.asgnMove dest, source
-
-proc genSinkFromTemporary(bu: var MirBuilder, graph: ModuleGraph,
-                          env: var MirEnv, dest, source: Value) =
-  ## Similar to ``genInjectedSink`` but generates code for destructively
-  ## moving the source operand into a temporary first.
-  let tmp = bu.materializeMove(source)
-  genWasMoved(bu, graph, source)
-  genInjectedSink(bu, graph, env, dest, tmp)
-
-proc genCopy(bu: var MirBuilder, graph: ModuleGraph, env: var MirEnv,
-             dst, src: Value, maybeCyclic: bool) =
-  ## Emits a ``=copy`` hook call with `dst`, `src`, and (if necessary)
-  ## `maybeCyclic` as the arguments.
-  let
-    t  = dst.typ
-    op = getOp(graph, t, attachedAsgn)
-
-  bu.buildVoidCall(env, op):
-    bu.emitByName(dst, ekMutate)
-    bu.emitByVal src
-
-    if graph.config.selectedGC == gcOrc and
-        cyclicType(t.skipTypes(skipAliases + {tyDistinct}), graph):
-      # pass whether the copy can potentially introduce cycles as the third
-      # parameter:
-      bu.emitByVal literal(boolLit(graph, unknownLineInfo, maybeCyclic))
-
 func destructiveMoveOperands(bu: var MirBuilder, tree: MirTree,
                              src: NodePosition
                             ): tuple[src, clear: Value] =
@@ -650,11 +575,17 @@ func destructiveMoveOperands(bu: var MirBuilder, tree: MirTree,
     # the assignment source
     (bu.bindImmutable(tree, src), bu.bindMut(tree, x))
 
-proc expandAsgn(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
-                env: var MirEnv, stmt: NodePosition, pos: InstrPos,
-                c: var Changeset) =
-  ## Rewrites the assignment at `stmt` into either a ``=copy`` hook call,
-  ## ``=sink`` hook call, move, or destructive move.
+proc specializeAsgn(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
+                    stmt: NodePosition, pos: InstrPos, c: var Changeset) =
+  ## Specializes the modifier-using assignment at `stmt` using the analysis
+  ## results:
+  ## * guaranteed self-assignments are eliminated (i.e., the assignment is
+  ##   removed)
+  ## * sink assignments are turned into copy, move, or destructive move
+  ##   assignments
+  ## * normal assignments are turned into initializing assignments (if
+  ##   possible)
+  ##
   ## `pos` is the 'def' data-flow instruction corresponding to the assignment.
   let
     dest       = tree.child(stmt, 0)
@@ -667,118 +598,57 @@ proc expandAsgn(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
   if relation.isSame:
     # a self-assignment -> elide
     c.remove(tree, stmt)
-  elif isMove(tree, ar.moves[], operator):
-    # a move is possible -> sink
-    if true:
-      template needsReset(): bool =
-        # only a ``sink`` modifier allows for the injection of resets
-        (tree[operator].kind == mnkSink and
-         needsReset(tree, ctx.cfg, ar, sourcePath, pos))
-
-      if tree[stmt].kind != mnkInit and
-         isAlive(tree, ctx.cfg, ar.entities[], destPath, pos):
-        # there already exists a value in the destination location -> use the
-        # sink operation
-        if true:
-          c.replaceMulti(tree, stmt, bu):
-            let a = bu.bindMut(tree, dest)
-            if isAPartOfB(relation) != no:
-              # this is a potential part-to-whole assignment, e.g.:
-              # ``x = move x.y``. We need to move the source value into a
-              # temporary first, as ``=sink`` would otherwise destroy ``x``
-              # first, also destroying ``x.y`` in the process
-              let b = bu.bindMut(tree, source)
-              genSinkFromTemporary(bu, ctx.graph, env, a, b)
-            elif needsReset():
-              # a sink from a location that needs to be reset after the move
-              # (i.e., a destructive move)
-              let (b, clear) = bu.destructiveMoveOperands(tree, source)
-              genInjectedSink(bu, ctx.graph, env, a, b)
-              genWasMoved(bu, ctx.graph, clear)
-            else:
-              # a sink from a location that doesn't need to be reset afterwards
-              let b = bu.bindImmutable(tree, source)
-              genInjectedSink(bu, ctx.graph, env, a, b)
-
-      elif needsReset():
-        # the destination location doesn't contain a value yet (which would
-        # need to be destroyed first otherwise) -> a bitwise copy can be used
-        # we don't need to check for part-to-whole assignments here, because
-        # if the destination location has no value, so don't locations derived
-        # from it, in which case it doesn't matter when the reset happens
-        # XXX: the reset could be omitted for part-to-whole assignments
-        c.replaceMulti(tree, stmt, bu):
-          let
-            a          = bu.bindMut(tree, dest)
-            (b, clear) = bu.destructiveMoveOperands(tree, source)
-          bu.asgnMove a, b
+  elif tree[operator].kind == mnkSink:
+    let isAlive = tree[stmt].kind == mnkAsgn and
+                  isAlive(tree, ctx.cfg, ar.entities[], destPath, pos)
+    if tree.operand(operator) in ar.moves[]:
+      # turn the sink into a move
+      if isAlive and isAPartOfB(relation) != no:
+        # it's potentially a part-to-whole assignment, e.g.: ``x = move x.y``,
+        # and the destination contains a value. The value must first be moved
+        # into a temporary, since a move destination must not overlap with
+        # the source
+        var tmp: Value
+        c.insert(tree, stmt, source, bu):
+          let b = bu.bindMut(tree, source)
+          tmp = bu.wrapTemp b.typ:
+            bu.move b
+          genWasMoved(bu, ctx.graph, b)
+
+        c.replaceMulti(tree, operator, bu):
+          bu.move tmp
+      elif needsReset(tree, ctx.cfg, ar, sourcePath, pos):
+        # the value can be moved, but the source location needs to be cleared
+        # afterwards. Turn ``a = sink x.y`` into:
+        #   bind_mut _1 = x.y
+        #   a = move _1
+        #   wasMoved(name _1)
+        var b, clear: Value
+        c.insert(tree, stmt, source, bu):
+          (b, clear) = bu.destructiveMoveOperands(tree, source)
+        c.replaceMulti(tree, operator, bu):
+          bu.move b
+        c.insert(tree, tree.sibling(stmt), source, bu):
           genWasMoved(bu, ctx.graph, clear)
-
-      elif tree[operator].kind == mnkSink:
-        # no reset and/or hook call needs to be injected, simply replace the
-        # sink modifier with a move
-        c.changeTree(tree, operator): MirNode(kind: mnkMove)
       else:
-        # no hook call nor destructive move is required
-        discard "nothing to do"
-
-  else:
-    # a move is not possible -> copy
-    c.replaceMulti(tree, stmt, bu):
-      # copies to locals or globals can't introduce cyclic structures, as
-      # those are standlone and not part of any other structure
-      let maybeCyclic =
-        tree[dest].kind notin {mnkLocal, mnkTemp, mnkParam, mnkGlobal}
-      let
-        a = bu.bindMut(tree, dest)
-        b = bu.inline(tree, source)
-
-      genCopy(bu, ctx.graph, env, a, b, maybeCyclic)
-
-proc expandDef(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
-               env: var MirEnv, at: NodePosition, pos: InstrPos,
-               c: var Changeset) =
-  ## Depending on whether the source can be moved out of, either rewrites the
-  ## 'def' at `at` into a call to the ``=copy`` hook call or into a
-  ## destructive or non-destructive move. `pos` is the data-flow instruction.
-  let
-    dest     = tree.child(at, 0)
-    operator = tree.child(at, 1)
-    source   = tree.child(operator, 0)
-  case isMove(tree, ar.moves[], operator)
-  of false:
-    # a copy is required. Transform ``def x = copy a.b`` into:
-    #   def x
-    #   bind _1 = a.b
-    #   =copy(name x, arg _1)
-    c.replace(tree, operator): MirNode(kind: mnkNone)
-    c.insert(tree, tree.sibling(at), source, bu):
-      let
-        a = bu.bindMut(tree, dest)
-        b = bu.inline(tree, source)
-      # the destination can only be a cell-like location (local, global,
-      # etc.), no cycle can possibly be introduced
-      genCopy(bu, ctx.graph, env, a, b, false)
-  of true:
-    assert tree[operator].kind == mnkSink
-    if needsReset(tree, ctx.cfg, ar, computePath(tree, source), pos):
-      # the value can be moved, but the location needs to be reset. Transform
-      # ``def x = sink a.b`` into:
-      #   bind_mut _1 = a.b
-      #   def x = move _1
-      #   wasMoved(name x)
-      var tmp, clear: Value
-      c.insert(tree, at, source, bu):
-        (tmp, clear) = bu.destructiveMoveOperands(tree, source)
-      c.replaceMulti(tree, operator, bu):
-        bu.move tmp
-      c.insert(tree, tree.sibling(at), source, bu):
-        genWasMoved(bu, ctx.graph, clear)
+        # the value can be moved without the source location having to be
+        # cleared
+        c.changeTree(tree, operator):
+          MirNode(kind: mnkMove, typ: tree[operator].typ)
     else:
-      # turn into a ``Move`` operation
+      # the value cannot be moved, turn the sink into a copy
       c.changeTree(tree, operator):
-        MirNode(kind: mnkMove, typ: tree[operator].typ)
+        MirNode(kind: mnkCopy, typ: tree[operator].typ)
 
+    if tree[stmt].kind == mnkAsgn and not isAlive:
+      # the assignment initializes the location
+      c.changeTree(tree, stmt): MirNode(kind: mnkInit)
+  else:
+    # it's a move or copy already, so nothing to change there
+    if tree[stmt].kind == mnkAsgn and
+       not isAlive(tree, ctx.cfg, ar.entities[], destPath, pos):
+      # the assignment initializes the location
+      c.changeTree(tree, stmt): MirNode(kind: mnkInit)
 
 proc consumeArg(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
                 expr: NodePosition, src: OpValue, pos: InstrPos,
@@ -816,56 +686,7 @@ proc consumeArg(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
         let v = bu.bindMut(tree, NodePosition src)
         genWasMoved(bu, ctx.graph, v)
 
-proc isUsedForSink(tree: MirTree, stmt: NodePosition): bool =
-  ## Computes whether the definition statement is something produced for
-  ## sink parameter handling.
-  assert tree[stmt].kind in {mnkDef, mnkDefUnpack}
-  let def = tree.operand(stmt, 0)
-  if tree[def].kind != mnkTemp:
-    # only temporaries are used for sink handling
-    return
-
-  # look for whether the temporary is used as a 'consume' node's operand,
-  # but do reduce the amount of work by not searching beyond the
-  # temporary's lifetime
-  # HACK: this detection relies on the code shapes ``mirgen`` currently
-  #       emits for sink parameters and is thus very brittle. The proper
-  #       solution is to mark through a side channel the statement as being
-  #       generated for a sink parameter
-  var
-    n = tree.sibling(stmt)
-    depth = 0
-  while n < NodePosition tree.len:
-    case tree[n].kind
-    of mnkConsume:
-      let x = tree.operand(n)
-      if tree[x].kind == mnkTemp and tree[x].temp == tree[def].temp:
-        # the temporary is used for sink parameter passing
-        result = true
-        break
-    of mnkScope:
-      inc depth
-    of mnkEnd:
-      if tree[n].kind == mnkScope:
-        dec depth
-        if depth < 0:
-          # the end of the temporary's surrounding scope is reached
-          break
-    else:
-      discard
-
-    inc n
-
-proc checkCopy(graph: ModuleGraph, tree: MirTree, expr: NodePosition,
-               diags: var seq[LocalDiag]) =
-  let op = getOp(graph, tree[expr].typ, attachedAsgn)
-  if sfError in op.flags:
-    diags.add LocalDiag(pos: expr,
-                        kind: ldkUnavailableTypeBound,
-                        op: attachedAsgn)
-
 proc rewriteAssignments(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
-                        env: var MirEnv, diags: var seq[LocalDiag],
                         c: var Changeset) =
   ## Rewrites assignments to locations into calls to either the ``=copy``
   ## or ``=sink`` hook (see ``expandAsgn`` for more details).
@@ -889,34 +710,11 @@ proc rewriteAssignments(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
         discard
       else:
         unreachable(tree[parent].kind)
-    elif opc == opDef and hasDestructor(tree[val].typ):
-      # where necessary, rewrite assignments into moves, destructive moves,
-      # and copies
-      let stmt = tree.parent(NodePosition val)
-
-      case tree[stmt].kind
-      of mnkDef, mnkDefUnpack:
-        let src = tree.child(stmt, 1)
-        # only rewrite definitions with modifiers. The ``move`` modifier
-        # is ignored since there's nothing to be rewritten for it
-        if tree[src].kind in ModifierNodes - {mnkMove}:
-          if not isMove(tree, ar.moves[], src):
-            checkCopy(ctx.graph, tree, src, diags)
-            # emit a warning for copies-to-sink
-            if isUsedForSink(tree, stmt):
-              diags.add LocalDiag(kind: ldkPassCopyToSink,
-                                  pos: src)
-          expandDef(tree, ctx, ar, env, stmt, i, c)
-      of mnkAsgn, mnkInit:
-        let src = tree.child(stmt, 1)
-        # only rewrite assignments with modifiers
-        if tree[src].kind in ModifierNodes:
-          if not isMove(tree, ar.moves[], src):
-            checkCopy(ctx.graph, tree, src, diags)
-          expandAsgn(tree, ctx, ar, env, stmt, i, c)
-      else:
-        # e.g., output arguments to procedures
-        discard "ignore"
+    elif opc == opDef and (let stmt = tree.parent(NodePosition val);
+          tree[stmt, 1].kind in {mnkCopy, mnkMove, mnkSink}):
+      # specialize the modifier-using assignment
+      assert tree[stmt].kind in {mnkDef, mnkDefUnpack, mnkAsgn, mnkInit}
+      specializeAsgn(tree, ctx, ar, stmt, i, c)
 
 # --------- destructor injection -------------
 
@@ -1026,13 +824,15 @@ proc lowerBranchSwitch(bu: var MirBuilder, body: MirTree, graph: ModuleGraph,
     typ = body[target].field.typ
 
   assert body[target].kind == mnkPathVariant
+  assert body[stmt, 1].kind in ModifierNodes
 
   let
     a = bu.wrapMutAlias(typ):
       # bind the discriminator lvalue, not the variant lvalue
       bu.subTree MirNode(kind: mnkPathNamed, typ: typ, field: body[target].field):
         bu.emitFrom(body, NodePosition body.operand(target))
-    b = bu.inline(body, body.child(stmt, 1))
+    b = bu.wrapTemp typ:
+      bu.emitFrom(body, body.child(stmt, 1))
 
   # check if the object contains fields requiring destruction:
   if hasDestructor(objType):
@@ -1093,24 +893,6 @@ proc lowerBranchSwitch(bu: var MirBuilder, body: MirTree, graph: ModuleGraph,
   # generate the ``discriminant = newValue`` assignment:
   bu.asgn(a, b)
 
-proc reportDiagnostics(g: ModuleGraph, body: MirBody,
-                       owner: PSym, diags: var seq[LocalDiag]) =
-  ## Reports all diagnostics in `diags` as ``SemReport``s and clear the list
-  for diag in diags.items:
-    let ast = body.sourceFor(diag.pos)
-    let rep =
-      case diag.kind
-      of ldkUnavailableTypeBound:
-        SemReport(kind: rsemUnavailableTypeBound,
-                  typ: body[diag.pos].typ,
-                  str: AttachedOpToStr[diag.op],
-                  ast: ast,
-                  sym: owner)
-      of ldkPassCopyToSink:
-        SemReport(kind: rsemCopiesToSink, ast: ast)
-
-    localReport(g.config, ast.info, rep)
-
 func shouldInjectDestructorCalls*(owner: PSym): bool =
   # only inject destructor calls if the owner is not a generated OP (e.g. a
   # generated ``=destroy``) and also not an ``.inline`` iterator
@@ -1157,7 +939,6 @@ proc injectDestructorCalls*(g: ModuleGraph, idgen: IdGenerator,
   block:
     var
       changes = initChangeset(body.code)
-      diags: seq[LocalDiag]
       actx = AnalyseCtx(graph: g, cfg: computeDfg(body.code))
 
     let
@@ -1171,16 +952,8 @@ proc injectDestructorCalls*(g: ModuleGraph, idgen: IdGenerator,
       AnalysisResults(moves: cursor(moves),
                       entities: cursor(entities),
                       destroy: cursor(destructors)),
-      env, diags, changes)
-
-    # turn the collected diagnostics into reports and report them:
-    reportDiagnostics(g, body, owner, diags)
+      changes)
 
     injectDestructors(body.code, g, destructors, env, changes)
 
     apply(changes)
-
-  if g.config.arcToExpand.hasKey(owner.name.s):
-    g.config.msgWrite("--expandArc: " & owner.name.s & "\n")
-    g.config.msgWrite(render(body.code, addr env))
-    g.config.msgWrite("\n-- end of expandArc ------------------------\n")
\ No newline at end of file
diff --git a/tests/arc/topt_no_cursor.nim b/tests/arc/topt_no_cursor.nim
index 3546a896f86..398a0fe593f 100644
--- a/tests/arc/topt_no_cursor.nim
+++ b/tests/arc/topt_no_cursor.nim
@@ -24,7 +24,7 @@ scope:
   def _2: string = move _6
   wasMoved(name _6)
   def _3: Target = construct (consume _0, consume _1, consume _2)
-  result = move _3
+  result := move _3
   =destroy(name splat)
 -- end of expandArc ------------------------
 --expandArc: delete
@@ -33,20 +33,16 @@ scope:
   def_cursor _0: Node = target[]
   def_cursor _1: Node = _0[].parent
   def sibling: Node
-  def _6: Node = _1[].left
-  =copy(name sibling, arg _6) (raises)
+  =copy(name sibling, arg _1[].left) (raises)
   def_cursor _2: Node = sibling
   def saved: Node
-  def _7: Node = _2[].right
-  =copy(name saved, arg _7) (raises)
+  =copy(name saved, arg _2[].right) (raises)
   def_cursor _3: Node = sibling
   def_cursor _4: Node = saved
-  bind_mut _8: Node = _3[].right
-  def _9: Node = _4[].left
-  =copy(name _8, arg _9) (raises)
+  def_cursor _6: Node = _4[].left
+  =copy(name _3[].right, arg _6) (raises)
   def_cursor _5: Node = sibling
-  bind_mut _10: Node = _5[].parent
-  =sink(name _10, arg saved) (raises)
+  =sink(name _5[].parent, arg saved) (raises)
   =destroy(name sibling) (raises)
 -- end of expandArc ------------------------
 --expandArc: p1
@@ -59,13 +55,13 @@ scope:
   def _1: seq[int] = move lresult
   def _: (seq[int], string) = construct (consume _1, consume ";")
   bind_mut _3: seq[int] = _.0
-  lvalue = move _3
+  lvalue := move _3
   wasMoved(name _3)
   bind_mut _4: string = _.1
-  lnext = move _4
+  lnext := move _4
   wasMoved(name _4)
   def _2: seq[int] = move(name lvalue)
-  result.value = move _2
+  result.value := move _2
   =destroy(name _)
   =destroy(name lnext)
   =destroy(name lvalue)
@@ -76,11 +72,9 @@ scope:
   try:
     def_cursor it: KeyValue = x
     def _0: seq[int]
-    def _4: seq[int] = it.0
-    =copy(name _0, arg _4)
+    =copy(name _0, arg it.0)
     def _1: seq[int]
-    def _5: seq[int] = it.1
-    =copy(name _1, arg _5)
+    =copy(name _1, arg it.1)
     def a: (seq[int], seq[int]) = construct (consume _0, consume _1)
     def_cursor _2: (seq[int], seq[int]) = a
     def _3: string = $(arg _2) (raises)
@@ -120,7 +114,7 @@ scope:
                     def _7: bool = eqStr(arg _6, arg "opt")
                     if _7:
                       scope:
-                        def _10: string = splitted[1]
+                        def_cursor _10: string = splitted[1]
                         =copy(name lan_ip, arg _10)
                     def_cursor _8: string = lan_ip
                     echo(arg type(array[0..0, string]), arg _8) (raises)
@@ -136,8 +130,7 @@ scope:
 scope:
   try:
     def shadowScope: Scope
-    def _7: Scope = c[].currentScope
-    =copy(name shadowScope, arg _7) (raises)
+    =copy(name shadowScope, arg c[].currentScope) (raises)
     rawCloseScope(arg c) (raises)
     scope:
       def_cursor _0: Scope = shadowScope
@@ -160,8 +153,7 @@ scope:
                   def_cursor _5: int = i
                   def sym: lent Symbol = borrow a[_5]
                   def _6: Symbol
-                  def _8: Symbol = sym[]
-                  =copy(name _6, arg _8)
+                  =copy(name _6, arg sym[])
                   addInterfaceDecl(arg c, consume _6) (raises)
                 i = addI(arg i, arg 1) (raises)
   finally:
@@ -177,7 +169,7 @@ scope:
     def _2: bool = eqI(arg _1, arg 2)
     if _2:
       scope:
-        result = move x
+        result := move x
         wasMoved(name x)
         return
     def_cursor _3: sink string = x
@@ -202,8 +194,7 @@ scope:
       if _3:
         scope:
           def _4: string
-          def _16: string = this[].value
-          =copy(name _4, arg _16)
+          =copy(name _4, arg this[].value)
           _1 := construct (consume _4, consume "")
           break L0
       scope:
@@ -211,12 +202,11 @@ scope:
           def_cursor _5: string = this[].value
           def _6: string = parentDir(arg _5) (raises)
           def _7: string
-          def _17: string = this[].value
-          =copy(name _7, arg _17)
+          =copy(name _7, arg this[].value)
           def _8: tuple[head: string, tail: string] = splitPath(consume _7) (raises)
-          bind_mut _18: string = _8.1
-          def _9: string = move _18
-          wasMoved(name _18)
+          bind_mut _16: string = _8.1
+          def _9: string = move _16
+          wasMoved(name _16)
           _1 := construct (consume _6, consume _9)
           wasMoved(name _6)
         finally:
@@ -231,13 +221,11 @@ scope:
           def_cursor _12: string = par.0
           def_cursor _13: string = par.1
           def _14: seq[string] = getSubDirs(arg _12, arg _13) (raises)
-          bind_mut _19: seq[string] = this[].matchDirs
-          =sink(name _19, arg _14)
+          =sink(name this[].matchDirs, arg _14)
           break L1
       scope:
         def _15: seq[string] = construct ()
-        bind_mut _20: seq[string] = this[].matchDirs
-        =sink(name _20, arg _15)
+        =sink(name this[].matchDirs, arg _15)
   finally:
     =destroy(name par)
 -- end of expandArc ------------------------'''
diff --git a/tests/arc/topt_wasmoved_destroy_pairs.nim b/tests/arc/topt_wasmoved_destroy_pairs.nim
index 6ee175c65ac..3e23ce3ee25 100644
--- a/tests/arc/topt_wasmoved_destroy_pairs.nim
+++ b/tests/arc/topt_wasmoved_destroy_pairs.nim
@@ -29,7 +29,7 @@ scope:
     scope:
       def a: int = 0
       def b: int = 4
-      def i: int = sink a
+      def i: int = copy a
       block L0:
         scope:
           while true:
@@ -76,11 +76,11 @@ scope:
       scope:
         return
     def _0: string = boolToStr(arg cond)
-    str = move _0
+    str := move _0
     def _1: bool = not(arg cond)
     if _1:
       scope:
-        result = move str
+        result := move str
         wasMoved(name str)
         return
   finally:

From f46227d7e16c444282f3ea51cc807a51c9122653 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Fri, 23 Feb 2024 02:54:13 +0100
Subject: [PATCH 011/169] fix(sem): crash with manual `=destroy` hook call
 (#1205)

## Summary

Fix a bug where manually calling the `=destroy` (or `=trace`) hook for
a type where the hook is compiler-generated crashed the compiler when
the call is within a typed procedure definition that is returned by a
macro or template.

Fixes https://github.com/nim-works/nimskull/issues/1161.

## Details

All compiler-synthesized hook procedures are marked as `sfFromGeneric`.
The `owner` of such procedures is expected to be the generic procedure
the procedure is an instantiation of (`skipGenericOwner` the immediate
owner), but this wasn't the case for the synthesized hooks, where the
owner was set to the owner of the type the hook is synthesized for.

When a compiler-synthesized hook is used in overload resolution, the
search for the owning module in `initCallCandidate` skips over the
`skModule` symbol (via `skipGenericOwner`), thus resulting in an NPE.

To fix the issue, the owner of synthesized hook procedures is now set
to the hook kind's corresponding generic magic procedure from the
`system` module, making the produced symbols well-formed.

---------

Co-authored-by: Saem Ghani <saemghani+github@gmail.com>
---
 compiler/ast/ast_query.nim                    |  2 +
 compiler/sem/liftdestructors.nim              |  8 ++--
 .../tsynthesized_destroy_hook_roundtrip.nim   | 43 +++++++++++++++++++
 3 files changed, 50 insertions(+), 3 deletions(-)
 create mode 100644 tests/lang_callable/macros/tsynthesized_destroy_hook_roundtrip.nim

diff --git a/compiler/ast/ast_query.nim b/compiler/ast/ast_query.nim
index 19c9fa1426f..57533b37bbe 100644
--- a/compiler/ast/ast_query.nim
+++ b/compiler/ast/ast_query.nim
@@ -209,6 +209,8 @@ const
   UnknownLockLevel* = TLockLevel(1001'i16)
   AttachedOpToStr*: array[TTypeAttachedOp, string] = [
     "=destroy", "=copy", "=sink", "=trace", "=deepcopy"]
+  AttachedOpToMagic*: array[TTypeAttachedOp, TMagic] = [
+    mDestroy, mAsgn, mAsgn, mTrace, mDeepCopy]
 
 
 proc `$`*(x: TLockLevel): string =
diff --git a/compiler/sem/liftdestructors.nim b/compiler/sem/liftdestructors.nim
index b909adf6a69..7493f01316d 100644
--- a/compiler/sem/liftdestructors.nim
+++ b/compiler/sem/liftdestructors.nim
@@ -854,9 +854,11 @@ proc produceSymDistinctType(g: ModuleGraph; c: PContext; typ: PType;
 
 proc symPrototype(g: ModuleGraph; typ: PType; owner: PSym; kind: TTypeAttachedOp;
               info: TLineInfo; idgen: IdGenerator): PSym =
-
+  # a synthesized hook is treated as an instantiation of the respective generic
+  # magic procedure from the system module
   let procname = getIdent(g.cache, AttachedOpToStr[kind])
-  result = newSym(skProc, procname, nextSymId(idgen), owner, info)
+  let base = getSysMagic(g, info, AttachedOpToStr[kind], AttachedOpToMagic[kind])
+  result = newSym(skProc, procname, nextSymId(idgen), base, info)
   let dest = newSym(skParam, getIdent(g.cache, "dest"), nextSymId(idgen), result, info)
   let src = newSym(skParam, getIdent(g.cache, if kind == attachedTrace: "env" else: "src"),
                    nextSymId(idgen), result, info)
@@ -866,7 +868,7 @@ proc symPrototype(g: ModuleGraph; typ: PType; owner: PSym; kind: TTypeAttachedOp
   else:
     src.typ = typ
 
-  result.typ = newProcType(info, nextTypeId(idgen), owner)
+  result.typ = newProcType(info, nextTypeId(idgen), result)
   result.typ.addParam dest
   if kind != attachedDestructor:
     result.typ.addParam src
diff --git a/tests/lang_callable/macros/tsynthesized_destroy_hook_roundtrip.nim b/tests/lang_callable/macros/tsynthesized_destroy_hook_roundtrip.nim
new file mode 100644
index 00000000000..dd3ae20c77f
--- /dev/null
+++ b/tests/lang_callable/macros/tsynthesized_destroy_hook_roundtrip.nim
@@ -0,0 +1,43 @@
+discard """
+  description: '''
+    Regression test for a bug where manually invoking a type's `=destroy` hook
+    within a procedure defined as part of a typed macro/template argument
+    crashed the compiler
+  '''
+"""
+
+type Destroy = object
+  ## A type that has a user-defined destroy hook.
+
+proc `=destroy`(x: var Destroy) =
+  discard
+
+type
+  NoHookObject = object
+    ## Object type where no destroy hook needs to be synthesized.
+  HookObject = object
+    ## Object type that needs a compiler-synthesized destroy hook.
+    field: Destroy
+
+macro m(x: typed): untyped = x
+
+# the compiler crashed when processing the macro output
+m:
+  proc f() =
+    # the bug only surfaced when the hook call is part of a procedure. Types
+    # that need a compiler-synthesized as well as those that don't were
+    # affected.
+    var v = NoHookObject()
+    `=destroy`(v)
+    var v2 = HookObject()
+    `=destroy`(v2)
+
+# the same bug happened when using a template:
+template t(x: typed): untyped = x
+
+t:
+  proc f2() =
+    var v = NoHookObject()
+    `=destroy`(v)
+    var v2 = HookObject()
+    `=destroy`(v2)
\ No newline at end of file

From 55deaaa31f54f81b4c21db86c93230cb629a7822 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sat, 24 Feb 2024 17:50:38 +0100
Subject: [PATCH 012/169] mir: separate destructor from `=destroy` injection
 (#1206)

## Summary

Introduce the new `destroy` MIR operation and use it to decouple
destructor injection from the injection of `=destroy` hooks. Injection
of lifetime hooks is now fully decoupled from the move-analyzer /
destructor-injection pass. This is an internal-only change.

## Details

* introduce the `mnkDestroy` node kind / operator
* instead of `=destroy` hook calls, the `injectdestructors` pass only
  injects `mnkDestroy` operations
* the `injecthooks` pass then replaces `mnkDestroy` operations with
  `=destroy` calls
* the `getOp` and `genDestroy` procedures are moved to `injecthooks`
  without change
* injection of `=destroy` calls for variant objects (part of the
  `mnkSwitch` lowering) is still part of the `injectdestructors` pass
* since `mnkDestroy` operations are replaced right away, both `mirexec`
  and `cgirgen` (MIR-to-CGIR translation) don't handle them yet
---
 compiler/backend/cgirgen.nim       |  2 ++
 compiler/mir/injecthooks.nim       | 52 ++++++++++++++++++++++++++----
 compiler/mir/mirtrees.nim          |  7 ++--
 compiler/mir/utils.nim             |  4 +++
 compiler/sem/injectdestructors.nim | 46 +++++---------------------
 compiler/sem/mirexec.nim           |  2 ++
 compiler/sem/modulelowering.nim    |  2 +-
 doc/mir.rst                        |  1 +
 8 files changed, 68 insertions(+), 48 deletions(-)

diff --git a/compiler/backend/cgirgen.nim b/compiler/backend/cgirgen.nim
index 96b31615263..18c3f8ad58b 100644
--- a/compiler/backend/cgirgen.nim
+++ b/compiler/backend/cgirgen.nim
@@ -741,6 +741,8 @@ proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
       res.kids.addIfNotEmpty stmtToIr(tree, env, cl, cr)
   of mnkScope:
     toSingleNode scopeToIr(tree, env, cl, cr)
+  of mnkDestroy:
+    unreachable("a 'destroy' that wasn't lowered")
   of AllNodeKinds - StmtNodes:
     unreachable(n.kind)
 
diff --git a/compiler/mir/injecthooks.nim b/compiler/mir/injecthooks.nim
index d7d4cad67a3..6f7d3b08b44 100644
--- a/compiler/mir/injecthooks.nim
+++ b/compiler/mir/injecthooks.nim
@@ -1,10 +1,13 @@
-## Implements the MIR pass for replacing copy and move assignments with the
-## ``=copy`` or ``=sink`` hook (if available for the type).
-##
-## Future direction: injection of ``=destroy`` hooks also needs to happen
-## here.
+## Implements the MIR pass for:
+## * replacing copy and move assignments with the ``=copy`` or ``=sink``
+##   hook (if available for the type).
+## * replacing destroy operations with calls to the ``=destroy`` hook (if
+##   available for the type)
 
 import
+  std/[
+    tables
+  ],
   compiler/ast/[
     ast_query,
     ast_types,
@@ -24,6 +27,9 @@ import
   compiler/modules/[
     modulegraphs
   ],
+  compiler/sem/[
+    sighashes
+  ],
   compiler/utils/[
     idioms
   ]
@@ -32,8 +38,8 @@ import
 from compiler/ast/reports_sem import SemReport
 from compiler/ast/report_enums import ReportKind
 
-# XXX: temporary dependency until destroy hooks are injected here
-from compiler/sem/injectdestructors import getOp, genDestroy, buildVoidCall
+# XXX: temporary dependency until switch assignments are lowered differently
+from compiler/sem/injectdestructors import buildVoidCall
 
 from compiler/sem/liftdestructors import boolLit, cyclicType
 
@@ -56,6 +62,18 @@ type
 const
   skipAliases = {tyGenericInst, tyAlias, tySink}
 
+proc getOp*(g: ModuleGraph, t: PType, kind: TTypeAttachedOp): PSym =
+  ## Returns the symbol for the `kind` type-bound hook for `t` (or nil, if
+  ## there's none).
+  let t = t.skipTypes(skipForHooks)
+  result = getAttachedOp(g, t, kind)
+  if result == nil or result.ast.isGenericRoutine:
+    # give up and find the canonical type instead:
+    let h = sighashes.hashType(t, {CoType, CoDistinct})
+    let canon = g.canonTypes.getOrDefault(h)
+    if canon != nil:
+      result = getAttachedOp(g, canon, kind)
+
 proc isUsedForSink(tree: MirTree, stmt: NodePosition): bool =
   ## Computes whether the definition statement is something produced for
   ## sink parameter handling.
@@ -138,6 +156,13 @@ template genCopy(bu: var MirBuilder, graph: ModuleGraph, env: var MirEnv,
       let c = maybeCyclic and couldIntroduceCycle(tree, dest)
       bu.emitByVal literal(boolLit(graph, unknownLineInfo, c))
 
+proc genDestroy*(bu: var MirBuilder, graph: ModuleGraph, env: var MirEnv,
+                 target: Value) =
+  ## Emits a destructor call with `target` as the argument.
+  let destr = getOp(graph, target.typ, attachedDestructor)
+  bu.buildVoidCall(env, destr):
+    bu.emitByName(target, ekMutate)
+
 proc injectHooks*(body: MirBody, graph: ModuleGraph, env: var MirEnv,
                   owner: PSym, changes: var Changeset) =
   ## Replaces all copy and move assignments for locations with lifetime hooks
@@ -244,6 +269,19 @@ proc injectHooks*(body: MirBody, graph: ModuleGraph, env: var MirEnv,
         changes.replaceMulti(tree, dest, bu):
           bu.use loc
 
+    of mnkDestroy:
+      let destr = getOp(graph, tree[tree.operand(i)].typ, attachedDestructor)
+      changes.replaceMulti(tree, i, bu):
+        bu.buildVoidCall(env, destr):
+          # XXX: the by-name passing and usage of ``ekMutate`` is not really
+          #      correct. For all intents and purposes, a destructor
+          #      *consumes* the value (and then effectively voids it), meaning
+          #      that ``mnkConsume`` should actually be used. However, this
+          #      would require changing the signature of ``=destroy`` to use
+          #      ``sink``
+          bu.emitByName ekMutate:
+            bu.emitFrom(tree, tree.child(i, 0))
+
     else:
       discard "nothing to do"
 
diff --git a/compiler/mir/mirtrees.nim b/compiler/mir/mirtrees.nim
index d29892ae298..85578bf341f 100644
--- a/compiler/mir/mirtrees.nim
+++ b/compiler/mir/mirtrees.nim
@@ -239,6 +239,9 @@ type
 
     mnkBranch ## defines a branch of an ``mnkExcept`` or ``mnkCase``
 
+    mnkDestroy## destroys the value stored in the given location, leaving the
+              ## location in an undefined state
+
     mnkAsm    ## embeds backend-dependent code directly into the output
     mnkEmit   ## embeds backend-dependent code directly into the output
 
@@ -339,7 +342,7 @@ const
                          mnkAddr, mnkDeref, mnkView, mnkDerefView, mnkStdConv,
                          mnkConv, mnkCast, mnkRaise, mnkTag, mnkArg,
                          mnkName, mnkConsume, mnkVoid, mnkCopy, mnkMove,
-                         mnkSink}
+                         mnkSink, mnkDestroy}
     ## Nodes that start sub-trees but that always have a single sub node.
 
   ArgumentNodes* = {mnkArg, mnkName, mnkConsume}
@@ -363,7 +366,7 @@ const
 
   StmtNodes* = {mnkScope, mnkStmtList, mnkIf, mnkCase, mnkRepeat, mnkTry,
                 mnkBlock, mnkBreak, mnkReturn, mnkRaise, mnkPNode, mnkInit,
-                mnkAsgn, mnkSwitch, mnkVoid, mnkRaise, mnkEmit,
+                mnkAsgn, mnkSwitch, mnkVoid, mnkRaise, mnkDestroy, mnkEmit,
                 mnkAsm} + DefNodes
 
   UnaryOps*  = {mnkNeg}
diff --git a/compiler/mir/utils.nim b/compiler/mir/utils.nim
index 4bbf962cc2f..735978b6b1a 100644
--- a/compiler/mir/utils.nim
+++ b/compiler/mir/utils.nim
@@ -492,6 +492,10 @@ proc stmtToStr(nodes: MirTree, i: var int, indent: int, result: var string,
     tree "raise ":
       valueToStr()
     result.add "\n"
+  of mnkDestroy:
+    tree "destroy ":
+      valueToStr()
+      result.add "\n"
   of mnkPNode:
     result.add repeat("  ", indent)
     result.add "PNode " & $n.node & "\n"
diff --git a/compiler/sem/injectdestructors.nim b/compiler/sem/injectdestructors.nim
index 48e4335fc04..fa48d3d6c6f 100644
--- a/compiler/sem/injectdestructors.nim
+++ b/compiler/sem/injectdestructors.nim
@@ -12,7 +12,7 @@
 ## - the pass for collapsing sink assignments into copies, moves, and
 ##   destrutive moves
 ## - the pass for injected ``wasMoved`` calls for consumed lvalues
-## - the destructor (i.e. ``=destroy`` hook) injection
+## - the pass for injecting destructors
 ##
 ## Overview
 ## ========
@@ -129,7 +129,6 @@ import
     aliasanalysis,
     liftdestructors,
     mirexec,
-    sighashes
   ],
   compiler/utils/[
     cursors,
@@ -229,16 +228,6 @@ func findScope(entities: EntityDict, name: EntityName, at: InstrPos,
 proc getVoidType(g: ModuleGraph): PType {.inline.} =
   g.getSysType(unknownLineInfo, tyVoid)
 
-proc getOp*(g: ModuleGraph, t: PType, kind: TTypeAttachedOp): PSym =
-  let t = t.skipTypes(skipForHooks)
-  result = getAttachedOp(g, t, kind)
-  if result == nil or result.ast.isGenericRoutine:
-    # give up and find the canonical type instead:
-    let h = sighashes.hashType(t, {CoType, CoDistinct})
-    let canon = g.canonTypes.getOrDefault(h)
-    if canon != nil:
-      result = getAttachedOp(g, canon, kind)
-
 func isNamed(tree: MirTree, val: OpValue): bool =
   ## Returns whether `val` is the projection of a named location (or refers to
   ## the named location itself).
@@ -554,13 +543,6 @@ proc genWasMoved(bu: var MirBuilder, graph: ModuleGraph, target: Value) =
     bu.buildMagicCall mWasMoved, getVoidType(graph):
       bu.emitByName(target, ekKill)
 
-proc genDestroy*(bu: var MirBuilder, graph: ModuleGraph, env: var MirEnv,
-                 target: Value) =
-  let destr = getOp(graph, target.typ, attachedDestructor)
-
-  bu.buildVoidCall(env, destr):
-    bu.emitByName(target, ekMutate)
-
 func destructiveMoveOperands(bu: var MirBuilder, tree: MirTree,
                              src: NodePosition
                             ): tuple[src, clear: Value] =
@@ -718,22 +700,12 @@ proc rewriteAssignments(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
 
 # --------- destructor injection -------------
 
-proc injectDestructorsInner(bu: var MirBuilder, orig: MirTree,
-                            graph: ModuleGraph, env: var MirEnv,
-                            entries: openArray[DestroyEntry]) =
-  ## Generates a destructor call for each item in `entries`, using `buf` as the
-  ## output.
+proc injectDestroysAux(bu: var MirBuilder, orig: MirTree,
+                       entries: openArray[DestroyEntry]) =
+  ## Emits a destroy operation for each item in `entries`.
   for it in ritems(entries):
-    let def = getDefEntity(orig, it.pos)
-    let t =
-      case orig[def].kind
-      of SymbolLike: orig[def].sym.typ
-      of mnkGlobal:  orig[def].typ
-      of mnkTemp:    orig[def].typ
-      else:          unreachable()
-
-    bu.buildVoidCall(env, getOp(graph, t, attachedDestructor)):
-      bu.emitByName(Value(node: orig[def]), ekMutate)
+    bu.subTree mnkDestroy:
+      bu.emitFrom(orig, getDefEntity(orig, it.pos))
 
 proc injectDestructors(tree: MirTree, graph: ModuleGraph,
                        destroy: seq[DestroyEntry], env: var MirEnv,
@@ -803,13 +775,11 @@ proc injectDestructors(tree: MirTree, graph: ModuleGraph,
           # there's no need for opening a new scope -- we use a statement-list
           # instead
           buf.subTree MirNode(kind: mnkStmtList):
-            injectDestructorsInner(buf, tree, graph, env,
-                                   toOpenArray(entries, s.a, s.b))
+            injectDestroysAux(buf, tree, toOpenArray(entries, s.a, s.b))
 
         buf.add endNode(mnkTry)
       else:
-        injectDestructorsInner(buf, tree, graph, env,
-                               toOpenArray(entries, s.a, s.b))
+        injectDestroysAux(buf, tree, toOpenArray(entries, s.a, s.b))
 
 proc lowerBranchSwitch(bu: var MirBuilder, body: MirTree, graph: ModuleGraph,
                        idgen: IdGenerator, env: var MirEnv,
diff --git a/compiler/sem/mirexec.nim b/compiler/sem/mirexec.nim
index c9b51c3fbeb..bb0d6bccf45 100644
--- a/compiler/sem/mirexec.nim
+++ b/compiler/sem/mirexec.nim
@@ -561,6 +561,8 @@ func computeDfg*(tree: MirTree): DataFlowGraph =
       emitForValue(env, tree, i, tree.operand(i, 1))
     of mnkVoid:
       emitForExpr(env, tree, i, NodePosition tree.operand(i))
+    of mnkDestroy:
+      unreachable("not implemented yet")
     of mnkEmit, mnkAsm:
       emitForArgs(env, tree, i, i)
 
diff --git a/compiler/sem/modulelowering.nim b/compiler/sem/modulelowering.nim
index 694d1955586..cce620e81f9 100644
--- a/compiler/sem/modulelowering.nim
+++ b/compiler/sem/modulelowering.nim
@@ -36,7 +36,7 @@ import
     idioms
   ]
 
-from compiler/sem/injectdestructors import getOp
+from compiler/mir/injecthooks import getOp
 
 type
   ModuleStructs* = object
diff --git a/doc/mir.rst b/doc/mir.rst
index 1a6c0514193..ac7fff3ac45 100644
--- a/doc/mir.rst
+++ b/doc/mir.rst
@@ -173,6 +173,7 @@ Semantics
             | Return                    # exit the procedure, but execute all
                                         # enclosing finalizers first (from
                                         # innermost to outermost)
+            | Destroy LVALUE
             | Emit VALUE ...
             | Asm VALUE ...
 

From 9be395f752aa23c01e7214987e0b2386609ae821 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Mon, 26 Feb 2024 22:24:54 +0100
Subject: [PATCH 013/169] cgen: better default initialization for `result`
 (#1209)

## Summary

Use a MIR pass for handling the default-initialization of `result`
variables for the C backend. This allows using the MIR's more precise
data-flow analysis, allowing for broader omission of `result` variable
initialization.

## Details

* introduce the `injectResultInit` MIR pass
  * it's only used with the C backend for now
  * if a data-flow analysis deems it required, a `result := default()`
    assignment is placed at the start of the body
* remove the `CgNode`-based `result`-assignment analysis from `cgen`

### Data-flow Analysis Bug

A small bug with the `mirexec.traverse` (forward traversal) routine
was discovered and fixed: the `exit` flag was erroneously set to true
when the main path was aborted on a data-flow instruction that's the
last instruction in the subgraph. The `exit` flag must only be true
when the end of the subgraph is reached, so this is wrong.

A regression test for the `traverse` routine is added.

This bug only affected the `injectdestructors.needsReset` optimization
(unnecessary but otherwise harmless `wasMoved` calls were injected
because of it) and `injectResultInit` (unnecessary initialization was
emitted).
---
 compiler/backend/cgen.nim     | 124 ----------------------------------
 compiler/mir/mirconstr.nim    |   3 +
 compiler/mir/mirpasses.nim    |  60 ++++++++++++++++
 compiler/sem/mirexec.nim      |   9 ++-
 tests/compiler/tmir_exec2.nim |  40 +++++++++++
 5 files changed, 109 insertions(+), 127 deletions(-)
 create mode 100644 tests/compiler/tmir_exec2.nim

diff --git a/compiler/backend/cgen.nim b/compiler/backend/cgen.nim
index 0d72dafaa81..9556a1f08ef 100644
--- a/compiler/backend/cgen.nim
+++ b/compiler/backend/cgen.nim
@@ -730,117 +730,6 @@ proc closureSetup(p: BProc, prc: PSym) =
   linefmt(p, cpsStmts, "$1 = ($2) ClE_0;$n",
           [rdLoc(p.locals[n.local]), getTypeDesc(p.module, ls.typ)])
 
-func containsResult(n: CgNode): bool =
-  result = false
-  case n.kind
-  of cnkAtoms - {cnkLocal}:
-    discard "ignore"
-  of cnkLocal:
-    if n.local == resultId:
-      result = true
-  of cnkWithOperand:
-    result = containsResult(n.operand)
-  of cnkWithItems:
-    for i in 0..<n.len:
-      if containsResult(n[i]): return true
-
-type
-  InitResultEnum = enum Unknown, InitSkippable, InitRequired
-
-proc allPathsAsgnResult(n: CgNode): InitResultEnum =
-  # Exceptions coming from calls don't have not be considered here:
-  #
-  # proc bar(): string = raise newException(...)
-  #
-  # proc foo(): string =
-  #   # optimized out: 'reset(result)'
-  #   result = bar()
-  #
-  # try:
-  #   a = foo()
-  # except:
-  #   echo "a was not written to"
-  #
-  template allPathsInBranch(it) =
-    let a = allPathsAsgnResult(it)
-    case a
-    of InitRequired: return InitRequired
-    of InitSkippable: discard
-    of Unknown:
-      # sticky, but can be overwritten by InitRequired:
-      result = Unknown
-
-  result = Unknown
-  case n.kind
-  of cnkStmtList:
-    for it in n:
-      result = allPathsAsgnResult(it)
-      if result != Unknown: return result
-  of cnkAsgn, cnkFastAsgn:
-    if n[0].kind == cnkLocal and n[0].local == resultId:
-      if not containsResult(n[1]): result = InitSkippable
-      else: result = InitRequired
-    elif containsResult(n):
-      result = InitRequired
-  of cnkReturnStmt:
-      if true:
-        # This is a bare `return` statement, if `result` was not initialized
-        # anywhere else (or if we're not sure about this) let's require it to be
-        # initialized. This avoids cases like #9286 where this heuristic lead to
-        # wrong code being generated.
-        result = InitRequired
-  of cnkIfStmt:
-    result = InitSkippable
-    # the condition must not use 'result':
-    if containsResult(n[0]):
-      return InitRequired
-
-    allPathsInBranch(n[1])
-    # if the 'if' statement is not exhaustive and yet it touched 'result'
-    # in some way, say Unknown.
-    result = Unknown
-  of cnkCaseStmt:
-    if containsResult(n[0]): return InitRequired
-    result = InitSkippable
-    var exhaustive = skipTypes(n[0].typ,
-        abstractVarRange-{tyTypeDesc}).kind notin {tyFloat..tyFloat64, tyString}
-    for i in 1..<n.len:
-      let it = n[i]
-      allPathsInBranch(it.lastSon)
-      if not isOfBranch(it): exhaustive = true
-    if not exhaustive: result = Unknown
-  of cnkRepeatStmt:
-    result = allPathsAsgnResult(n[0])
-    # a 'repeat' loop is always executed at least once
-    if result == InitSkippable: result = Unknown
-  of cnkAtoms - {cnkLocal, cnkReturnStmt}:
-    result = Unknown
-  of cnkLocal:
-    # some path reads from 'result' before it was written to!
-    if n.local == resultId: result = InitRequired
-  of cnkTryStmt:
-    # We need to watch out for the following problem:
-    # try:
-    #   result = stuffThatRaises()
-    # except:
-    #   discard "result was not set"
-    #
-    # So ... even if the assignment to 'result' is the very first
-    # assignment this is not good enough! The only pattern we allow for
-    # is 'finally: result = x'
-    result = InitSkippable
-    allPathsInBranch(n[0])
-    for i in 1..<n.len:
-      if n[i].kind == cnkFinally:
-        result = allPathsAsgnResult(n[i].lastSon)
-      else:
-        allPathsInBranch(n[i].lastSon)
-  of cnkWithOperand:
-    allPathsInBranch(n.operand)
-  else:
-    for it in n.items:
-      allPathsInBranch(it)
-
 proc isNoReturn(m: BModule; s: PSym): bool {.inline.} =
   sfNoReturn in s.flags and m.config.exc != excGoto
 
@@ -864,22 +753,9 @@ proc startProc*(m: BModule, id: ProcedureId; procBody: sink Body): BProc =
     if not isInvalidReturnType(m.config, prc.typ[0]):
       # declare the result symbol:
       assignLocalVar(p, resNode)
-      if sfNoInit notin prc.flags:
-        initLocalVar(p, res, immediateAsgn=false)
     else:
       p.locals[res] = initResultParamLoc(p.config, resNode)
       scopeMangledParam(p, p.body[res].name)
-      # We simplify 'unsureAsgn(result, nil); unsureAsgn(result, x)'
-      # to 'unsureAsgn(result, x)'
-      # Sketch why this is correct: If 'result' points to a stack location
-      # the 'unsureAsgn' is a nop. If it points to a global variable the
-      # global is either 'nil' or points to valid memory and so the RC operation
-      # succeeds without touching not-initialized memory.
-      if sfNoInit in prc.flags: discard
-      elif p.body.code != nil and
-           allPathsAsgnResult(p.body.code) == InitSkippable: discard
-      else:
-        resetLoc(p, p.locals[res])
       if skipTypes(resNode.typ, abstractInst).kind == tyArray:
         #incl(res.locFlags, lfIndirect)
         p.locals[res].storage = OnUnknown
diff --git a/compiler/mir/mirconstr.nim b/compiler/mir/mirconstr.nim
index 32500e74733..120515f6cdb 100644
--- a/compiler/mir/mirconstr.nim
+++ b/compiler/mir/mirconstr.nim
@@ -91,6 +91,9 @@ func toValue*(id: GlobalId, typ: PType): Value =
 func toValue*(id: ProcedureId, typ: PType): Value =
   Value(node: MirNode(kind: mnkProc, typ: typ, prc: id))
 
+func toValue*(kind: range[mnkParam..mnkLocal], sym: PSym): Value =
+  Value(node: MirNode(kind: kind, typ: sym.typ, sym: sym))
+
 # --------- MirBuffer interface ----------
 
 func len*(b: MirBuffer): int {.inline.} =
diff --git a/compiler/mir/mirpasses.nim b/compiler/mir/mirpasses.nim
index 02c01e6e805..c8ba345245a 100644
--- a/compiler/mir/mirpasses.nim
+++ b/compiler/mir/mirpasses.nim
@@ -11,6 +11,7 @@ import
     types
   ],
   compiler/mir/[
+    analysis,
     datatables,
     mirbodies,
     mirenv,
@@ -371,6 +372,59 @@ proc extractStringLiterals(tree: MirTree, env: var MirEnv,
       changes.replaceMulti(tree, i, bu):
         bu.use toValue(c, tree[i].typ)
 
+proc injectResultInit(tree: MirTree, resultVar: PSym, changes: var Changeset) =
+  ## Injects a default-initialization for the result variable, if deemed
+  ## necessary by data-flow analysis.
+  ##
+  ## For targets that don't default-initialize locals automatically,
+  ## default-initialization is necessary for the result variable if:
+  ## * it is partially modified, read from, or otherwise used without having
+  ##   been fully assigned first
+  ## * a procedure exit is reached and the variable is not definitely
+  ##   initialized
+  # future direction: once possible, extend this pass to apply to all local
+  # variables
+  func isResult(tree: MirTree, n: OpValue): bool =
+    tree[n].kind == mnkLocal and tree[n].sym.kind == skResult
+
+  func requiresInit(tree: MirTree): bool =
+    let
+      dfg = computeDfg(tree)
+      all = dfg.subgraphFor(NodePosition(0) .. NodePosition(tree.len))
+    var s: TraverseState
+
+    for op, n in traverse(dfg, all, 0, s):
+      case op
+      of opDef, opKill:
+        if isResult(tree, skipConversions(tree, n)):
+          # the result variable is fully assigned or reset -> quit the
+          # path
+          s.exit = true
+
+      of opUse, opConsume, opMutate, opInvalidate:
+        if isResult(tree, getRoot(tree, n)):
+          # the result variable is read from or modified before it was
+          # initialized
+          return true
+
+      of opMutateGlobal:
+        discard "not relevant"
+
+    # the exit flag indicates that traversal reached the end of the body
+    # (without ``result`` being an initialized). The a > b check makes sure
+    # an empty procedure body also requires initialization of the result
+    # var
+    result = s.exit or all.a > all.b
+
+  if requiresInit(tree):
+    assert tree[0].kind == mnkScope
+    let at = tree.child(NodePosition 0, 0)
+    changes.insert(tree, at, at, bu):
+      bu.subTree mnkInit:
+        bu.use toValue(mnkLocal, resultVar)
+        bu.buildMagicCall mDefault, resultVar.typ:
+          discard
+
 proc applyPasses*(body: var MirBody, prc: PSym, env: var MirEnv,
                   config: ConfigRef, target: TargetBackend) =
   ## Applies all applicable MIR passes to the body (`tree` and `source`) of
@@ -389,6 +443,12 @@ proc applyPasses*(body: var MirBody, prc: PSym, env: var MirEnv,
       preventRvo(body.code, c)
 
   batch:
+    if target == targetC and (prc.kind in routineKinds) and
+       (sfNoInit notin prc.flags) and not prc.typ[0].isEmptyType():
+      # the procedure has a result variable and initialization of it is
+      # allowed
+      injectResultInit(body.code, prc.ast[resultPos].sym, c)
+
     lowerSwap(body.code, c)
     if target == targetVm:
       # only the C and VM targets need the extraction, and only the VM
diff --git a/compiler/sem/mirexec.nim b/compiler/sem/mirexec.nim
index bb0d6bccf45..a1b82a55203 100644
--- a/compiler/sem/mirexec.nim
+++ b/compiler/sem/mirexec.nim
@@ -686,14 +686,17 @@ iterator traverse*(c: DataFlowGraph, span: Subgraph, start: InstrPos,
       of DataFlowOps:
         yield (DataFlowOpcode(instr.op), instr.val)
 
-      inc pc
-
-      if state.exit or pc == start:
+      if state.exit or pc + 1 == start:
         # abort the current path if we either reached the instruction we
         # started at or the path was manually killed
         state.exit = false
         abort()
 
+      # increment *after* the abort handling, otherwise it wouldn't be
+      # possible to detect that the end wasn't reached when an abort is
+      # triggered by the very last instruction
+      inc pc
+
   assert queue.len <= 1
 
   # don't set `exit` to true if nothing was traversed
diff --git a/tests/compiler/tmir_exec2.nim b/tests/compiler/tmir_exec2.nim
new file mode 100644
index 00000000000..39ecf5d7f9b
--- /dev/null
+++ b/tests/compiler/tmir_exec2.nim
@@ -0,0 +1,40 @@
+discard """
+  description: '''
+    Tests for the behaviour of the traversal routines from ``mirexec.nim``
+  '''
+  target: native
+"""
+
+include compiler/sem/mirexec
+
+# setup a very basic graph for testing:
+var graph = DataFlowGraph(instructions:
+  @[Instr(node: NodePosition 0, op: opDef),
+    Instr(node: NodePosition 1, op: opUse)])
+
+block forward_traverse_empty_slice:
+  # ensure that the exit flag is not set to true when no instructions are
+  # traversed
+  let empty = graph.subgraphFor(NodePosition(4)..NodePosition(5))
+  var s = TraverseState()
+  for _ in traverse(graph, empty, empty.a, s):
+    discard
+  doAssert s.exit == false
+
+  # the flag is also set to false if it was set to true externally
+  s.exit = true
+  for _ in traverse(graph, empty, empty.a, s):
+    discard
+  doAssert s.exit == false
+
+block forward_traverse_abort_path_on_last:
+  # aborting the main path on the very last operation of the traversed
+  # subgraph must not lead to the exit flag being set
+  let all = graph.subgraphFor(NodePosition(0)..NodePosition(1))
+  var s = TraverseState()
+  for op, _ in traverse(graph, all, all.a, s):
+    if op == opUse:
+      # abort the path on the last operation of the traversed subgraph
+      s.exit = true
+
+  doAssert s.exit == false

From 8a6a476d89ecdd0d64394728910267a31c5a8dad Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Tue, 27 Feb 2024 20:42:02 +0000
Subject: [PATCH 014/169] build(deps): Bump dawidd6/action-download-artifact
 from 3.1.1 to 3.1.2 (#1210)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bumps
[dawidd6/action-download-artifact](https://github.com/dawidd6/action-download-artifact)
from 3.1.1 to 3.1.2.
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a
href="https://github.com/dawidd6/action-download-artifact/releases">dawidd6/action-download-artifact's
releases</a>.</em></p>
<blockquote>
<h2>v3.1.2</h2>
<h2>What's Changed</h2>
<ul>
<li>Read workflow_search input as a boolean by <a
href="https://github.com/klutchell"><code>@​klutchell</code></a> in <a
href="https://redirect.github.com/dawidd6/action-download-artifact/pull/273">dawidd6/action-download-artifact#273</a></li>
</ul>
<h2>New Contributors</h2>
<ul>
<li><a href="https://github.com/klutchell"><code>@​klutchell</code></a>
made their first contribution in <a
href="https://redirect.github.com/dawidd6/action-download-artifact/pull/273">dawidd6/action-download-artifact#273</a></li>
</ul>
<p><strong>Full Changelog</strong>: <a
href="https://github.com/dawidd6/action-download-artifact/compare/v3.1.1...v3.1.2">https://github.com/dawidd6/action-download-artifact/compare/v3.1.1...v3.1.2</a></p>
</blockquote>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a
href="https://github.com/dawidd6/action-download-artifact/commit/71072fbb1229e1317f1a8de6b04206afb461bd67"><code>71072fb</code></a>
Read workflow_search input as a boolean (<a
href="https://redirect.github.com/dawidd6/action-download-artifact/issues/273">#273</a>)</li>
<li>See full diff in <a
href="https://github.com/dawidd6/action-download-artifact/compare/v3.1.1...v3.1.2">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility
score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=dawidd6/action-download-artifact&package-manager=github_actions&previous-version=3.1.1&new-version=3.1.2)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase`.

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 .github/workflows/publisher.yml | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/.github/workflows/publisher.yml b/.github/workflows/publisher.yml
index 9bc6c6939ed..28b483edd74 100644
--- a/.github/workflows/publisher.yml
+++ b/.github/workflows/publisher.yml
@@ -30,7 +30,7 @@ jobs:
 
       # Download the latest instance of artifacts from a build done previously
       - name: Download generated docs
-        uses: dawidd6/action-download-artifact@v3.1.1
+        uses: dawidd6/action-download-artifact@v3.1.2
         with:
           workflow: ci.yml
           workflow_conclusion: success
@@ -40,7 +40,7 @@ jobs:
           path: doc/html
 
       - name: Download generated source archive
-        uses: dawidd6/action-download-artifact@v3.1.1
+        uses: dawidd6/action-download-artifact@v3.1.2
         with:
           workflow: ci.yml
           workflow_conclusion: success
@@ -50,7 +50,7 @@ jobs:
           path: release-staging
 
       - name: Download generated release binaries
-        uses: dawidd6/action-download-artifact@v3.1.1
+        uses: dawidd6/action-download-artifact@v3.1.2
         with:
           workflow: ci.yml
           workflow_conclusion: success
@@ -61,7 +61,7 @@ jobs:
           path: release-staging
 
       - name: Download release manifest tool
-        uses: dawidd6/action-download-artifact@v3.1.1
+        uses: dawidd6/action-download-artifact@v3.1.2
         with:
           workflow: ci.yml
           workflow_conclusion: success

From 8b68b0d610b28ea47204ed0ca4fe9d1fcc19dad8 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Wed, 28 Feb 2024 22:08:17 +0100
Subject: [PATCH 015/169] make `.computedGoto` pragma a no-op (#1212)

## Summary

The `.computedGoto` pragma is now a no-op pragma usable in pragma
statements everywhere. It's seldom useful, and since the current
implementation complicates the rework of the C code generator,
dedicated C code generator support is removed for now.

## Details

* remove the `.computedGoto` implementation from `cgen`
* remove `compat.flattenStmts`, `ccgutils.stmtsContainsPragma`, and
  `ccgutils.getPragmaStmt`; they were only used by the `.computedGoto`
  implementation
* as a consequence, `cnkPragmaStmt` is no longer used; the node kind is
  removed too
* without `cnkPragmaStmt`, `mnkPNode` is also obsolete; it's removed
  too
* remove the now-unused report kinds associated with the
  `.computedGoto` pragma
---
 compiler/ast/report_enums.nim                 |  5 -
 compiler/backend/ccgexprs.nim                 |  1 -
 compiler/backend/ccgstmts.nim                 | 96 +------------------
 compiler/backend/ccgutils.nim                 | 15 ---
 compiler/backend/cgir.nim                     |  7 +-
 compiler/backend/cgirgen.nim                  | 16 ----
 compiler/backend/cgirutils.nim                |  3 -
 compiler/backend/compat.nim                   | 15 ---
 compiler/backend/jsgen.nim                    |  1 -
 compiler/front/cli_reporter.nim               | 15 ---
 compiler/mir/mirgen.nim                       |  9 --
 compiler/mir/mirtrees.nim                     | 12 +--
 compiler/mir/utils.nim                        |  6 --
 compiler/vm/vmgen.nim                         |  2 +-
 doc/manual.rst                                | 43 +--------
 .../tcase_computedgoto_holed_enum.nim         | 23 -----
 16 files changed, 8 insertions(+), 261 deletions(-)
 delete mode 100644 tests/lang_stmts/casestmt/tcase_computedgoto_holed_enum.nim

diff --git a/compiler/ast/report_enums.nim b/compiler/ast/report_enums.nim
index 2e893630aec..78a92bcdfd0 100644
--- a/compiler/ast/report_enums.nim
+++ b/compiler/ast/report_enums.nim
@@ -628,11 +628,6 @@ type
     # Codegen
     rsemRttiRequestForIncompleteObject
     rsemExpectedNimcallProc
-    rsemExpectedExhaustiveCaseForComputedGoto
-    rsemExpectedUnholyEnumForComputedGoto
-    rsemTooManyEntriesForComputedGoto
-    rsemExpectedLow0ForComputedGoto
-    rsemExpectedCaseForComputedGoto
     rsemDisallowedRangeForComputedGoto
     rsemExpectedParameterForJsPattern
     rsemExpectedLiteralForGoto
diff --git a/compiler/backend/ccgexprs.nim b/compiler/backend/ccgexprs.nim
index 628bc3b1262..24acfe516de 100644
--- a/compiler/backend/ccgexprs.nim
+++ b/compiler/backend/ccgexprs.nim
@@ -2129,7 +2129,6 @@ proc expr(p: BProc, n: CgNode, d: var TLoc) =
     assert p.config.exc == excGoto
     genTryGoto(p, n)
   of cnkRaiseStmt: genRaiseStmt(p, n)
-  of cnkPragmaStmt: discard
   of cnkInvalid, cnkType, cnkAstLit, cnkMagic, cnkRange, cnkBinding, cnkExcept,
      cnkFinally, cnkBranch, cnkLabel, cnkStmtListExpr, cnkField:
     internalError(p.config, n.info, "expr(" & $n.kind & "); unknown node kind")
diff --git a/compiler/backend/ccgstmts.nim b/compiler/backend/ccgstmts.nim
index 97ad08400ee..c418c427ce7 100644
--- a/compiler/backend/ccgstmts.nim
+++ b/compiler/backend/ccgstmts.nim
@@ -189,97 +189,6 @@ proc genGotoForCase(p: BProc; caseStmt: CgNode) =
     genStmts(p, it.lastSon)
     endBlock(p)
 
-proc genAsgn(p: BProc, e: CgNode)
-
-proc genComputedGoto(p: BProc; n: CgNode) =
-  # first pass: Generate array of computed labels:
-
-  # flatten the loop body because otherwise let and var sections
-  # wrapped inside stmt lists by inject destructors won't be recognised
-  # XXX: ^^ this doesn't work as intended (see the comment in
-  #      ``flattenStmts``)
-  let n = n.flattenStmts()
-  var casePos = -1
-  var arraySize: int
-  for i in 0..<n.len:
-    let it = n[i]
-    if it.kind == cnkCaseStmt:
-      # XXX: move the checks into the semantic analysis phase
-      if not isOfBranch(it[^1]):
-        localReport(p.config, it.info, reportSem rsemExpectedExhaustiveCaseForComputedGoto)
-        return
-
-      casePos = i
-      if enumHasHoles(it[0].typ):
-        localReport(p.config, it.info, reportSem rsemExpectedUnholyEnumForComputedGoto)
-        return
-
-      let aSize = lengthOrd(p.config, it[0].typ)
-      if aSize > 10_000:
-        localReport(p.config, it.info, reportSem rsemTooManyEntriesForComputedGoto)
-        return
-
-      arraySize = toInt(aSize)
-      if firstOrd(p.config, it[0].typ) != 0:
-        localReport(p.config, it.info, reportSem rsemExpectedLow0ForComputedGoto)
-        return
-
-  if casePos < 0:
-    localReport(p.config, n.info, reportSem rsemExpectedCaseForComputedGoto)
-    return
-
-  var id = p.labels+1
-  inc p.labels, arraySize+1
-  let tmp = "TMP$1_" % [id.rope]
-  var gotoArray = "static void* $#[$#] = {" % [tmp, arraySize.rope]
-  for i in 1..arraySize-1:
-    gotoArray.addf("&&TMP$#_, ", [rope(id+i)])
-  gotoArray.addf("&&TMP$#_};$n", [rope(id+arraySize)])
-  line(p, cpsLocals, gotoArray)
-
-  for j in 0..<casePos:
-    genStmts(p, n[j])
-
-  let caseStmt = n[casePos]
-  var a: TLoc
-  initLocExpr(p, caseStmt[0], a)
-  # first goto:
-  lineF(p, cpsStmts, "goto *$#[$#];$n", [tmp, a.rdLoc])
-
-  for i in 1..<caseStmt.len:
-    startBlock(p)
-    let it = caseStmt[i]
-    for j in 0..<it.len-1:
-      if it[j].kind == cnkRange:
-        localReport(p.config, it.info, reportSem rsemDisallowedRangeForComputedGoto)
-        return
-
-      let val = getOrdValue(it[j])
-      lineF(p, cpsStmts, "TMP$#_:$n", [intLiteral(toInt64(val)+id+1)])
-
-    genStmts(p, it.lastSon)
-
-    for j in casePos+1..<n.len:
-      genStmts(p, n[j])
-
-    for j in 0..<casePos:
-      # prevent new local declarations
-      # compile declarations as assignments
-      let it = n[j]
-      if it.kind == cnkDef:
-        genAsgn(p, it)
-      else:
-        genStmts(p, it)
-
-    var a: TLoc
-    initLocExpr(p, caseStmt[0], a)
-    lineF(p, cpsStmts, "goto *$#[$#];$n", [tmp, a.rdLoc])
-    endBlock(p)
-
-  for j in casePos+1..<n.len:
-    genStmts(p, n[j])
-
-
 proc genRepeatStmt(p: BProc, t: CgNode) =
   # we don't generate labels here as for example GCC would produce
   # significantly worse code
@@ -288,10 +197,7 @@ proc genRepeatStmt(p: BProc, t: CgNode) =
 
   if true:
     var loopBody = t[0]
-    if loopBody.stmtsContainPragma(wComputedGoto) and
-       hasComputedGoto in CC[p.config.cCompiler].props:
-      genComputedGoto(p, loopBody)
-    else:
+    if true:
       startBlock(p, "while (1) {$n")
       genStmts(p, loopBody)
 
diff --git a/compiler/backend/ccgutils.nim b/compiler/backend/ccgutils.nim
index 99e3adc7e41..a00f4316543 100644
--- a/compiler/backend/ccgutils.nim
+++ b/compiler/backend/ccgutils.nim
@@ -14,7 +14,6 @@ import
     hashes, strutils
   ],
   compiler/ast/[
-    wordrecg,
     ast,
     types
   ],
@@ -28,22 +27,8 @@ import
   ],
   compiler/backend/[
     cgendata,
-    cgir
   ]
 
-proc getPragmaStmt*(n: CgNode, w: TSpecialWord): CgNode =
-  case n.kind
-  of cnkStmtList:
-    for i in 0..<n.len:
-      result = getPragmaStmt(n[i], w)
-      if result != nil: break
-  of cnkPragmaStmt:
-    if n.pragma == w: return n
-  else: discard
-
-proc stmtsContainPragma*(n: CgNode, w: TSpecialWord): bool =
-  result = getPragmaStmt(n, w) != nil
-
 proc hashString*(conf: ConfigRef; s: string): BiggestInt =
   # has to be the same algorithm as strmantle.hashString!
   if CPU[conf.target.targetCPU].bit == 64:
diff --git a/compiler/backend/cgir.nim b/compiler/backend/cgir.nim
index 877c9df9ac2..912a3ae19f4 100644
--- a/compiler/backend/cgir.nim
+++ b/compiler/backend/cgir.nim
@@ -9,8 +9,7 @@ import
   ],
   compiler/ast/[
     ast_types,
-    lineinfos,
-    wordrecg
+    lineinfos
   ],
   compiler/mir/[
     mirtrees
@@ -109,7 +108,6 @@ type
     # expression or not
 
     cnkVoidStmt   ## discard the operand value (i.e., do nothing with it)
-    cnkPragmaStmt ## a single compiler directive
     cnkEmitStmt   ## an ``emit`` statement
     cnkAsmStmt    ## an ``asm`` statement
 
@@ -149,7 +147,7 @@ const
   cnkWithOperand*  = {cnkConv, cnkHiddenConv, cnkDeref, cnkAddr, cnkHiddenAddr,
                       cnkDerefView, cnkObjDownConv, cnkObjUpConv, cnkCast,
                       cnkLvalueConv}
-  cnkAtoms*        = {cnkInvalid..cnkMagic, cnkReturnStmt, cnkPragmaStmt}
+  cnkAtoms*        = {cnkInvalid..cnkMagic, cnkReturnStmt}
     ## node kinds that denote leafs
   cnkWithItems*    = AllKinds - cnkWithOperand - cnkAtoms
     ## node kinds for which the ``items`` iterator is available
@@ -200,7 +198,6 @@ type
     of cnkMagic:      magic*: TMagic
     of cnkLabel:      label*: BlockId
     of cnkLocal:      local*: LocalId
-    of cnkPragmaStmt: pragma*: TSpecialWord
     of cnkWithOperand: operand*: CgNode
     of cnkWithItems:
       kids*: seq[CgNode]
diff --git a/compiler/backend/cgirgen.nim b/compiler/backend/cgirgen.nim
index 18c3f8ad58b..baa1a3b7de5 100644
--- a/compiler/backend/cgirgen.nim
+++ b/compiler/backend/cgirgen.nim
@@ -42,7 +42,6 @@ import
   ]
 
 from compiler/ast/ast import newSym, newType, rawAddSon
-from compiler/ast/idents import whichKeyword
 from compiler/sem/semdata import makeVarType
 
 type
@@ -608,19 +607,6 @@ proc defToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
   else:
     unreachable()
 
-proc translateNode(n: PNode): CgNode =
-  ## Translates the content of a ``mnkPNode`` node to a ``CgNode``.
-  case n.kind
-  of nkPragma:
-    # XXX: consider adding a dedicated ``mnkPragma`` MIR node
-    # only simple pragmas reach here
-    assert n.len == 1
-    assert n[0].kind == nkIdent
-    CgNode(kind: cnkPragmaStmt, info: n.info, pragma: whichKeyword(n[0].ident))
-  else:
-    # cannot reach here
-    unreachable(n.kind)
-
 proc bodyToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
               cr: var TreeCursor): CgNode =
   ## Generates the ``CgNode`` tree for the body of a construct that implies
@@ -709,8 +695,6 @@ proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
     newStmt(cnkBreakStmt, info, [newLabelNode(BlockId idx, info)])
   of mnkReturn:
     newNode(cnkReturnStmt, info)
-  of mnkPNode:
-    translateNode(n.node)
   of mnkVoid:
     var res = exprToIr(tree, cl, cr)
     if res.typ.isEmptyType():
diff --git a/compiler/backend/cgirutils.nim b/compiler/backend/cgirutils.nim
index 335a20bcfa2..f68f8fbd214 100644
--- a/compiler/backend/cgirutils.nim
+++ b/compiler/backend/cgirutils.nim
@@ -36,9 +36,6 @@ proc treeRepr*(n: CgNode): string =
       result.add "strVal: \""
       result.add n.strVal
       result.add "\""
-    of cnkPragmaStmt:
-      result.add "pragma: "
-      result.add $n.pragma
     of cnkField:
       result.add "field: "
       result.add n.field.name.s
diff --git a/compiler/backend/compat.nim b/compiler/backend/compat.nim
index 0da17d3d620..a0db57b1383 100644
--- a/compiler/backend/compat.nim
+++ b/compiler/backend/compat.nim
@@ -124,21 +124,6 @@ proc toBitSet*(conf: ConfigRef; s: CgNode): TBitSet =
     else:
       bitSetIncl(result, toInt64(getOrdValue(it) - first))
 
-proc flattenStmts*(n: CgNode): CgNode =
-  ## Duplicate of `flattenStmts <trees.html#flattenStmts,PNode>`_
-  proc unnestStmts(n: CgNode, result: var CgNode) =
-    case n.kind
-    of cnkStmtList:
-      for it in n.items:
-        unnestStmts(it, result)
-    else:
-      result.kids.add n
-
-  result = CgNode(kind: cnkStmtList)
-  unnestStmts(n, result)
-  if result.len == 1:
-    result = result[0]
-
 proc newSymNode*(env: MirEnv, s: PSym): CgNode {.inline.} =
   case s.kind
   of skConst:
diff --git a/compiler/backend/jsgen.nim b/compiler/backend/jsgen.nim
index cfd859f9567..58e66953a1a 100644
--- a/compiler/backend/jsgen.nim
+++ b/compiler/backend/jsgen.nim
@@ -2446,7 +2446,6 @@ proc gen(p: PProc, n: CgNode, r: var TCompRes) =
   of cnkAsmStmt, cnkEmitStmt: genAsmOrEmitStmt(p, n)
   of cnkTryStmt: genTry(p, n)
   of cnkRaiseStmt: genRaiseStmt(p, n)
-  of cnkPragmaStmt: discard
   of cnkInvalid, cnkMagic, cnkRange, cnkBinding, cnkExcept, cnkFinally,
      cnkBranch, cnkAstLit, cnkLabel, cnkStmtListExpr, cnkField:
     internalError(p.config, n.info, "gen: unknown node type: " & $n.kind)
diff --git a/compiler/front/cli_reporter.nim b/compiler/front/cli_reporter.nim
index 1ca21286a25..cf89556fe88 100644
--- a/compiler/front/cli_reporter.nim
+++ b/compiler/front/cli_reporter.nim
@@ -1993,21 +1993,6 @@ proc reportBody*(conf: ConfigRef, r: SemReport): string =
     of rsemDisallowedRangeForComputedGoto:
       result = "range notation not available for computed goto"
 
-    of rsemExpectedCaseForComputedGoto:
-      result = "no case statement found for computed goto"
-
-    of rsemExpectedLow0ForComputedGoto:
-      result = "case statement has to start at 0 for computed goto"
-
-    of rsemTooManyEntriesForComputedGoto:
-      result = "case statement has too many cases for computed goto"
-
-    of rsemExpectedUnholyEnumForComputedGoto:
-      result = "case statement cannot work on enums with holes for computed goto"
-
-    of rsemExpectedExhaustiveCaseForComputedGoto:
-      result = "case statement must be exhaustive for computed goto"
-
     of rsemExpectedNimcallProc:
       result = r.symstr & " needs to have the 'nimcall' calling convention"
 
diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index 3a1666de2e4..b599a46b798 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -1963,15 +1963,6 @@ proc gen(c: var TCtx, n: PNode) =
       of wEmit:
         c.builder.useSource(c.sp, it)
         genAsmOrEmitStmt(c, mnkEmit, it[1])
-      of wComputedGoto:
-        # the MIR doesn't handle this directive, but the code generators
-        # might. As such, we need to keep it via a ``mnkPNode``. Since the
-        # directive might be combined with some other directive in a
-        # single statement, we split it out into a standalone pragma statement
-        # first
-        # XXX: ideally, sem or transf would split pragma statement up
-        c.builder.useSource(c.sp, it)
-        c.add MirNode(kind: mnkPNode, node: newTree(nkPragma, [it]))
       else:     discard
 
   of nkAsmStmt:
diff --git a/compiler/mir/mirtrees.nim b/compiler/mir/mirtrees.nim
index 85578bf341f..5db9af07b8a 100644
--- a/compiler/mir/mirtrees.nim
+++ b/compiler/mir/mirtrees.nim
@@ -252,12 +252,6 @@ type
     # structural changes, as not all node kinds are able to use the length
     # field at the moment
 
-    mnkPNode ## depending on the context, either statement or something else.
-             ## If it appears as a statement, it is expected to not have any
-             ## obsersvable effects
-             ## XXX: eventually, everything that currently requires
-             ##      ``mnkPNode`` should be expressable directly in the IR
-
   EffectKind* = enum
     ekMutate    ## the value in the location is mutated
     ekReassign  ## a new value is assigned to the location
@@ -301,8 +295,6 @@ type
                       ## for a break, the label of the block to break out of
     of mnkEnd:
       start*: MirNodeKind ## the kind of the corresponding start node
-    of mnkPNode:
-      node*: PNode
     of mnkTag:
       effect*: EffectKind ## the effect that happens when the operator the
                           ## tagged value is passed to is executed
@@ -331,7 +323,7 @@ const
     ## Node kinds that represent definition statements (i.e. something that
     ## introduces a named entity)
 
-  AtomNodes* = {mnkNone..mnkType, mnkMagic, mnkBreak, mnkReturn, mnkPNode}
+  AtomNodes* = {mnkNone..mnkType, mnkMagic, mnkBreak, mnkReturn}
     ## Nodes that don't support sub nodes.
 
   SubTreeNodes* = AllNodeKinds - AtomNodes - {mnkEnd}
@@ -365,7 +357,7 @@ const
     ## Nodes that may be appear in atom-expecting slots.
 
   StmtNodes* = {mnkScope, mnkStmtList, mnkIf, mnkCase, mnkRepeat, mnkTry,
-                mnkBlock, mnkBreak, mnkReturn, mnkRaise, mnkPNode, mnkInit,
+                mnkBlock, mnkBreak, mnkReturn, mnkRaise, mnkInit,
                 mnkAsgn, mnkSwitch, mnkVoid, mnkRaise, mnkDestroy, mnkEmit,
                 mnkAsm} + DefNodes
 
diff --git a/compiler/mir/utils.nim b/compiler/mir/utils.nim
index 735978b6b1a..b408c47c9b3 100644
--- a/compiler/mir/utils.nim
+++ b/compiler/mir/utils.nim
@@ -59,9 +59,6 @@ func `$`(n: MirNode): string =
   of mnkEnd:
     result.add " start: "
     result.add $n.start
-  of mnkPNode:
-    result.add " node: "
-    result.add $n.node.kind
   of mnkTag:
     result.add " effect: "
     result.add $n.effect
@@ -496,9 +493,6 @@ proc stmtToStr(nodes: MirTree, i: var int, indent: int, result: var string,
     tree "destroy ":
       valueToStr()
       result.add "\n"
-  of mnkPNode:
-    result.add repeat("  ", indent)
-    result.add "PNode " & $n.node & "\n"
   of mnkBreak:
     result.add repeat("  ", indent)
     result.add "break L" & $n.label.int & "\n"
diff --git a/compiler/vm/vmgen.nim b/compiler/vm/vmgen.nim
index 822c863cd5e..7d99e1cd1f1 100644
--- a/compiler/vm/vmgen.nim
+++ b/compiler/vm/vmgen.nim
@@ -3197,7 +3197,7 @@ proc gen(c: var TCtx; n: CgNode; dest: var TDest) =
       genCastIntFloat(c, n, dest)
   of cnkType:
     genTypeLit(c, n, n.typ, dest)
-  of cnkPragmaStmt, cnkAsmStmt, cnkEmitStmt:
+  of cnkAsmStmt, cnkEmitStmt:
     unused(c, n, dest)
   of cnkInvalid, cnkMagic, cnkRange, cnkExcept, cnkFinally, cnkBranch,
      cnkBinding, cnkLabel, cnkStmtListExpr, cnkField, cnkToSlice:
diff --git a/doc/manual.rst b/doc/manual.rst
index 53af501e4e9..2c0efbada36 100644
--- a/doc/manual.rst
+++ b/doc/manual.rst
@@ -6594,47 +6594,8 @@ If the `line` pragma is used with a parameter, the parameter needs be a
 
 computedGoto pragma
 -------------------
-The `computedGoto` pragma can be used to tell the compiler how to
-compile a Nim `case`:idx: in a `while true` statement.
-Syntactically it has to be used as a statement inside the loop:
-
-.. code-block:: nim
-
-  type
-    MyEnum = enum
-      enumA, enumB, enumC, enumD, enumE
-
-  proc vm() =
-    var instructions: array[0..100, MyEnum]
-    instructions[2] = enumC
-    instructions[3] = enumD
-    instructions[4] = enumA
-    instructions[5] = enumD
-    instructions[6] = enumC
-    instructions[7] = enumA
-    instructions[8] = enumB
-
-    instructions[12] = enumE
-    var pc = 0
-    while true:
-      {.computedGoto.}
-      let instr = instructions[pc]
-      case instr
-      of enumA:
-        echo "yeah A"
-      of enumC, enumD:
-        echo "yeah CD"
-      of enumB:
-        echo "yeah B"
-      of enumE:
-        break
-      inc(pc)
-
-  vm()
-
-As the example shows, `computedGoto` is mostly useful for interpreters. If
-the underlying backend (C compiler) does not support the computed goto
-extension the pragma is simply ignored.
+The `computedGoto` pragma is kept for backwards compatibility. It can be used
+in pragma statements, but has no effect.
 
 
 immediate pragma
diff --git a/tests/lang_stmts/casestmt/tcase_computedgoto_holed_enum.nim b/tests/lang_stmts/casestmt/tcase_computedgoto_holed_enum.nim
deleted file mode 100644
index ee6105b069d..00000000000
--- a/tests/lang_stmts/casestmt/tcase_computedgoto_holed_enum.nim
+++ /dev/null
@@ -1,23 +0,0 @@
-discard """
-  errormsg: "case statement cannot work on enums with holes for computed goto"
-  line: 21
-  description: '''
-    . From ComputedGoto: bad codegen with enum with holes
-    . There are two possible solutions:
-      Raise an error if the enum has holes
-      Complicate the codegen a bit by generating a set[uint16]
-      of the enum coverage and then use it to generate the jump tables.
-    . IMHO, error is the way to go. If you want speed, design your enums properly.
-  '''
-"""
-
-type
-  X = enum
-    A = 0, B = 100
-
-var z = A
-while true:
-  {.computedGoto.}
-  case z
-  of A: discard
-  of B: discard
\ No newline at end of file

From dff5aea072c823e27756f8f4bb27e14c27ed2023 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Thu, 29 Feb 2024 02:59:20 +0100
Subject: [PATCH 016/169] fix(mirgen): respect `--panics:on` for overflow
 checks (#1213)

## Summary

Fix overflow checks for binary integer arithmetic being treated as
potentially raising exceptions when panics are enabled (`--panics:on`).
This didn't affect correctness, but some optimizations were inhibited.

## Details

Use `buildDefectMagicCall` for emitting the binary arithmetic operation
in `mirgen`. If panics are enabled, this makes sure a `mnkCall` is
emitted rather than a `mnkCheckedCall`.

Checked calls (i.e., calls that can raise an exception) introduce
unstructured control-flow, which, depending on where the call is
located, can result in the compiler having to place additional
`wasMoved` and/or destructor calls.

An `--expandArc`-based test for making sure that all run-time checks
are correctly treated as not raising an exception is added.
---
 compiler/mir/mirgen.nim                   |  2 +-
 tests/exception/truntime_check_panics.nim | 58 +++++++++++++++++++++++
 2 files changed, 59 insertions(+), 1 deletion(-)
 create mode 100644 tests/exception/truntime_check_panics.nim

diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index b599a46b798..b1498f11023 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -894,7 +894,7 @@ proc genMagic(c: var TCtx, n: PNode; m: TMagic) =
     if optOverflowCheck in c.userOptions:
       const Map = [mAddI: mAddI, mSubI, mMulI, mDivI, mModI,
                    mSucc: mAddI, mPred: mSubI]
-      c.buildCheckedMagicCall Map[m], n.typ:
+      c.buildDefectMagicCall Map[m], n.typ:
         arg n[1]
         arg n[2]
     else:
diff --git a/tests/exception/truntime_check_panics.nim b/tests/exception/truntime_check_panics.nim
new file mode 100644
index 00000000000..d770f2a4c5a
--- /dev/null
+++ b/tests/exception/truntime_check_panics.nim
@@ -0,0 +1,58 @@
+discard """
+  description: '''
+    Ensure that the compiler-inserted run-time checks don't have exceptional
+    exits when panics are enabled.
+  '''
+  targets: native
+  matrix: "--panics:on --hints:off --expandArc:test"
+  action: compile
+  nimout: '''
+--expandArc: test
+scope:
+  def a: array[0..0, int]
+  chckIndex(arg a, arg i)
+  discard a[i]
+  chckBounds(arg a, arg 0, arg i)
+  def _0: openArray[int] = toOpenArray a, 0, i
+  def _1: int = addI(arg i, arg i)
+  def _2: int = unaryMinusI(arg i)
+  def _3: range 0..1(int) = chckRange(arg i, arg 0, arg 1)
+  chckField(arg <D0>, arg o.kind, arg false, arg "field \'x\' is not accessible for type \'Object\' using \'kind = ")
+  discard o.kind.x
+  def _5: bool = isNil(arg r)
+  def _4: bool = not(arg _5)
+  if _4:
+    chckObj(arg r, arg type(Sub:ObjectType))
+  discard r.(Sub)
+  def _6: float = mulF64(arg f, arg f)
+  chckNaN(arg _6)
+
+-- end of expandArc ------------------------'''
+"""
+
+# make sure all run-time checks are enabled
+{.push boundChecks: on, overflowChecks: on, rangeChecks: on, objChecks: on,
+       fieldChecks: on, infChecks: on, nanChecks: on.}
+
+type
+  Sub = ref object of RootObj
+  Object = object
+    case kind: bool
+    of true:
+      x: int
+    else:
+      discard
+
+# export the procedure so that it's not omitted
+proc test(i: int, f: float, o: Object, r: ref RootObj) {.exportc.} =
+  var a: array[1, int]
+  discard a[i]                 # index check
+  discard toOpenArray(a, 0, i) # bound check
+  discard i + i                # overflow check for binary arithmetic
+  discard -i                   # overflow check for unary arithmetic
+  discard range[0..1](i)       # range check
+  discard o.x                  # field check
+  discard Sub(r)               # object check
+  discard f * f                # infinity and nan check
+
+{.pop.}
\ No newline at end of file

From 12f0aa45abab91601f53cc79854a27376c403d0f Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Thu, 29 Feb 2024 23:17:08 +0100
Subject: [PATCH 017/169] internal: implement `--profiler:on` support with MIR
 pass (#1214)

## Summary

Make routine instrumentation with `nimProfile` calls a MIR pass, moving
more logic out of the C code generator and working towards
`--profiler:on` support with all backends. `nimProfile` calls are also
no longer inserted into loops within `.asmNoStackFrame` routines.

## Details

* require a `ModuleGraph` instance for `mirpasses.applyPasses`, so that
  compilerprocs can be looked up
* add the `injectProfilerCalls` MIR pass. It injects `nimProfile` in
  the same way that `cgen` does
* remove injection of `nimProfile` calls from `cgen`
* don't instrument loops within `.asmNoStackFrame` procedures;
  injection of `nimProfile` at procedure entry was already skipped for
  these procedures
* temporarily remove the `optProfiler` option from symbols when in JIT
  mode, so that code generated for compile-time execution is not
  instrumented
* add a test for the `--profiler:on` feature, to make sure it works and
  keeps working
---
 compiler/backend/backends.nim        |  2 +-
 compiler/backend/ccgstmts.nim        |  4 --
 compiler/backend/cgen.nim            |  7 ----
 compiler/mir/mirpasses.nim           | 41 +++++++++++++++++-
 compiler/vm/vmjit.nim                | 18 ++++++--
 tests/compilerfeatures/tprofiler.nim | 63 ++++++++++++++++++++++++++++
 6 files changed, 119 insertions(+), 16 deletions(-)
 create mode 100644 tests/compilerfeatures/tprofiler.nim

diff --git a/compiler/backend/backends.nim b/compiler/backend/backends.nim
index 5fe5bd5fe03..b2cbf3fdf9a 100644
--- a/compiler/backend/backends.nim
+++ b/compiler/backend/backends.nim
@@ -342,7 +342,7 @@ proc process(body: var MirBody, prc: PSym, graph: ModuleGraph,
     of backendNimVm:   targetVm
     of backendInvalid: unreachable()
 
-  applyPasses(body, prc, env, graph.config, target)
+  applyPasses(body, prc, env, graph, target)
 
 proc translate*(id: ProcedureId, body: PNode, graph: ModuleGraph,
                 config: BackendConfig, idgen: IdGenerator,
diff --git a/compiler/backend/ccgstmts.nim b/compiler/backend/ccgstmts.nim
index c418c427ce7..811116a43c1 100644
--- a/compiler/backend/ccgstmts.nim
+++ b/compiler/backend/ccgstmts.nim
@@ -200,10 +200,6 @@ proc genRepeatStmt(p: BProc, t: CgNode) =
     if true:
       startBlock(p, "while (1) {$n")
       genStmts(p, loopBody)
-
-      if optProfiler in p.options:
-        # invoke at loop body exit:
-        linefmt(p, cpsStmts, "#nimProfile();$n", [])
       endBlock(p)
 
   dec(p.withinLoop)
diff --git a/compiler/backend/cgen.nim b/compiler/backend/cgen.nim
index 9556a1f08ef..86e358e5375 100644
--- a/compiler/backend/cgen.nim
+++ b/compiler/backend/cgen.nim
@@ -258,10 +258,6 @@ template appcg(m: BModule, sec: TCFileSection, frmt: FormatStr,
            args: untyped) =
   m.s[sec].add(ropecg(m, frmt, args))
 
-template appcg(p: BProc, sec: TCProcSection, frmt: FormatStr,
-           args: untyped) =
-  p.s(sec).add(ropecg(p.module, frmt, args))
-
 template line(p: BProc, sec: TCProcSection, r: Rope) =
   p.s(sec).add(indentLine(p, r))
 
@@ -824,9 +820,6 @@ proc finishProc*(p: BProc, id: ProcedureId): string =
       generatedProc.add(initFrame(p, procname, quotedFilename(p.config, prc.info)))
     else:
       generatedProc.add(p.s(cpsLocals))
-    if optProfiler in prc.options:
-      # invoke at proc entry for recursion:
-      appcg(p, cpsInit, "\t#nimProfile();$n", [])
     # this pair of {} was added because C++ is stricter with its control flow
     # integrity checks, leaving them in
     if beforeRetNeeded in p.flags: generatedProc.add("{")
diff --git a/compiler/mir/mirpasses.nim b/compiler/mir/mirpasses.nim
index c8ba345245a..a561fda2b4c 100644
--- a/compiler/mir/mirpasses.nim
+++ b/compiler/mir/mirpasses.nim
@@ -8,8 +8,12 @@ import
   compiler/ast/[
     ast_query,
     ast_types,
+    lineinfos,
     types
   ],
+  compiler/front/[
+    in_options
+  ],
   compiler/mir/[
     analysis,
     datatables,
@@ -20,6 +24,10 @@ import
     mirtrees,
     sourcemaps
   ],
+  compiler/modules/[
+    modulegraphs,
+    magicsys
+  ],
   compiler/sem/[
     aliasanalysis,
     mirexec
@@ -425,8 +433,33 @@ proc injectResultInit(tree: MirTree, resultVar: PSym, changes: var Changeset) =
         bu.buildMagicCall mDefault, resultVar.typ:
           discard
 
+proc injectProfilerCalls(tree: MirTree, graph: ModuleGraph, env: var MirEnv,
+                         changes: var Changeset) =
+  ## Instruments the body with calls to the ``nimProfile`` compiler runtime
+  ## procedure. Profiler calls are placed:
+  ## * at the beginning of a procedure's body
+  ## * at the end of a loop's body
+  let
+    voidType = graph.getSysType(unknownLineInfo, tyVoid)
+    prc = graph.getCompilerProc("nimProfile")
+    prcId = env.procedures.add(prc)
+
+  # insert the entry call within the outermost scope:
+  changes.insert(tree, tree.child(NodePosition 0, 0), NodePosition 0, bu):
+    bu.subTree mnkVoid:
+      bu.buildCall prcId, prc.typ, voidType:
+        discard "no arguments"
+
+  for i in search(tree, {mnkEnd}):
+    if tree[i].start == mnkRepeat:
+      # insert the call before the end node:
+      changes.insert(tree, i - 1, i, bu):
+        bu.subTree mnkVoid:
+          bu.buildCall prcId, prc.typ, voidType:
+            discard "no arguments"
+
 proc applyPasses*(body: var MirBody, prc: PSym, env: var MirEnv,
-                  config: ConfigRef, target: TargetBackend) =
+                  graph: ModuleGraph, target: TargetBackend) =
   ## Applies all applicable MIR passes to the body (`tree` and `source`) of
   ## `prc`. `target` is the targeted backend and is used to enable/disable
   ## certain passes. Passes may register new entities with `env`.
@@ -455,6 +488,12 @@ proc applyPasses*(body: var MirBody, prc: PSym, env: var MirEnv,
       # requires the extraction for cstring literals
       extractStringLiterals(body.code, env, c)
 
+  # instrument the body with profiler calls after all lowerings, but before
+  # optimization
+  if (sfPure notin prc.flags) and (optProfiler in prc.options):
+    batch:
+      injectProfilerCalls(body.code, graph, env, c)
+
   # eliminate temporaries after all other passes
   batch:
     eliminateTemporaries(body.code, c)
diff --git a/compiler/vm/vmjit.nim b/compiler/vm/vmjit.nim
index 7f87eea38f1..1b9a96a6e11 100644
--- a/compiler/vm/vmjit.nim
+++ b/compiler/vm/vmjit.nim
@@ -25,6 +25,9 @@ import
     backends,
     cgir
   ],
+  compiler/front/[
+    in_options,
+  ],
   compiler/mir/[
     datatables,
     mirbodies,
@@ -175,6 +178,15 @@ template runCodeGen(c: var TCtx, cg: var CodeGenCtx, b: Body,
   swapState(c, cg)
   r
 
+proc applyPasses(c: var TCtx, env: var MirEnv, prc: PSym, body: var MirBody) =
+  let restore = optProfiler in prc.options
+  # don't instrument procedures when using the JIT
+  if restore:
+    prc.options.excl optProfiler
+  applyPasses(body, prc, env, c.graph, targetVm)
+  if restore:
+    prc.options.incl optProfiler
+
 proc genStmt*(jit: var JitState, c: var TCtx; n: PNode): VmGenResult =
   ## Generates and emits code for the standalone top-level statement `n`.
   preCheck(jit.gen.env, n)
@@ -184,7 +196,7 @@ proc genStmt*(jit: var JitState, c: var TCtx; n: PNode): VmGenResult =
 
   # `n` is expected to have been put through ``transf`` already
   var mirBody = generateMirCode(c, jit.gen.env, n, isStmt = true)
-  applyPasses(mirBody, c.module, jit.gen.env, c.config, targetVm)
+  applyPasses(c, jit.gen.env, c.module, mirBody)
   for _ in discover(jit.gen.env, cp):
     discard "nothing to register"
 
@@ -216,7 +228,7 @@ proc genExpr*(jit: var JitState, c: var TCtx, n: PNode): VmGenResult =
   let cp = checkpoint(jit.gen.env)
 
   var mirBody = generateMirCode(c, jit.gen.env, n)
-  applyPasses(mirBody, c.module, jit.gen.env, c.config, targetVm)
+  applyPasses(c, jit.gen.env, c.module, mirBody)
   for _ in discover(jit.gen.env, cp):
     discard "nothing to register"
 
@@ -255,7 +267,7 @@ proc genProc(jit: var JitState, c: var TCtx, s: PSym): VmGenResult =
   echoInput(c.config, s, body)
   var mirBody = generateCode(c.graph, jit.gen.env, s, selectOptions(c), body)
   echoMir(c.config, s, mirBody)
-  applyPasses(mirBody, s, jit.gen.env, c.config, targetVm)
+  applyPasses(c, jit.gen.env, s, mirBody)
   for _ in discover(jit.gen.env, cp):
     discard "nothing to register"
 
diff --git a/tests/compilerfeatures/tprofiler.nim b/tests/compilerfeatures/tprofiler.nim
new file mode 100644
index 00000000000..88e71fe8f4d
--- /dev/null
+++ b/tests/compilerfeatures/tprofiler.nim
@@ -0,0 +1,63 @@
+discard """
+  description: '''
+    Ensure that the built-in instrumentation with profiler callback calls
+    works
+  '''
+  targets: "c js vm"
+  matrix: "--profiler:on"
+  knownIssue.js vm: '''
+    The `system/profile.nim` module is not available for the targets
+  '''
+"""
+
+var
+  traces: array[3, StackTrace]
+  enabled = true
+  numTraces = 0
+
+# instrumentation needs to be disabled for the callbacks, otherwise there'd be
+# an infinite recursion
+{.push profiler: off.}
+
+proc enabledCallback(): bool =
+  result = enabled
+  # XXX: an issue with the profiler runtime requires disabling the callback
+  #      until the `profileCallback` is done
+  enabled = false
+
+proc profileCallback(st: StackTrace) =
+  traces[numTraces] = st
+  inc numTraces
+  enabled = true # re-enable
+
+{.pop.}
+
+# nothing will happen before the hook is set
+profilerHook = profileCallback
+# the "profiling requested" callback guards whether to invoke the profiler
+# callback
+profilingRequestedHook = enabledCallback
+
+proc test() =
+  # the callback is invoked when a procedure is entered
+  var i = 0
+  while i < 2:
+    inc i
+    # the callback is also invoked at the end of while loop's body
+
+test() # run once
+
+proc testPure() {.asmNoStackFrame.} =
+  # pure routines aren't instrumented
+  var i = 0
+  while i < 2:
+    inc i
+
+# disable the callback so that the traces can be inspected
+enabled = false
+
+# validate the traces:
+doAssert numTraces == 3
+# the end of the list is signaled by a nil cstring
+doAssert traces[0].lines[0..2] == [cstring"test", "tprofiler", nil]
+doAssert traces[0].files[0..2] == [cstring"tprofiler.nim", "tprofiler.nim", nil]
\ No newline at end of file

From fff9caeaeec26a1ae419b0979bd0f7a23147303b Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sun, 3 Mar 2024 20:59:57 +0100
Subject: [PATCH 018/169] make the CGIR goto-based and fix exception-handling
 bugs (#1215)

## Summary

* extend the MIR's design with goto-based control-flow primitives
* implement the new control-flow primitives for the CGIR
* make the C code generator use the new control-flow primitives
* (C backend) fix multiple bugs with `getCurrentException` returning
  the wrong exception
* (C backend) fix exceptions being leaked when aborting a `finally`
  section

### Details

The main goals of replacing the higher-level control-flow primitives in
the MIR with lower-level, goto-based ones are to:
* be able to express more complex control-flow
* make control-flow-related transformations easier and/or possible
* reduce the cost of computing the data-flow graph
* make evolving the language and MIR easier

A guiding principle was that the design should allow for enough freedom
to generate efficient code with all three code generators (which differ
significantly in control-flow-related capabilities).

To be able to implement this incrementally, as a first step, the new
control-flow primitives are only added to the CGIR, with only `cgen`
actually supporting them. So that `jsgen` and `vmgen` continue to work
without change, the legacy primitives are kept, with `cgirgen_legacy`
(a full copy of the original `cgirgen`) continuing to produce the
legacy CGIR.

### MIR

An in-depth description of syntax and behaviour is added to
`docs/mir.rst`. The gist of the design is that:
* terminators of basic-blocks become explicit (an exception being `If`)
* jump targets are directly specified on jump/fork-like operations
  (e.g., `Goto`, `CheckedCall`, etc.)
* intercepted control-flow (via `finally` sections) is also specified
  on jump/fork-like operations
* `finally` sections are *not* required to be duplicated for each
  unique control-flow passing through them
* jump targets and join points are identified by *labels*, which are
  integer IDs unique within a body

As a consequence of this design, there's no more statement-in-statement
nesting.

### CGIR & Translation

The CGIR implements all the new control-flow primitives from the MIR,
with the only difference being that the CGIR's `ContinueStmt` doesn't
track the possible exits of a `Finally` section (it's information
irrelevant to the code generators).

`cgirgen` handles translation of the old-style primitives still used by
the MIR to the new-style ones. While not strictly needed at the moment,
translation of intra-procedure unreachable code is disabled, meaning
that unreachable code is effectively dropped. This is so that `Finally`
sections that never exit normally (e.g., `finally: return`) can be
ensured to work.

### C code generation

The CGIR is first translated into a small, low-level, C-specific IR
(all implemented in `ccgflow`). Here, the focus is on figuring out what
C code to produce for `Finally` sections; unnecessary gotos are also
eliminated.

#### Finally Handling

The previous strategy for `finally` was to:
* emit an error-state considering version of the `finally` at the end
  of the `try`
* duplicate the body of all enclosing `finally`s at `break`s and
  `return`s

Now, only a single version of the `finally` section is ever emitted. If
the `finally` section has more than one possible exit, a run-time
dispatcher is used, like so:
```c
{
  NI32 Target0_;
  L1_1_:
  Target0_ = 0;
  goto L1_;
  L1_2_:
  Target0_ = 1;
  L1_: // never jumped to from the outside
  NI32 oldNimErr0_ = *nimErr_; *nimErr_ = NIM_FALSE; // temporarily disable error mode
  // ... body of the finally ...
  *nimErr_ = oldNimErr0_;
  switch (Target0_) {
  case 0: goto L2_;
  case 1: goto L3_;
  }
}
```

Depending on the context and complexity of the code in-between, an
optimizing C compiler is able to eliminate the dispatcher and
`Target0_` assignment by directly inlining the body at a `goto L1_1_;`.

For the common case of a `Finally` section having two exits - one for
exceptional control-flow, and one for non-exceptional control-flow -,
an `if (NIM_UNLIKELY(*nimErr_)) goto <error_label>; goto <non_error>`
is used instead of a full dispatcher. This mirrors what the exit of a
`finally` section previously looked like.

The idea behind not duplicating `Finally` sections is that it reduces
the amount of C code the compiler has to output. Nonetheless, the IR
from `ccgflow` is flexible enough to use the duplication strategy,
should this be needed again.

#### Exception Handling

Whether control-flow crosses the boundary of a `Finally` or `Except`
section (i.e., leaves it) is encoded in the MIR/CGIR via the `Leave`
item in target lists. `ccgflow` uses this information to make sure that
leaving a `Finally` via unstructured control-flow properly aborts the
active exception (if any) and that leaving an `Except` properly pops
the handler.

#### Other

The IR from `ccgflow` then drives the rest of C code generation. Since
there's no more statement-in-statement nesting, recursion reduces
significantly.

A side-effect of the flatter representation is that fewer C scopes are
used (only `if`, loops, `finally`, and `except` use C scopes), which
seems to harm C compiler optimization.

Support for the legacy control-flow primitives is fully removed.

### Exception Handling Runtime

The runtime part of exception handling for the C target is partially
overhauled. For compatibility with the `csources` compiler, the new
version is guarded behind the `nimskullNewExceptionRt` condsym.

A distinction is now made between an *in-flight* exception and the
*current* exception. Previously, both were treated as being one and the
same.

An exception becomes *in-flight* once it is raised (`raiseException2`),
and stops being in-flight when it is caught (`nimCatchException`).
While in-flight, an exception can be aborted (`nimAbortException`), by
breaking out of an intercepting `finally`. On being caught by a
handler, the exception is associated with the handler and the handler
pushed to the handler stack. When control-flow leaves the handler
(`nimLeaveExcept`), the handler is popped from the stack.

The new runtime fixes the `currentException` not being updated when
breaking out of a `finally` or raising from within an `except` handler.
In addition, an exception caught by a handler can now be raised again
within the handler (e.g., `except CatchableError as e: raise e`)
without reference cycles being introduced.
---
 compiler/backend/backends.nim                 |  10 +-
 compiler/backend/ccgcalls.nim                 |  70 +-
 compiler/backend/ccgexprs.nim                 |  81 +-
 compiler/backend/ccgflow.nim                  | 543 +++++++++++
 compiler/backend/ccgstmts.nim                 | 428 ++++----
 compiler/backend/cgen.nim                     |  35 +-
 compiler/backend/cgendata.nim                 |  21 +-
 compiler/backend/cgir.nim                     |  68 +-
 compiler/backend/cgirgen.nim                  | 448 +++++++--
 compiler/backend/cgirgen_legacy.nim           | 920 ++++++++++++++++++
 compiler/backend/cgirutils.nim                |   3 +-
 compiler/backend/compat.nim                   |   5 +
 compiler/backend/jsbackend.nim                |   7 +-
 compiler/backend/jsgen.nim                    |   2 +-
 compiler/front/condsyms.nim                   |   1 +
 compiler/mir/mirbridge.nim                    |   9 +-
 compiler/vm/vmbackend.nim                     |   4 +-
 compiler/vm/vmgen.nim                         |   3 +-
 compiler/vm/vmjit.nim                         |   4 +-
 doc/mir.rst                                   | 153 ++-
 lib/system/excpt.nim                          | 104 +-
 tests/exception/tfinally6.nim                 |   2 +-
 tests/exception/tleave_except2.nim            |  87 ++
 tests/exception/treraise2.nim                 |  58 ++
 .../tdestruction_in_unreachable.nim           |  35 +
 25 files changed, 2620 insertions(+), 481 deletions(-)
 create mode 100644 compiler/backend/ccgflow.nim
 create mode 100644 compiler/backend/cgirgen_legacy.nim
 create mode 100644 tests/exception/tleave_except2.nim
 create mode 100644 tests/exception/treraise2.nim
 create mode 100644 tests/lang_objects/destructor/tdestruction_in_unreachable.nim

diff --git a/compiler/backend/backends.nim b/compiler/backend/backends.nim
index b2cbf3fdf9a..80b9999af09 100644
--- a/compiler/backend/backends.nim
+++ b/compiler/backend/backends.nim
@@ -15,7 +15,8 @@ import
   compiler/backend/[
     cgmeth,
     cgir,
-    cgirgen
+    cgirgen,
+    cgirgen_legacy
   ],
   compiler/front/[
     msgs,
@@ -370,6 +371,13 @@ proc generateIR*(graph: ModuleGraph, idgen: IdGenerator, env: MirEnv,
   result = cgirgen.generateIR(graph, idgen, env, owner, body)
   echoOutput(graph.config, owner, result)
 
+proc generateIRLegacy*(graph: ModuleGraph, idgen: IdGenerator, env: MirEnv,
+                 owner: PSym, body: sink MirBody): Body =
+  ## Translates the MIR code provided by `code` into legacy ``CgNode`` IR and,
+  ## if enabled, echoes the result.
+  result = cgirgen_legacy.generateIR(graph, idgen, env, owner, body)
+  echoOutput(graph.config, owner, result)
+
 # ------- handling of lifted globals ---------
 
 proc produceFragmentsForGlobals(
diff --git a/compiler/backend/ccgcalls.nim b/compiler/backend/ccgcalls.nim
index 1b164a61efb..a9cdb221b2d 100644
--- a/compiler/backend/ccgcalls.nim
+++ b/compiler/backend/ccgcalls.nim
@@ -35,33 +35,59 @@ proc reportObservableStore(p: BProc; le, ri: CgNode) =
         # cannot analyse the location; assume the worst
         return true
 
-  if le != nil and locationEscapes(p, le, p.nestedTryStmts.len > 0):
+  # XXX: this whole procedure needs to be removed; RVO calls must only be used
+  #      if safe
+  var inTryStmt = false
+  # analyse the target to check whether a local exception handler or finally
+  # is reached
+  case ri[^1].kind
+  of cnkLabel:
+    inTryStmt = true
+  of cnkTargetList:
+    for it in ri[^1].items:
+      if it.kind == cnkLabel:
+        inTryStmt = true
+        break
+  else:
+    discard "no local exception handler or finally is reached"
+
+  if le != nil and locationEscapes(p, le, inTryStmt):
     localReport(p.config, le.info, reportSem rsemObservableStores)
 
-proc isHarmlessStore(p: BProc; canRaise: bool; d: TLoc): bool =
-  if d.k in {locTemp, locNone} or not canRaise:
+proc observableInExcept(n: CgNode): bool =
+  ## Computes whether the call expression `n` has an exceptional exit
+  ## that leads to an exception handler within the current procedure.
+  let target = n[^1]
+  case target.kind
+  of cnkLabel:      true # can only be an exception handler (of finally)
+  of cnkTargetList: target[^1].kind == cnkLabel
+  else:
+    unreachable()
+
+proc isHarmlessStore(p: BProc; ri: CgNode, d: TLoc): bool =
+  if d.k in {locTemp, locNone} or ri.kind != cnkCheckedCall:
     result = true
-  elif d.k == locLocalVar and p.withinTryWithExcept == 0:
+  elif d.k == locLocalVar and not observableInExcept(ri):
     # we cannot observe a store to a local variable if the current proc
     # has no error handler:
     result = true
   else:
     result = false
 
-proc exitCall(p: BProc, callee: CgNode, canRaise: bool) =
+proc exitCall(p: BProc, call: CgNode) =
   ## Emits the exceptional control-flow related post-call logic.
-  if p.config.exc == excGoto:
+  if call.kind == cnkCheckedCall:
     if nimErrorFlagDisabled in p.flags:
-      if callee.kind == cnkProc and sfNoReturn in p.env[callee.prc].flags and
-         canRaiseConservative(p.env, callee):
+      if call[0].kind == cnkProc and sfNoReturn in p.env[call[0].prc].flags and
+         canRaiseConservative(p.env, call[0]):
         # when using goto-exceptions, noreturn doesn't map to "doesn't return"
         # at the C-level. In order to still support dispatching to wrapper
         # procedures around ``raise`` from inside ``.compilerprocs``, we emit
         # an exit after the call
         p.flags.incl beforeRetNeeded
         lineF(p, cpsStmts, "goto BeforeRet_;$n", [])
-    elif canRaise:
-      raiseExit(p)
+    else:
+      raiseExit(p, call[^1])
 
 proc fixupCall(p: BProc, le, ri: CgNode, d: var TLoc,
                callee, params: Rope) =
@@ -86,17 +112,17 @@ proc fixupCall(p: BProc, le, ri: CgNode, d: var TLoc,
         pl.add(addrLoc(p.config, d))
         pl.add(~");$n")
         line(p, cpsStmts, pl)
-        exitCall(p, ri[0], canRaise)
+        exitCall(p, ri)
     else:
       pl.add(~")")
-      if isHarmlessStore(p, canRaise, d):
+      if isHarmlessStore(p, ri, d):
         if d.k == locNone: getTemp(p, typ[0], d)
         assert(d.t != nil)        # generate an assignment to d:
         var list: TLoc
         initLoc(list, locCall, d.lode, OnUnknown)
         list.r = pl
         genAssignment(p, d, list)
-        exitCall(p, ri[0], canRaise)
+        exitCall(p, ri)
       else:
         var tmp: TLoc
         getTemp(p, typ[0], tmp)
@@ -104,12 +130,12 @@ proc fixupCall(p: BProc, le, ri: CgNode, d: var TLoc,
         initLoc(list, locCall, d.lode, OnUnknown)
         list.r = pl
         genAssignment(p, tmp, list)
-        exitCall(p, ri[0], canRaise)
+        exitCall(p, ri)
         genAssignment(p, d, tmp)
   else:
     pl.add(~");$n")
     line(p, cpsStmts, pl)
-    exitCall(p, ri[0], canRaise)
+    exitCall(p, ri)
 
 proc reifiedOpenArray(p: BProc, n: CgNode): bool {.inline.} =
   # all non-parameter openArrays are reified
@@ -197,7 +223,7 @@ proc genArgNoParam(p: BProc, n: CgNode, needsTmp = false): Rope =
   result = rdLoc(a)
 
 proc genParams(p: BProc, ri: CgNode, typ: PType): Rope =
-  for i in 1..<ri.len:
+  for i in 1..<(1 + numArgs(ri)):
     if i < typ.len:
       assert(typ.n[i].kind == nkSym)
       let paramType = typ.n[i]
@@ -251,7 +277,7 @@ proc genClosureCall(p: BProc, le, ri: CgNode, d: var TLoc) =
   let canRaise = ri.kind == cnkCheckedCall
   if typ[0] != nil:
     if isInvalidReturnType(p.config, typ[0]):
-      if ri.len > 1: pl.add(~", ")
+      if numArgs(ri) > 0: pl.add(~", ")
       # the destination is guaranteed to be either a temporary or an lvalue
       # that can be modified in-place
       if true:
@@ -264,8 +290,8 @@ proc genClosureCall(p: BProc, le, ri: CgNode, d: var TLoc) =
           getTemp(p, typ[0], d)
         pl.add(addrLoc(p.config, d))
         genCallPattern()
-        exitCall(p, ri[0], canRaise)
-    elif isHarmlessStore(p, canRaise, d):
+        exitCall(p, ri)
+    elif isHarmlessStore(p, ri, d):
       if d.k == locNone: getTemp(p, typ[0], d)
       assert(d.t != nil)        # generate an assignment to d:
       var list: TLoc
@@ -275,7 +301,7 @@ proc genClosureCall(p: BProc, le, ri: CgNode, d: var TLoc) =
       else:
         list.r = PatProc % [rdLoc(op), pl, pl.addComma, rawProc]
       genAssignment(p, d, list)
-      exitCall(p, ri[0], canRaise)
+      exitCall(p, ri)
     else:
       var tmp: TLoc
       getTemp(p, typ[0], tmp)
@@ -287,11 +313,11 @@ proc genClosureCall(p: BProc, le, ri: CgNode, d: var TLoc) =
       else:
         list.r = PatProc % [rdLoc(op), pl, pl.addComma, rawProc]
       genAssignment(p, tmp, list)
-      exitCall(p, ri[0], canRaise)
+      exitCall(p, ri)
       genAssignment(p, d, tmp)
   else:
     genCallPattern()
-    exitCall(p, ri[0], canRaise)
+    exitCall(p, ri)
 
 proc genAsgnCall(p: BProc, le, ri: CgNode, d: var TLoc) =
   if ri[0].typ.skipTypes({tyGenericInst, tyAlias, tySink}).callConv == ccClosure:
diff --git a/compiler/backend/ccgexprs.nim b/compiler/backend/ccgexprs.nim
index 24acfe516de..1a1aa504c38 100644
--- a/compiler/backend/ccgexprs.nim
+++ b/compiler/backend/ccgexprs.nim
@@ -294,11 +294,11 @@ template binaryArithOverflowRaw(p: BProc, t: PType, a, b: TLoc;
   var result = getTempName(p.module)
   linefmt(p, cpsLocals, "$1 $2;$n", [storage, result])
   lineCg(p, cpsStmts, "if (#$2($3, $4, &$1)) { #raiseOverflow(); $5};$n",
-      [result, cpname, rdCharLoc(a), rdCharLoc(b), raiseInstr(p)])
+      [result, cpname, rdCharLoc(a), rdCharLoc(b), raiseInstr(p, e.exit)])
   if size < p.config.target.intSize or t.kind in {tyRange, tyEnum}:
     linefmt(p, cpsStmts, "if ($1 < $2 || $1 > $3){ #raiseOverflow(); $4}$n",
             [result, intLiteral(firstOrd(p.config, t)), intLiteral(lastOrd(p.config, t)),
-            raiseInstr(p)])
+            raiseInstr(p, e.exit)])
   result
 
 proc binaryArithOverflow(p: BProc, e: CgNode, d: var TLoc, m: TMagic) =
@@ -324,7 +324,7 @@ proc binaryArithOverflow(p: BProc, e: CgNode, d: var TLoc, m: TMagic) =
     # result is only for overflows.
     if m in {mDivI, mModI}:
       linefmt(p, cpsStmts, "if ($1 == 0){ #raiseDivByZero(); $2}$n",
-              [rdLoc(b), raiseInstr(p)])
+              [rdLoc(b), raiseInstr(p, e.exit)])
 
     let res = binaryArithOverflowRaw(p, t, a, b,
       if t.kind == tyInt64: prc64[m] else: prc[m])
@@ -338,7 +338,7 @@ proc unaryArithOverflow(p: BProc, e: CgNode, d: var TLoc, m: TMagic) =
   initLocExpr(p, e[1], a)
   t = skipTypes(e.typ, abstractRange)
   linefmt(p, cpsStmts, "if ($1 == $2){ #raiseOverflow(); $3}$n",
-          [rdLoc(a), intLiteral(firstOrd(p.config, t)), raiseInstr(p)])
+          [rdLoc(a), intLiteral(firstOrd(p.config, t)), raiseInstr(p, e.exit)])
   case m
   of mUnaryMinusI:
     putIntoDest(p, d, e, "((NI$2)-($1))" % [rdLoc(a), rope(getSize(p.config, t) * 8)])
@@ -631,7 +631,7 @@ proc genFieldCheck(p: BProc, e: CgNode) =
 
     discard cgsym(p.module, raiseProc) # make sure the compilerproc is generated
     linefmt(p, cpsStmts, "{ $1($3, $4); $2} $n",
-            [raiseProc, raiseInstr(p), strLit, toStr])
+            [raiseProc, raiseInstr(p, e.exit), strLit, toStr])
 
 proc genUncheckedArrayElem(p: BProc, n, x, y: CgNode, d: var TLoc) =
   var a, b: TLoc
@@ -660,7 +660,7 @@ proc genCStringElem(p: BProc, n, x, y: CgNode, d: var TLoc) =
   putIntoDest(p, d, n,
               ropecg(p.module, "$1[$2]", [rdLoc(a), rdCharLoc(b)]), a.storage)
 
-proc genBoundsCheck(p: BProc; arr, a, b: TLoc) =
+proc genBoundsCheck(p: BProc; arr, a, b: TLoc, exit: CgNode) =
   # types that map to C pointers need to be skipped here too, since no
   # dereference is generated for ``ptr array`` and the like
   let ty = skipTypes(arr.t, abstractVarRange + {tyPtr, tyRef, tyLent})
@@ -670,29 +670,29 @@ proc genBoundsCheck(p: BProc; arr, a, b: TLoc) =
       linefmt(p, cpsStmts,
         "if ($2-$1 != -1 && " &
         "((NU)($1) >= (NU)($3.Field1) || (NU)($2) >= (NU)($3.Field1))){ #raiseIndexError(); $4}$n",
-        [rdLoc(a), rdLoc(b), rdLoc(arr), raiseInstr(p)])
+        [rdLoc(a), rdLoc(b), rdLoc(arr), raiseInstr(p, exit)])
     else:
       linefmt(p, cpsStmts,
         "if ($2-$1 != -1 && " &
         "((NU)($1) >= (NU)($3Len_0) || (NU)($2) >= (NU)($3Len_0))){ #raiseIndexError(); $4}$n",
-        [rdLoc(a), rdLoc(b), rdLoc(arr), raiseInstr(p)])
+        [rdLoc(a), rdLoc(b), rdLoc(arr), raiseInstr(p, exit)])
   of tyArray:
     let first = intLiteral(firstOrd(p.config, ty))
     linefmt(p, cpsStmts,
       "if ($2-$1 != -1 && " &
       "($2-$1 < -1 || $1 < $3 || $1 > $4 || $2 < $3 || $2 > $4)){ #raiseIndexError(); $5}$n",
-      [rdCharLoc(a), rdCharLoc(b), first, intLiteral(lastOrd(p.config, ty)), raiseInstr(p)])
+      [rdCharLoc(a), rdCharLoc(b), first, intLiteral(lastOrd(p.config, ty)), raiseInstr(p, exit)])
   of tySequence, tyString:
     linefmt(p, cpsStmts,
       "if ($2-$1 != -1 && " &
       "((NU)($1) >= (NU)$3 || (NU)($2) >= (NU)$3)){ #raiseIndexError(); $4}$n",
-      [rdLoc(a), rdLoc(b), lenExpr(p, arr), raiseInstr(p)])
+      [rdLoc(a), rdLoc(b), lenExpr(p, arr), raiseInstr(p, exit)])
   of tyUncheckedArray, tyCstring:
     discard "no checks are used"
   else:
     unreachable(ty.kind)
 
-proc genIndexCheck(p: BProc; x: CgNode, arr, idx: TLoc) =
+proc genIndexCheck(p: BProc; x: CgNode, arr, idx: TLoc, exit: CgNode) =
   ## Emits the index check logic + subsequent raise operation. `x` is
   ## the array expression the `arr` loc resulted from from.
   let ty = arr.t.skipTypes(abstractVar + tyUserTypeClasses +
@@ -703,22 +703,22 @@ proc genIndexCheck(p: BProc; x: CgNode, arr, idx: TLoc) =
     if firstOrd(p.config, ty) == 0 and lastOrd(p.config, ty) >= 0:
       linefmt(p, cpsStmts, "if ((NU)($1) > (NU)($2)){ #raiseIndexError2($1, $2); $3}$n",
               [rdCharLoc(idx), intLiteral(lastOrd(p.config, ty)),
-               raiseInstr(p)])
+               raiseInstr(p, exit)])
     else:
       linefmt(p, cpsStmts, "if ($1 < $2 || $1 > $3){ #raiseIndexError3($1, $2, $3); $4}$n",
               [rdCharLoc(idx), first, intLiteral(lastOrd(p.config, ty)),
-               raiseInstr(p)])
+               raiseInstr(p, exit)])
   of tySequence, tyString:
     linefmt(p, cpsStmts,
             "if ((NU)($1) >= (NU)$2){ #raiseIndexError2($1,$2-1); $3}$n",
-            [rdCharLoc(idx), lenExpr(p, arr), raiseInstr(p)])
+            [rdCharLoc(idx), lenExpr(p, arr), raiseInstr(p, exit)])
   of tyOpenArray, tyVarargs:
     if reifiedOpenArray(p, x):
       linefmt(p, cpsStmts, "if ((NU)($1) >= (NU)($2.Field1)){ #raiseIndexError2($1,$2.Field1-1); $3}$n",
-              [rdCharLoc(idx), rdLoc(arr), raiseInstr(p)])
+              [rdCharLoc(idx), rdLoc(arr), raiseInstr(p, exit)])
     else:
       linefmt(p, cpsStmts, "if ((NU)($1) >= (NU)($2Len_0)){ #raiseIndexError2($1,$2Len_0-1); $3}$n",
-              [rdCharLoc(idx), rdLoc(arr), raiseInstr(p)])
+              [rdCharLoc(idx), rdLoc(arr), raiseInstr(p, exit)])
   of tyCstring:
     discard "no bound checks"
   else:
@@ -766,18 +766,19 @@ proc genArrayLikeElem(p: BProc; n: CgNode; d: var TLoc) =
 
 proc genEcho(p: BProc, n: CgNode) =
   ## Generates and emits the code for the magic echo call.
-  if n.len == 1:
+  let argCount = numArgs(n)
+  if argCount == 0:
     linefmt(p, cpsStmts, "#echoBinSafe(NIM_NIL, 0);$n", [])
   else:
     # allocate a temporary array and fill it with the arguments:
     var tmp: TLoc
     getTemp(p, n[1].typ, tmp) # the first argument stores the type to use
-    for i in 2..<n.len:
+    for i in 2..<(1 + argCount):
       var a: TLoc
       initLocExpr(p, n[i], a)
       linefmt(p, cpsStmts, "$1[$2] = $3;$n", [rdLoc(tmp), i-2, rdLoc(a)])
 
-    linefmt(p, cpsStmts, "#echoBinSafe($1, $2);$n", [rdLoc(tmp), n.len-2])
+    linefmt(p, cpsStmts, "#echoBinSafe($1, $2);$n", [rdLoc(tmp), argCount-1])
 
 proc strLoc(p: BProc; d: TLoc): Rope =
   result = byRefLoc(p, d)
@@ -1514,7 +1515,7 @@ proc genRangeChck(p: BProc, n: CgNode, d: var TLoc) =
     if n0t.kind in {tyUInt, tyUInt64}:
       linefmt(p, cpsStmts, "if ($1 > ($6)($3)){ #raiseRangeErrorNoArgs(); $5}$n",
         [rdCharLoc(a), genLiteral(p, n[2], dest), genLiteral(p, n[3], dest),
-        raiser, raiseInstr(p), getTypeDesc(p.module, n0t)])
+        raiser, raiseInstr(p, n.exit), getTypeDesc(p.module, n0t)])
     else:
       let raiser =
         case skipTypes(n.typ, abstractVarRange).kind
@@ -1531,7 +1532,7 @@ proc genRangeChck(p: BProc, n: CgNode, d: var TLoc) =
           ""
       linefmt(p, cpsStmts, "if ($6($1) < $2 || $6($1) > $3){ $4($1, $2, $3); $5}$n",
         [rdCharLoc(a), genLiteral(p, n[2], dest), genLiteral(p, n[3], dest),
-        raiser, raiseInstr(p), boundaryCast])
+        raiser, raiseInstr(p, n.exit), boundaryCast])
   putIntoDest(p, d, n, "(($1) ($2))" %
       [getTypeDesc(p.module, dest), rdCharLoc(a)], a.storage)
 
@@ -1568,7 +1569,8 @@ proc binaryFloatArith(p: BProc, e: CgNode, d: var TLoc, m: TMagic) =
     putIntoDest(p, d, e, ropecg(p.module, "(($4)($2) $1 ($4)($3))",
                               [opr[m], rdLoc(a), rdLoc(b),
                               getSimpleTypeDesc(p.module, e[1].typ)]))
-    linefmt(p, cpsStmts, "if ($1 != 0.0 && $1*0.5 == $1) { #raiseFloatOverflow($1); $2}$n", [rdLoc(d), raiseInstr(p)])
+    linefmt(p, cpsStmts, "if ($1 != 0.0 && $1*0.5 == $1) { #raiseFloatOverflow($1); $2}$n",
+            [rdLoc(d), raiseInstr(p, e.exit)])
 
 proc skipAddr(n: CgNode): CgNode =
   if n.kind == cnkHiddenAddr: n.operand
@@ -1758,18 +1760,18 @@ proc genMagicExpr(p: BProc, e: CgNode, d: var TLoc, op: TMagic) =
     # NOTE: if the value is a signaling NaN, the comparison itself results in
     #       a float-point exception (which might result in a trap)
     linefmt(p, cpsStmts, "if ($1 != $1){ #raiseFloatInvalidOp(); $2}$n",
-            [rdLoc(a), raiseInstr(p)])
+            [rdLoc(a), raiseInstr(p, e.exit)])
   of mChckIndex:
     var arr, a: TLoc
     initLocExpr(p, e[1], arr)
     initLocExpr(p, e[2], a)
-    genIndexCheck(p, e[1], arr, a)
+    genIndexCheck(p, e[1], arr, a, e.exit)
   of mChckBounds:
     var arr, a, b: TLoc
     initLocExpr(p, e[1], arr)
     initLocExpr(p, e[2], a)
     initLocExpr(p, e[3], b)
-    genBoundsCheck(p, arr, a, b)
+    genBoundsCheck(p, arr, a, b, e.exit)
   of mChckField:
     genFieldCheck(p, e)
   of mChckObj:
@@ -1781,7 +1783,7 @@ proc genMagicExpr(p: BProc, e: CgNode, d: var TLoc, op: TMagic) =
     # the nil-check is expected to have taken place already
     linefmt(p, cpsStmts, "if (!#isObj($2, $3)){ #raiseObjectConversionError(); $4}$n",
             [nilCheck, r, genTypeInfo2Name(p.module, e[2].typ),
-             raiseInstr(p)])
+             raiseInstr(p, e.exit)])
   of mSamePayload:
     var a, b: TLoc
     initLocExpr(p, e[1], a)
@@ -1899,10 +1901,6 @@ proc genArrayConstr(p: BProc, n: CgNode, d: var TLoc) =
       arr.r = "$1[$2]" % [rdLoc(d), intLiteral(i)]
       expr(p, n[i], arr)
 
-proc genStmtList(p: BProc, n: CgNode) =
-  for i in 0..<n.len:
-    genStmts(p, n[i])
-
 proc downConv(p: BProc, n: CgNode, d: var TLoc) =
   ## Generates and emits the code for the ``cnkObjDownConv`` (conversion to
   ## sub-type) expression `n`.
@@ -2104,18 +2102,19 @@ proc expr(p: BProc, n: CgNode, d: var TLoc) =
       genTupleElem(p, n, d)
   of cnkDeref, cnkDerefView: genDeref(p, n, d)
   of cnkFieldAccess: genRecordField(p, n, d)
-  of cnkBlockStmt: genBlock(p, n)
-  of cnkStmtList: genStmtList(p, n)
   of cnkIfStmt: genIf(p, n)
   of cnkObjDownConv: downConv(p, n, d)
   of cnkObjUpConv: upConv(p, n, d)
   of cnkClosureConstr: genClosure(p, n, d)
   of cnkEmpty: discard
-  of cnkRepeatStmt: genRepeatStmt(p, n)
+  of cnkLoopJoinStmt:
+    startBlock(p, "while (1) {$n")
+  of cnkFinally:
+    startBlock(p)
+  of cnkEnd, cnkContinueStmt, cnkLoopStmt:
+    endBlock(p)
   of cnkDef: genSingleVar(p, n[0], n[1])
   of cnkCaseStmt: genCase(p, n)
-  of cnkReturnStmt: genReturnStmt(p, n)
-  of cnkBreakStmt: genBreakStmt(p, n)
   of cnkAsgn, cnkFastAsgn:
     genAsgn(p, n)
   of cnkVoidStmt:
@@ -2125,12 +2124,14 @@ proc expr(p: BProc, n: CgNode, d: var TLoc) =
     line(p, cpsStmts, "(void)(" & a.r & ");\L")
   of cnkAsmStmt: genAsmStmt(p, n)
   of cnkEmitStmt: genEmit(p, n)
-  of cnkTryStmt:
-    assert p.config.exc == excGoto
-    genTryGoto(p, n)
+  of cnkExcept:
+    genExcept(p, n)
   of cnkRaiseStmt: genRaiseStmt(p, n)
-  of cnkInvalid, cnkType, cnkAstLit, cnkMagic, cnkRange, cnkBinding, cnkExcept,
-     cnkFinally, cnkBranch, cnkLabel, cnkStmtListExpr, cnkField:
+  of cnkJoinStmt, cnkGotoStmt:
+    unreachable("handled separately")
+  of cnkInvalid, cnkType, cnkAstLit, cnkMagic, cnkRange, cnkBinding, cnkBranch,
+     cnkLabel, cnkTargetList, cnkStmtListExpr, cnkField, cnkStmtList,
+     cnkLeave, cnkResume, cnkLegacyNodes:
     internalError(p.config, n.info, "expr(" & $n.kind & "); unknown node kind")
 
 proc getDefaultValue(p: BProc; typ: PType; info: TLineInfo): Rope =
diff --git a/compiler/backend/ccgflow.nim b/compiler/backend/ccgflow.nim
new file mode 100644
index 00000000000..8c54e85efe5
--- /dev/null
+++ b/compiler/backend/ccgflow.nim
@@ -0,0 +1,543 @@
+## Implements the translation of CGIR to a code listing for an abstract
+## machine that focuses on control-flow and exception handling.
+##
+## This code listing is intended for consumption by the C code generator.
+
+import
+  std/[
+    options,
+    packedsets,
+    tables
+  ],
+  compiler/backend/[
+    cgir
+  ],
+  compiler/utils/[
+    idioms
+  ]
+
+type
+  COpcode* = enum
+    opJump       ## unconditional jump
+    opErrJump    ## jump if in error mode
+    opDispJump   ## jump part of a dispatcher
+    opLabel      ## jump target
+
+    opSetTarget  ## set the value of a dispatcher's discriminator
+    opDispatcher ## start of a dispatcher
+
+    opBackup     ## backup the error state in a local variable and clear it
+    opRestore    ## restore the error from a local variable
+
+    opStmts      ## slice of statements
+    opStmt       ## control-flow relevant single statement. A label
+                 ## specifier is passed along
+    # future direction: ``CStmt`` should be removed and all unstructured
+    # control-flow bits modeled with the other instructions. Checked calls
+    # used as an assignment source currently block this, as they might
+    # require an assignment-to-temporary
+
+    opAbort
+    opPopHandler
+
+  JumpOp = range[opJump..opDispJump]
+
+  CLabelId* = distinct uint32
+  CLabelSpecifier* = uint32
+    ## used for identifying the extra labels attached to finally sections
+
+  CLabel* = tuple
+    ## Name of a label.
+    id: CLabelId
+    specifier: Option[CLabelSpecifier]
+
+  CInstr* = object
+    case op*: COpcode
+    of opJump, opErrJump, opLabel, opDispJump:
+      label*: CLabel
+    of opSetTarget, opDispatcher:
+      discr*: uint32 ## ID of the discriminator variable
+      value*: int    ## either the value, or number of dispatcher branches
+    of opStmts:
+      stmts*: Slice[int]
+    of opStmt:
+      stmt*: int
+      specifier*: CLabelSpecifier
+    of opBackup, opRestore, opAbort:
+      local*: uint32 ## ID of the backup variable
+    of opPopHandler:
+      discard
+
+  FinallyInfo* = object
+    routes: seq[PathIndex]
+    numExits: int
+      ## number of exits the finally has. Pre-computed for efficiency
+    numErr: int
+      ## number of exceptional jump paths going through this finalizer
+    numNormal: int
+      ## number of non-exception jump paths going through this finalizer
+
+    discriminator: uint32
+      ## ID of the discriminator variable to use for the dispatcher
+    errBackupId: uint32
+      ## only valid if the finally is entered by exceptional control-flow
+
+  PathKind = enum
+    pkError
+    pkNormal
+  PathIndex = uint32
+    ## Index of a ``PathItem`` within the item storage.
+  PathItemTarget = object
+    label: CLabelId
+    isCleanup: bool
+  PathItem = object
+    ## Represents a step in a jump path. A jump path is a chain of finally
+    ## sections plus the final target that an intercepted goto visits.
+    ##
+    ## An item is part of two intrusive linked-lists: one doubly-linked-list
+    ## representing a single chain, and one singly-linked-list for the
+    ## adjacent chains. The "none" value for a pointer is represented by it
+    ## pointing to the node itself.
+    prev, next: PathIndex
+    sibling: PathIndex
+
+    target: PathItemTarget
+      ## the identifier of the jump target
+    kinds: set[PathKind]
+      ## the kinds of control-flow (exception or normal) reaching the path
+      ## item
+
+  Paths = seq[PathItem]
+    ## The data storage for multiple jump paths, with the items laid out
+    ## "tail first", meaning that the final target of a jump chain comes
+    ## *before* the others. The idea is to uniquely identify jump paths
+    ## within a body while merging common trailing paths.
+    ##
+    ## Consider the two jump paths E->D->C->B->A and G->F->C->B->A. If
+    ## both are added to the storage, the content would look like this:
+    ##
+    ##    (0: A) -> (1: B) -> (2: C) -> (3: D) -> (4: E)
+    ##                                \ (5: F) -> (6: G)
+    ##
+    ## The numbers represent the items' index in the sequence. The `sibling`
+    ## item of 3 is 5 (all other items have no siblings); the `next` pointer
+    ## of 5 points to 2. As can be seen, common trailing paths are merged into
+    ## one.
+
+  Context = object
+    ## Local state used during the translation bundled into an object for
+    ## convenience.
+    paths: Paths
+    stmtToPath: Table[int, int]
+    finallys: Table[CLabelId, FinallyInfo]
+    cleanups: Table[CLabelId, FinallyInfo]
+      ## cleanup here refers to the exception-related cleanup when
+      ## exiting a finally or except section
+
+const
+  ExitLabel* = CLabelId(0)
+    ## The label of the procedure exit.
+  ResumeLabel* = ExitLabel
+    ## The C label that a ``cnkResume`` targets.
+
+func `==`*(a, b: CLabelId): bool {.borrow.}
+
+func toCLabel*(n: CgNode): CLabelId =
+  ## Returns the ID of the C label the label-like node `n` represents.
+  case n.kind
+  of cnkResume:
+    ResumeLabel
+  of cnkLabel:
+    CLabelId(ord(n.label) + 2)
+  of cnkLeave:
+    toCLabel(n[0])
+  else:
+    unreachable(n.kind)
+
+func toCLabel*(n: CgNode, specifier: Option[CLabelSpecifier]
+              ): CLabel {.inline.} =
+  (toCLabel(n), specifier)
+
+func toBlockId*(id: CLabelId): BlockId =
+  ## If `id` was converted from a valid CGIR label, converts it back to
+  ## the CGIR label.
+  BlockId(ord(id) - 2)
+
+func rawAdd(p: var Paths, x: openArray[PathItemTarget]): PathIndex =
+  ## Appends the chain `x` to `p` without any deduplication or
+  ## linking with the existing items. Returns the index of the
+  ## tail item.
+  result = p.len.PathIndex
+  for i in countdown(x.high, 0):
+    let pos = p.len.PathIndex
+    p.add PathItem(prev: (if i > 0: pos + 1 else: pos),
+                   next: (if i < x.high: pos - 1 else: pos),
+                   sibling: pos,
+                   target: x[i])
+
+func add(p: var Paths, path: openArray[PathItemTarget]): PathIndex =
+  ## Adds `path` to the `p`. Only the sub-path of `path` not yet present in
+  ## `p` is added. The index of the *head* item of the added (or existing)
+  ## path is returned.
+  if p.len == 0:
+    discard rawAdd(p, path)
+    p[0].next = 0'u32
+    return p.high.PathIndex
+
+  var pos = 0'u32 ## the current search position
+  for i in countdown(path.len-1, 0):
+    # search the sibling list for a matching item:
+    while p[pos].target != path[i] and pos != p[pos].sibling:
+      pos = p[pos].sibling
+
+    if p[pos].target != path[i]:
+      # no item was found, meaning that this is the end of the common paths.
+      # Add the remaining items to the storage.
+      let next = rawAdd(p, path.toOpenArray(0, i))
+      p[pos].sibling = next
+      # only set the next pointer if there was a common sub-path (otherwise
+      # there's no next item):
+      if i != path.high:
+        p[next].next = p[pos].next
+      return p.high.PathIndex
+
+    # it's a match! continue down the chain
+    if i > 0:
+      if p[pos].prev == pos:
+        # there's no next item, append the remaining new targets to the
+        # pre-existing path
+        let next = rawAdd(p, path.toOpenArray(0, i-1))
+        p[pos].prev = next
+        p[next].next = pos
+        return p.high.PathIndex
+      else:
+        pos = p[pos].prev
+
+  # the chain `path` already exists in `p`
+  result = pos
+
+func incl(p: var Paths, at: PathIndex, kind: PathKind) =
+  ## Marks all items following and including `at` with `kind`.
+  var i = at
+  while p[i].next != i:
+    p[i].kinds.incl kind
+    i = p[i].next
+  p[i].kinds.incl kind
+
+func needsDispatcher(f: FinallyInfo): bool =
+  # a dispatcher is required if there is more than one exit. An exception is
+  # the case where one exit is only taken when in error mode and the other is
+  # not. If a dispatcher is required, the finally has sub-labels.
+  f.numExits > 1 and
+    not(f.routes.len == 2 and f.numErr == 1 and f.numNormal == 1)
+
+func needsSpecifier(c: Context, target: PathItemTarget): bool =
+  # cleanup sections don't have a unique label themselves, so using a
+  # specifier is required
+  target.isCleanup or
+    ((target.label in c.finallys) and
+     needsDispatcher(c.finallys[target.label]))
+
+proc append(targets: var seq[PathItemTarget],
+            redirects: Table[BlockId, CgNode],
+            exits: PackedSet[BlockId], n: CgNode) =
+  ## Appends all jump targets `n` represents to `targets`, following
+  ## `redirects` and turning all labels part of `exits` into the
+  ## "before return" label.
+  template addTarget(t: CLabelId; cleanup = false) =
+    targets.add PathItemTarget(label: t, isCleanup: cleanup)
+
+  case n.kind
+  of cnkLabel:
+    if n.label in redirects:
+      append(targets, redirects, exits, redirects[n.label])
+    elif n.label in exits:
+      addTarget ExitLabel
+    else:
+      addTarget toCLabel(n)
+  of cnkTargetList:
+    # only the final target could possibly be redirected
+    let hasRedir = n[^1].kind == cnkLabel and n[^1].label in redirects
+    for i in 0..<n.len - ord(hasRedir):
+      case n[i].kind
+      of cnkLeave:
+        addTarget toCLabel(n[i][0]), cleanup=true
+      of cnkResume:
+        addTarget toCLabel(n[i])
+      of cnkLabel:
+        if n[i].label in exits:
+          addTarget ExitLabel
+        else:
+          addTarget toCLabel(n[i])
+      else:
+        unreachable()
+
+    if hasRedir:
+      append(targets, redirects, exits, redirects[n[^1].label])
+  else:
+    unreachable()
+
+proc gatherRedirectsAndFinallys(c: var Context, stmts: CgNode
+                               ): Table[BlockId, CgNode] =
+  ## First pass: gather the redirects for redundant labels. Consider:
+  ##   L1:
+  ##   goto L2
+  ##
+  ## Here, all jumps to L1 can jump to L2 directly. This pattern is
+  ## especially common with compiler-generated cleanup sections.
+  ##
+  ## The table for the finally sections is also populated.
+  for i in 0..<stmts.len - 1:
+    case stmts[i].kind
+    of cnkJoinStmt:
+      var j = i + 1
+      # skip join and end statements:
+      while j < stmts.len and stmts[j].kind in {cnkJoinStmt, cnkEnd}:
+        inc j
+
+      # if the label is followed directly by a goto statement, all jumps to
+      # the label can jump to the goto's target instead
+      if j < stmts.len and stmts[j].kind == cnkGotoStmt:
+        result[stmts[i][0].label] = stmts[j][0]
+    of cnkFinally:
+      # make sure a table entry exists for the finally section:
+      c.finallys[toCLabel(stmts[i][0])] = FinallyInfo()
+    else:
+      discard
+
+proc toInstrList*(stmts: CgNode, isFull: bool): seq[CInstr] =
+  ## Turns the statements list `stmts` into an instruction list for the
+  ## abstract machine. `isFull` signals whether the end of the statement list
+  ## can be considered the end of the procedure, which allows for the merging
+  ## of some control-flow paths.
+  var c = Context()
+  let redirects = gatherRedirectsAndFinallys(c, stmts) # first pass
+
+  # mark the labels of the trailing joins as being the same as the exit
+  # label...
+  var exits: PackedSet[BlockId]
+  if isFull:
+    # ... but only if `stmts` constitutes the whole body
+    for i in countdown(stmts.len - 1, 0):
+      if stmts[i].kind == cnkJoinStmt:
+        exits.incl stmts[i][0].label
+      else:
+        break
+
+  # second pass: collect all jump paths, using the table of redirections to
+  # eliminate unnecessary breaks in the paths
+  var targets: seq[PathItemTarget]
+  for i, it in stmts.pairs:
+    template exit(x: CgNode; isErr = false) =
+      targets.setLen(0)
+      targets.append(redirects, exits, x)
+
+      # a single jump is only of relevance if it targets a finally directly
+      if targets.len > 1 or targets[0].label in c.finallys:
+        let id = c.paths.add(targets)
+        if isErr: incl(c.paths, id, pkError)
+        else:     incl(c.paths, id, pkNormal)
+
+        # remember the path associated with the statement for later:
+        c.stmtToPath[i] = id.int
+
+    case it.kind
+    of cnkDef, cnkAsgn, cnkFastAsgn:
+      if it[1].kind == cnkCheckedCall:
+        exit(it[1][^1], true)
+    of cnkRaiseStmt, cnkCheckedCall:
+      exit(it[^1], true)
+    of cnkGotoStmt:
+      exit(it[0])
+    of cnkCaseStmt:
+      for j in 1..<it.len:
+        exit(it[j][^1])
+    of cnkExcept:
+      if it.len > 1:
+        exit(it[^1], true)
+    else:
+      discard
+
+  # register every path item with the finally section it targets, and compute
+  # some statistics that are used during the later code generation:
+  for i, it in c.paths.pairs:
+    func setup(f: var FinallyInfo, it: PathItem) =
+      f.routes.add i.PathIndex
+      f.numExits += ord(it.next.int != i)
+      f.numErr += ord(pkError in it.kinds)
+      f.numNormal += ord(pkNormal in it.kinds)
+
+    if it.target.isCleanup:
+      setup(c.cleanups.mgetOrPut(it.target.label, FinallyInfo()), it)
+    elif it.target.label in c.finallys:
+      setup(c.finallys[it.target.label], it)
+
+  # construction of the instruction list follows
+
+  proc label(code: var seq[CInstr], id: CLabelId;
+             spec = none(CLabelSpecifier)) {.nimcall.} =
+    # a label must always be preceded by some code, so no length guard is
+    # required
+    if code[^1].op in {opJump, opErrJump} and code[^1].label.id == id and
+       code[^1].label.specifier == spec:
+      # optimization: remove the preceding jump if it targets the label
+      code.setLen(code.len - 1)
+    code.add CInstr(op: opLabel, label: (id, spec))
+
+  proc jump(code: var seq[CInstr], target: CLabelId) {.nimcall.} =
+    code.add CInstr(op: opJump, label: (target, none CLabelSpecifier))
+
+  proc jump(code: var seq[CInstr], op: JumpOp, c: Context,
+            path: PathIndex) {.nimcall.} =
+    let target = c.paths[path].target
+    if needsSpecifier(c, target):
+      code.add CInstr(op: op, label: (target.label, some path))
+    else:
+      code.add CInstr(op: op, label: (target.label, none CLabelSpecifier))
+
+  proc stmt(code: var seq[CInstr], c: Context, pos: int) {.nimcall.} =
+    if (let path = c.stmtToPath.getOrDefault(pos, -1); path != -1 and
+        needsSpecifier(c, c.paths[path].target)):
+      # a label specifier, and thus a separate instruction, is needed
+      code.add CInstr(op: opStmt, stmt: pos, specifier: CLabelSpecifier path)
+    elif code.len > 0 and code[^1].op == opStmts and
+         code[^1].stmts.b == pos - 1:
+      # the preceding slice ends directly before `pos`; extend it by one
+      inc code[^1].stmts.b
+    else:
+      # start a new sequence
+      code.add CInstr(op: opStmts, stmts: pos..pos)
+
+  var
+    code: seq[CInstr]
+    nextDispId = 0'u32
+    nextRecoverID = 0'u32
+
+  for i, it in stmts.pairs:
+    case it.kind
+    of cnkFinally:
+      stmt code, c, i
+      let
+        clabel = toCLabel(it[0])
+        f = addr c.finallys[clabel]
+
+      # allocate and set the ID for the discriminator variable:
+      f.discriminator = nextDispId
+      inc nextDispId
+
+      # emit the entry-point(s); one for each route
+      if needsDispatcher(f[]):
+        # an entry point looks like this:
+        #   L1_1_:
+        #   Target = ...
+        #   goto L1_
+        for i, entry in f.routes.pairs:
+          label code, clabel, some(entry)
+          code.add CInstr(op: opSetTarget, discr: f.discriminator, value: i)
+          # jump to the main code:
+          jump code, clabel
+
+      # the body follows:
+      label code, clabel
+      if f.numErr > 0:
+        # backing up the error state is only needed when the finally is
+        # entered by exceptional control-flow
+        f.errBackupId = nextRecoverID
+        code.add CInstr(op: opBackup, local: nextRecoverID)
+        inc nextRecoverID
+
+    of cnkContinueStmt:
+      let
+        clabel = toCLabel(it[0])
+        f {.cursor.} = c.finallys[clabel]
+
+      # no need to restore the error state if control-flow never reaches the
+      # end of the finally anyway
+      if f.numErr > 0 and f.numExits > 0:
+        code.add CInstr(op: opRestore, local: f.errBackupId)
+
+      if f.numExits == 0:
+        discard "the end is never reached; nothing to do"
+      elif not needsDispatcher(f) and f.routes.len == 2:
+        # optimization: if two paths go through a finally, with one of them
+        # an exceptional jump path and the other one not, instead of using a
+        # full dispatcher we emit:
+        #   if err: goto error_exit
+        #   goto normal_exit
+        let exit = if c.paths[f.routes[0]].kinds == {pkError}: 0 else: 1
+        jump code, opErrJump, c, c.paths[f.routes[exit]].next
+        jump code, opJump,    c, c.paths[f.routes[1 - exit]].next
+      else:
+        assert f.routes.len == f.numExits
+        # a dispatcher is only required if there is more than one exit
+        let op = if f.numExits > 1: opDispJump
+                 else:              opJump
+
+        if op == opDispJump:
+          code.add CInstr(op: opDispatcher, discr: f.discriminator,
+                          value: f.numExits)
+
+        for it in f.routes.items:
+          jump code, op, c, c.paths[it].next
+
+      # emit the exception-related cleanup after the dispatcher:
+      if clabel in c.cleanups:
+        let cleanup {.cursor.} = c.cleanups[clabel]
+        # a dispatcher is not worth the overhead, emit an abort instruction
+        # for each route
+        for entry in cleanup.routes.items:
+          label code, clabel, some(entry)
+          # TODO: omit the cleanup logic as a whole, if the finally section is
+          #       never entered via an exception
+          if f.numErr > 0:
+            code.add CInstr(op: opAbort, local: f.errBackupId)
+          jump code, opJump, c, PathIndex c.paths[entry].next
+
+      stmt code, c, i
+
+    of cnkJoinStmt:
+      # XXX: labels that were redirected cannot be eliminated yet, as case
+      #      statements (which are handled outside of ccgflow) might still
+      #      target them
+      label code, toCLabel(it[0])
+    of cnkExcept:
+      # an except section is a label followed by the filter logic
+      label code, toCLabel(it[0])
+      stmt code, c, i
+    of cnkEnd:
+      let clabel = toCLabel(it[0])
+      # emit the cleanup for except sections:
+      if clabel in c.cleanups:
+        let cleanup {.cursor.} = c.cleanups[clabel]
+        # a dispatcher is not worth the overhead, emit a pop instruction
+        # for each route
+        for entry in cleanup.routes.items:
+          label code, clabel, some(entry)
+          code.add CInstr(op: opPopHandler)
+          jump code, opJump, c, PathIndex c.paths[entry].next
+
+      stmt code, c, i
+
+    of cnkGotoStmt:
+      let target = it[0]
+      if (let path = c.stmtToPath.getOrDefault(i, -1); path != -1):
+        jump code, opJump, c, PathIndex path
+      elif target.kind == cnkLabel:
+        jump code, toCLabel(target)
+      else:
+        jump code, toCLabel(target[^1])
+    of cnkRaiseStmt:
+      stmt code, c, i # the statement handles the exception setup part
+      # the goto part is the same as for a normal goto
+      let target = it[^1]
+      if target.kind == cnkLabel:
+        jump code, toCLabel(target)
+      elif (let path = c.stmtToPath.getOrDefault(i, -1); path != -1):
+        jump code, opJump, c, PathIndex path
+      else:
+        jump code, toCLabel(target[^1])
+
+    else:
+      stmt code, c, i
+
+  result = code
diff --git a/compiler/backend/ccgstmts.nim b/compiler/backend/ccgstmts.nim
index 811116a43c1..feb064bd623 100644
--- a/compiler/backend/ccgstmts.nim
+++ b/compiler/backend/ccgstmts.nim
@@ -15,29 +15,14 @@ const
   stringCaseThreshold = 8
     # above X strings a hash-switch for strings is generated
 
-proc inExceptBlockLen(p: BProc): int =
-  for x in p.nestedTryStmts:
-    if x.inExcept: result.inc
-
-proc startBlockInternal(p: BProc, blk: int) =
-  inc(p.labels)
+proc startBlockInternal(p: BProc) =
   let result = p.blocks.len
   setLen(p.blocks, result + 1)
-  p.blocks[result].id = p.labels
-  p.blocks[result].blk = blk
-  p.blocks[result].nestedTryStmts = p.nestedTryStmts.len.int16
-  p.blocks[result].nestedExceptStmts = p.inExceptBlockLen.int16
 
 template startBlock(p: BProc, start: FormatStr = "{$n",
-                args: varargs[Rope]) =
+                args: varargs[Rope]) {.used.} =
   lineCg(p, cpsStmts, start, args)
-  startBlockInternal(p, 0)
-
-template startBlock(p: BProc, id: BlockId) =
-  lineCg(p, cpsStmts, "{$n", [])
-  startBlockInternal(p, id.int + 1)
-
-proc endBlock(p: BProc)
+  startBlockInternal(p)
 
 proc loadInto(p: BProc, le, ri: CgNode, a: var TLoc) {.inline.} =
   if ri.kind in {cnkCall, cnkCheckedCall} and
@@ -54,10 +39,6 @@ proc loadInto(p: BProc, le, ri: CgNode, a: var TLoc) {.inline.} =
     a.flags.incl(lfEnforceDeref)
     expr(p, ri, a)
 
-proc assignLabel(b: var TBlock): Rope {.inline.} =
-  b.label = "LA" & b.id.rope
-  result = b.label
-
 proc blockBody(b: var TBlock): Rope =
   result = b.sections[cpsLocals]
   if b.frameLen > 0:
@@ -80,48 +61,9 @@ proc endBlock(p: BProc) =
   var blockEnd: Rope
   if frameLen > 0:
     blockEnd.addf("FR_.len-=$1;$n", [frameLen.rope])
-  if p.blocks[topBlock].label != "":
-    blockEnd.addf("} $1: ;$n", [p.blocks[topBlock].label])
-  else:
-    blockEnd.addf("}$n", [])
+  blockEnd.addf("}$n", [])
   endBlock(p, blockEnd)
 
-proc stmtBlock(p: BProc, n: CgNode) =
-  startBlock(p)
-  genStmts(p, n)
-  endBlock(p)
-
-proc blockLeaveActions(p: BProc, howManyTrys, howManyExcepts: int) =
-  # Called by return and break stmts.
-  # Deals with issues faced when jumping out of try/except/finally stmts.
-
-  var stack = newSeq[typeof(p.nestedTryStmts[0])](0)
-
-  inc p.withinBlockLeaveActions
-  for i in 1..howManyTrys:
-    let tryStmt = p.nestedTryStmts.pop
-    # Pop this try-stmt of the list of nested trys
-    # so we don't infinite recurse on it in the next step.
-    stack.add(tryStmt)
-
-    # Find finally-stmt for this try-stmt
-    # and generate a copy of its sons
-    var finallyStmt = tryStmt.fin
-    if finallyStmt != nil:
-      genStmts(p, finallyStmt[0])
-
-  dec p.withinBlockLeaveActions
-
-  # push old elements again:
-  for i in countdown(howManyTrys-1, 0):
-    p.nestedTryStmts.add(stack[i])
-
-  # Pop exceptions that was handled by the
-  # except-blocks we are in
-  block:
-    for i in countdown(howManyExcepts-1, 0):
-      linefmt(p, cpsStmts, "#popCurrentException();$n", [])
-
 proc genGotoVar(p: BProc; value: CgNode) =
   case value.kind
   of cnkIntLit, cnkUIntLit:
@@ -166,15 +108,7 @@ proc genIf(p: BProc, n: CgNode) =
 
   initLocExprSingleUse(p, n[0], a)
   lineF(p, cpsStmts, "if ($1)$n", [rdLoc(a)])
-  stmtBlock(p, n[1])
-
-proc genReturnStmt(p: BProc, t: CgNode) =
-  p.flags.incl beforeRetNeeded
-  genLineDir(p, t)
-  blockLeaveActions(p,
-    howManyTrys    = p.nestedTryStmts.len,
-    howManyExcepts = p.inExceptBlockLen)
-  lineF(p, cpsStmts, "goto BeforeRet_;$n", [])
+  startBlock(p)
 
 proc genGotoForCase(p: BProc; caseStmt: CgNode) =
   for i in 1..<caseStmt.len:
@@ -186,71 +120,51 @@ proc genGotoForCase(p: BProc; caseStmt: CgNode) =
         return
       let val = getOrdValue(it[j])
       lineF(p, cpsStmts, "NIMSTATE_$#:$n", [val.rope])
-    genStmts(p, it.lastSon)
-    endBlock(p)
 
-proc genRepeatStmt(p: BProc, t: CgNode) =
-  # we don't generate labels here as for example GCC would produce
-  # significantly worse code
-  inc(p.withinLoop)
-  genLineDir(p, t)
+    lineCg(p, cpsStmts, "goto $1;$n", [it[^1].label])
+    endBlock(p)
 
-  if true:
-    var loopBody = t[0]
-    if true:
-      startBlock(p, "while (1) {$n")
-      genStmts(p, loopBody)
-      endBlock(p)
-
-  dec(p.withinLoop)
-
-proc genBlock(p: BProc, n: CgNode) =
-  startBlock(p, n[0].label)
-  genStmts(p, n[1])
-  endBlock(p)
-
-proc genBreakStmt(p: BProc, t: CgNode) =
-  assert t[0].kind == cnkLabel
-  var idx = p.blocks.high
-  # search for the ``TBlock`` that corresponds to the label. `blk` stores the
-  # ID offset by 1, which has to be accounted for here
-  while idx >= 0 and p.blocks[idx].blk != (t[0].label.int + 1):
-    dec idx
-
-  let label = assignLabel(p.blocks[idx])
-  blockLeaveActions(p,
-    p.nestedTryStmts.len - p.blocks[idx].nestedTryStmts,
-    p.inExceptBlockLen - p.blocks[idx].nestedExceptStmts)
-  genLineDir(p, t)
-  lineF(p, cpsStmts, "goto $1;$n", [label])
+proc exit(n: CgNode): CgNode =
+  ## Returns the last operand of a checked call; nil for all other nodes.
+  # XXX: only a convenience for the overflow check, index check, etc. code
+  #      generation. Should be removed once those are fully lowered prior
+  #      to code generation
+  if n.kind == cnkCheckedCall:
+    result = n[^1]
+
+proc useLabel(p: BProc, label: CLabel) {.inline.} =
+  ## Sets the `beforeRetNeeded` flag when `label` is the exit label.
+  if label.id == ExitLabel: incl(p.flags, beforeRetNeeded)
+
+proc raiseInstr(p: BProc, n: CgNode): Rope =
+  ## Returns the C statement that transfers control to the exceptional exit
+  ## described by `n`. A nil `n` means that there is no exit to jump to.
+  if n != nil:
+    case n.kind
+    of cnkLabel:
+      # easy case, simply goto the target:
+      result = ropecg(p.module, "goto $1;", [n.label])
+    of cnkTargetList:
+      # the first non-leave operand is the initial jump target
+      let label = toCLabel(n[0], p.specifier)
+      useLabel(p, label)
+      result = ropecg(p.module, "goto $1;", [label])
+    else:
+      unreachable(n.kind)
+  elif hasAssume in CC[p.config.cCompiler].props:
+    # absence of a node storing the target means "never exits"
+    result = "__assume(0);"
+  else:
+    # don't just fall-through; doing so would inhibit C compiler optimizations
+    p.flags.incl beforeRetNeeded
+    result = "goto BeforeRet_;"
 
-proc raiseExit(p: BProc) =
+proc raiseExit(p: BProc, n: CgNode) =
   assert p.config.exc == excGoto
   if nimErrorFlagDisabled notin p.flags:
     p.flags.incl nimErrorFlagAccessed
-    if p.nestedTryStmts.len == 0:
-      p.flags.incl beforeRetNeeded
-      # easy case, simply goto 'ret':
-      lineCg(p, cpsStmts, "if (NIM_UNLIKELY(*nimErr_)) goto BeforeRet_;$n", [])
-    else:
-      lineCg(p, cpsStmts, "if (NIM_UNLIKELY(*nimErr_)) goto LA$1_;$n",
-        [p.nestedTryStmts[^1].label])
-
-proc raiseInstr(p: BProc): Rope =
-  if p.config.exc == excGoto:
-    let L = p.nestedTryStmts.len
-    if L == 0:
-      p.flags.incl beforeRetNeeded
-      # easy case, simply goto 'ret':
-      result = ropecg(p.module, "goto BeforeRet_;$n", [])
-    else:
-      # raise inside an 'except' must go to the finally block,
-      # raise outside an 'except' block must go to the 'except' list.
-      result = ropecg(p.module, "goto LA$1_;$n",
-        [p.nestedTryStmts[L-1].label])
-      # + ord(p.nestedTryStmts[L-1].inExcept)])
-  else:
-    result = ""
+    lineCg(p, cpsStmts, "if (NIM_UNLIKELY(*nimErr_)) $1$n",
+           [raiseInstr(p, n)])
 
 proc genRaiseStmt(p: BProc, t: CgNode) =
   if t[0].kind != cnkEmpty:
@@ -272,12 +186,11 @@ proc genRaiseStmt(p: BProc, t: CgNode) =
     genLineDir(p, t)
     # reraise the last exception:
     linefmt(p, cpsStmts, "#reraiseException();$n", [])
-  let gotoInstr = raiseInstr(p)
-  if gotoInstr != "":
-    line(p, cpsStmts, gotoInstr)
+
+  # the goto is emitted separately
 
 template genCaseGenericBranch(p: BProc, b: CgNode, e: TLoc,
-                          rangeFormat, eqFormat: FormatStr, labl: TLabel) =
+                          rangeFormat, eqFormat: FormatStr, labl: BlockId) =
   var x, y: TLoc
   for i in 0..<b.len - 1:
     if b[i].kind == cnkRange:
@@ -289,49 +202,24 @@ template genCaseGenericBranch(p: BProc, b: CgNode, e: TLoc,
       initLocExpr(p, b[i], x)
       lineCg(p, cpsStmts, eqFormat, [rdCharLoc(e), rdCharLoc(x), labl])
 
-proc genCaseSecondPass(p: BProc, t: CgNode,
-                       labId, until: int): TLabel =
-  var lend = getLabel(p)
-  for i in 1..until:
-    lineF(p, cpsStmts, "LA$1_: ;$n", [rope(labId + i)])
-    if isOfBranch(t[i]):
-      stmtBlock(p, t[i][^1])
-      lineF(p, cpsStmts, "goto $1;$n", [lend])
-    else:
-      stmtBlock(p, t[i][0])
-  result = lend
-
 template genIfForCaseUntil(p: BProc, t: CgNode,
                        rangeFormat, eqFormat: FormatStr,
-                       until: int, a: TLoc): TLabel =
+                       until: int, a: TLoc) =
   # generate a C-if statement for a Nim case statement
-  var res: TLabel
-  var labId = p.labels
   for i in 1..until:
-    inc(p.labels)
     if isOfBranch(t[i]):
       genCaseGenericBranch(p, t[i], a, rangeFormat, eqFormat,
-                           "LA" & rope(p.labels) & "_")
+                           t[i][^1].label)
     else:
-      lineF(p, cpsStmts, "goto LA$1_;$n", [rope(p.labels)])
-  if until < t.len-1:
-    inc(p.labels)
-    var gotoTarget = p.labels
-    lineF(p, cpsStmts, "goto LA$1_;$n", [rope(gotoTarget)])
-    res = genCaseSecondPass(p, t, labId, until)
-    lineF(p, cpsStmts, "LA$1_: ;$n", [rope(gotoTarget)])
-  else:
-    res = genCaseSecondPass(p, t, labId, until)
-  res
+      linefmt(p, cpsStmts, "goto $1;$n", [t[i][^1].label])
 
 template genCaseGeneric(p: BProc, t: CgNode,
                     rangeFormat, eqFormat: FormatStr) =
   var a: TLoc
   initLocExpr(p, t[0], a)
-  var lend = genIfForCaseUntil(p, t, rangeFormat, eqFormat, t.len-1, a)
-  fixLabel(p, lend)
+  genIfForCaseUntil(p, t, rangeFormat, eqFormat, t.len-1, a)
 
-proc genCaseStringBranch(p: BProc, b: CgNode, e: TLoc, labl: TLabel,
+proc genCaseStringBranch(p: BProc, b: CgNode, e: TLoc, labl: BlockId,
                          branches: var openArray[Rope]) =
   var x: TLoc
   for i in 0..<b.len - 1:
@@ -353,15 +241,11 @@ proc genStringCase(p: BProc, t: CgNode) =
     newSeq(branches, bitMask + 1)
     var a: TLoc
     initLocExpr(p, t[0], a) # fist pass: generate ifs+goto:
-    var labId = p.labels
     for i in 1..<t.len:
-      inc(p.labels)
       if isOfBranch(t[i]):
-        genCaseStringBranch(p, t[i], a, "LA" & rope(p.labels) & "_",
-                            branches)
+        genCaseStringBranch(p, t[i], a, t[i][^1].label, branches)
       else:
         # else statement: nothing to do yet
-        # but we reserved a label, which we use later
         discard
     linefmt(p, cpsStmts, "switch (#hashString($1) & $2) {$n",
             [rdLoc(a), bitMask])
@@ -371,10 +255,8 @@ proc genStringCase(p: BProc, t: CgNode) =
              [intLiteral(j), branches[j]])
     lineF(p, cpsStmts, "}$n", []) # else statement:
     if not isOfBranch(t[^1]):
-      lineF(p, cpsStmts, "goto LA$1_;$n", [rope(p.labels)])
-    # third pass: generate statements
-    var lend = genCaseSecondPass(p, t, labId, t.len-1)
-    fixLabel(p, lend)
+      lineCg(p, cpsStmts, "goto $1;$n", [t[^1][0].label])
+
   else:
     genCaseGeneric(p, t, "", "if (#eqStrings($1, $2)) goto $3;$n")
 
@@ -424,10 +306,11 @@ proc genOrdinalCase(p: BProc, n: CgNode) =
   # generate if part (might be empty):
   var a: TLoc
   initLocExpr(p, n[0], a)
-  var lend = if splitPoint > 0: genIfForCaseUntil(p, n,
+  if splitPoint > 0:
+    genIfForCaseUntil(p, n,
                     rangeFormat = "if ($1 >= $2 && $1 <= $3) goto $4;$n",
                     eqFormat = "if ($1 == $2) goto $3;$n",
-                    splitPoint, a) else: ""
+                    splitPoint, a)
 
   # generate switch part (might be empty):
   if splitPoint+1 < n.len:
@@ -441,12 +324,11 @@ proc genOrdinalCase(p: BProc, n: CgNode) =
         # else part of case statement:
         lineF(p, cpsStmts, "default:$n", [])
         hasDefault = true
-      stmtBlock(p, branch.lastSon)
-      lineF(p, cpsStmts, "break;$n", [])
+
+      linefmt(p, cpsStmts, "goto $1;$n", [branch[^1].label])
     if (hasAssume in CC[p.config.cCompiler].props) and not hasDefault:
       lineF(p, cpsStmts, "default: __assume(0);$n", [])
     lineF(p, cpsStmts, "}$n", [])
-  if lend != "": fixLabel(p, lend)
 
 proc genCase(p: BProc, t: CgNode) =
   genLineDir(p, t)
@@ -477,98 +359,38 @@ proc bodyCanRaise(p: BProc; n: CgNode): bool =
       if bodyCanRaise(p, it): return true
     result = false
 
-proc genTryGoto(p: BProc; t: CgNode) =
-  let fin = if t[^1].kind == cnkFinally: t[^1] else: nil
-  inc p.labels
-  let lab = p.labels
-  let hasExcept = t[1].kind == cnkExcept
-  if hasExcept: inc p.withinTryWithExcept
-  p.nestedTryStmts.add((fin, false, Natural lab))
+proc genExcept(p: BProc, n: CgNode) =
+  ## Generates and emits the C code for an ``Except`` join point.
 
-  p.flags.incl nimErrorFlagAccessed
-
-  var errorFlagSet = false ## tracks whether the error flag is set to 'true'
-    ## on a control-flow path connected to the finally section
+  if n.len > 1:
+    # it's a handler with a filter/matcher
+    var condExpr = ""
+    for j in 1..<n.len - 1:
+      assert n[j].kind == cnkType
+      if condExpr != "":
+        condExpr.add("||")
 
-  template checkSetsErrorFlag(n: CgNode) =
-    if fin != nil and not errorFlagSet:
-      errorFlagSet = bodyCanRaise(p, n)
+      # make sure the Exception type is available in the module:
+      discard
+        getTypeDesc(p.module, p.module.g.graph.getCompilerProc("Exception").typ)
 
-  genStmts(p, t[0])
-  checkSetsErrorFlag(t[0])
+      appcg(p.module, condExpr, "#isObj(#nimBorrowCurrentException()->Sup.m_type, $1)",
+            [genTypeInfo2Name(p.module, n[j].typ)])
 
-  if 1 < t.len and t[1].kind == cnkExcept:
-    startBlock(p, "if (NIM_UNLIKELY(*nimErr_)) {$n")
+    # jump to the next handler in the chain if the filter doesn't apply
+    linefmt(p, cpsStmts, "if (!($1)) {$2}$n",
+            [condExpr, raiseInstr(p, n[^1])])
   else:
-    startBlock(p)
-  linefmt(p, cpsStmts, "LA$1_:;$n", [lab])
-
-  p.nestedTryStmts[^1].inExcept = true
-  var i = 1
-  while (i < t.len) and (t[i].kind == cnkExcept):
-
-    inc p.labels
-    let nextExcept = p.labels
-    p.nestedTryStmts[^1].label = nextExcept
-
-    if t[i].len == 1:
-      # general except section:
-      if i > 1: lineF(p, cpsStmts, "else", [])
-      startBlock(p)
-      # we handled the exception, remember this:
-      linefmt(p, cpsStmts, "*nimErr_ = NIM_FALSE;$n", [])
-      genStmts(p, t[i][0])
-      checkSetsErrorFlag(t[i][0])
-    else:
-      var orExpr = ""
-      for j in 0..<t[i].len - 1:
-        assert(t[i][j].kind == cnkType)
-        if orExpr != "": orExpr.add("||")
-        let checkFor = genTypeInfo2Name(p.module, t[i][j].typ)
-        let memberName = "Sup.m_type"
-        appcg(p.module, orExpr, "#isObj(#nimBorrowCurrentException()->$1, $2)", [memberName, checkFor])
-
-      if i > 1: line(p, cpsStmts, "else ")
-      startBlock(p, "if ($1) {$n", [orExpr])
-      # we handled the exception, remember this:
-      linefmt(p, cpsStmts, "*nimErr_ = NIM_FALSE;$n", [])
-      genStmts(p, t[i][^1])
-      checkSetsErrorFlag(t[i][^1])
-
-    linefmt(p, cpsStmts, "#popCurrentException();$n", [])
-    linefmt(p, cpsStmts, "LA$1_:;$n", [nextExcept])
-    endBlock(p)
-
-    inc(i)
-  discard pop(p.nestedTryStmts)
-  endBlock(p)
+    discard "catch-all handler, nothing to check"
 
-  if i < t.len and t[i].kind == cnkFinally:
-    startBlock(p)
-    # future direction: the code generator should track for each procedure
-    # whether it observes the error flag. If the finally clause's body
-    # doesn't observes it itself, and also doesn't call any procedure that
-    # does, we can also omit the save/restore pair
-    if not errorFlagSet:
-      # this is an optimization; if the error flag is proven to never be
-      # 'true' when the finally section is reached, we don't need to erase
-      # nor restore it:
-      genStmts(p, t[i][0])
-    else:
-      # pretend we did handle the error for the safe execution of the 'finally' section:
-      p.procSec(cpsLocals).add(ropecg(p.module, "NIM_BOOL oldNimErrFin$1_;$n", [lab]))
-      linefmt(p, cpsStmts, "oldNimErrFin$1_ = *nimErr_; *nimErr_ = NIM_FALSE;$n", [lab])
-      genStmts(p, t[i][0])
-      # this is correct for all these cases:
-      # 1. finally is run during ordinary control flow
-      # 2. finally is run after 'except' block handling: these however set the
-      #    error back to nil.
-      # 3. finally is run for exception handling code without any 'except'
-      #    handler present or only handlers that did not match.
-      linefmt(p, cpsStmts, "*nimErr_ = oldNimErrFin$1_;$n", [lab])
-    endBlock(p)
-  raiseExit(p)
-  if hasExcept: inc p.withinTryWithExcept
+  startBlock(p)
+  p.flags.incl nimErrorFlagAccessed
+  # exit error mode:
+  lineCg(p, cpsStmts, "*nimErr_ = NIM_FALSE;$n", [])
+  # setup the handler frame:
+  var tmp: TLoc
+  getTemp(p, p.module.g.graph.getCompilerProc("ExceptionFrame").typ, tmp)
+  lineCg(p, cpsStmts, "#nimCatchException($1);$n", [addrLoc(p.config, tmp)])
 
 proc genAsmOrEmitStmt(p: BProc, t: CgNode, isAsmStmt=false): Rope =
   var res = ""
@@ -677,7 +499,7 @@ proc genAsgn(p: BProc, e: CgNode) =
     genLineDir(p, ri)
     loadInto(p, le, ri, a)
 
-proc genStmts(p: BProc, t: CgNode) =
+proc genStmt(p: BProc, t: CgNode) =
   var a: TLoc
 
   let isPush = p.config.hasHint(rsemExtendedContext)
@@ -685,3 +507,79 @@ proc genStmts(p: BProc, t: CgNode) =
   expr(p, t, a)
   if isPush: popInfoContext(p.config)
   internalAssert p.config, a.k in {locNone, locTemp, locLocalVar, locExpr}
+
+proc gen(p: BProc, code: openArray[CInstr], stmts: CgNode) =
+  ## Emits the C code for the instructions in `code`; statements are looked up
+  ## by index in `stmts`. This is the main driver of C code generation.
+  var pos = 0
+  while pos < code.len:
+    let it = code[pos]
+    case it.op
+    of opLabel:
+      lineCg(p, cpsStmts, "$1:;$n", [it.label])
+    of opJump:
+      useLabel(p, it.label)
+      lineCg(p, cpsStmts, "goto $1;$n", [it.label])
+    of opDispJump:
+      # must only be part of a dispatcher
+      unreachable()
+    of opSetTarget:
+      lineCg(p, cpsStmts, "Target$1_ = $2;$n", [$it.discr, it.value])
+    of opDispatcher:
+      lineF(p, cpsLocals, "NU8 Target$1_;$N", [$it.discr])
+      lineF(p, cpsStmts, "switch (Target$1_) {$n", [$it.discr])
+      for i in 0..<it.value:
+        inc pos
+        useLabel(p, code[pos].label)
+        lineCg(p, cpsStmts, "case $1: goto $2;$n", [i, code[pos].label])
+
+      # help the C compiler a bit by making the case statement exhaustive
+      if hasAssume in CC[p.config.cCompiler].props:
+        lineF(p, cpsStmts, "default: __assume(0);$n", [])
+      # TODO: use ``__builtin_unreachable();`` for compilers supporting the
+      #       GCC built-ins
+      lineF(p, cpsStmts, "}$n", [])
+    of opBackup:
+      if nimErrorFlagDisabled notin p.flags:
+        p.flags.incl nimErrorFlagAccessed
+        lineCg(p, cpsStmts, "NI32 oldNimErrFin$1_ = *nimErr_; *nimErr_ = NIM_FALSE;$n",
+              [$it.local])
+    of opRestore:
+      if nimErrorFlagDisabled notin p.flags:
+        p.flags.incl nimErrorFlagAccessed
+        lineCg(p, cpsStmts, "*nimErr_ = oldNimErrFin$1_;$n", [$it.local])
+    of opErrJump:
+      if nimErrorFlagDisabled notin p.flags:
+        useLabel(p, code[pos].label)
+        p.flags.incl nimErrorFlagAccessed
+        lineCg(p, cpsStmts, "if (NIM_UNLIKELY(*nimErr_)) goto $1;$n",
+               [it.label])
+
+    of opStmts:
+      # generate the code for all statements; no label specifier is set
+      p.specifier = none CLabelSpecifier
+      for i in it.stmts.items:
+        genStmt(p, stmts[i])
+    of opStmt:
+      p.specifier = some it.specifier
+      genStmt(p, stmts[it.stmt])
+
+    of opAbort:
+      if nimErrorFlagDisabled in p.flags:
+        lineCg(p, cpsStmts, "#nimAbortException();$n", [])
+      else:
+        # there's only something to abort when the finalizer intercepted a
+        # raise, i.e., when the backed-up error flag is set
+        lineCg(p, cpsStmts, "if (NIM_UNLIKELY(oldNimErrFin$1_)) #nimAbortException();$n",
+               [$it.local])
+    of opPopHandler:
+      lineCg(p, cpsStmts, "#nimLeaveExcept();$n", [])
+
+    inc pos
+
+proc genStmts*(p: BProc, n: CgNode) =
+  ## External entry point into the C code generator: generates and emits
+  ## the C code for `n`, the statement list node that makes up the full
+  ## body of the procedure.
+  assert n.kind == cnkStmtList
+  p.gen(toInstrList(n, isFull=true), n)
diff --git a/compiler/backend/cgen.nim b/compiler/backend/cgen.nim
index 86e358e5375..0dbcd114bc3 100644
--- a/compiler/backend/cgen.nim
+++ b/compiler/backend/cgen.nim
@@ -62,12 +62,15 @@ import
     compat,
     extccomp,
     ccgutils,
+    ccgflow,
     cgendata,
     cgir
   ],
   compiler/plugins/[
   ]
 
+import std/options as std_options
+
 # xxx: reports are a code smell meaning data types are misplaced...
 #      like the backend report sem errors.
 from compiler/ast/reports_sem import SemReport,
@@ -159,6 +162,23 @@ proc cgFormatValue(result: var string; value: BiggestInt) =
 proc cgFormatValue(result: var string; value: Int128) =
   result.addInt128 value
 
+proc cgFormatValue(result: var string; value: BlockId) =
+  ## Appends the C label name for `value`, in the form ``LA<id>_``.
+  result.add "LA"
+  result.addInt uint32(value)
+  # the underscore suffix prevents collisions with other names
+  result.add '_'
+
+proc cgFormatValue(result: var string, value: CLabel) =
+  ## Appends the C name of `value`: the exit label is ``BeforeRet_``, other
+  ## labels use the block name, plus ``<specifier>_`` if a specifier is set.
+  if value.id != ExitLabel:
+    result.cgFormatValue(toBlockId(value.id))
+    if isSome(value.specifier):
+      result.addInt unsafeGet(value.specifier)
+      result.add '_'
+  else: result.add "BeforeRet_"
+
 # TODO: please document
 macro ropecg(m: BModule, frmt: static[FormatStr], args: untyped): Rope =
   args.expectKind nnkBracket
@@ -318,7 +338,7 @@ proc registerLateProc(m: BModule, s: PSym): ProcedureId =
 proc accessThreadLocalVar(p: BProc)
 proc emulatedThreadVars*(conf: ConfigRef): bool {.inline.}
 proc useProc(m: BModule, id: ProcedureId)
-proc raiseInstr(p: BProc): Rope
+proc raiseInstr(p: BProc, n: CgNode): Rope
 
 proc getTempName(m: BModule): Rope =
   result = m.tmpBase & rope(m.labels)
@@ -578,22 +598,15 @@ proc fillProcLoc*(m: BModule; id: ProcedureId) =
   if id notin m.procs:
     m.procs[id] = ProcLoc(name: mangleName(m.g.graph, m.g.env[id]))
 
-proc getLabel(p: BProc): TLabel =
-  inc(p.labels)
-  result = "LA" & rope(p.labels) & "_"
-
-proc fixLabel(p: BProc, labl: TLabel) =
-  lineF(p, cpsStmts, "$1: ;$n", [labl])
-
 proc genVarPrototype*(m: BModule, id: GlobalId)
 proc genProcPrototype*(m: BModule, id: ProcedureId)
-proc genStmts*(p: BProc, t: CgNode)
+proc genStmt(p: BProc, t: CgNode)
 proc expr(p: BProc, n: CgNode, d: var TLoc)
 proc putLocIntoDest(p: BProc, d: var TLoc, s: TLoc)
 proc intLiteral(i: BiggestInt): Rope
 proc intLiteral(p: BProc, i: Int128, ty: PType): Rope
 proc genLiteral(p: BProc, n: CgNode): Rope
-proc raiseExit(p: BProc)
+proc raiseExit(p: BProc, n: CgNode)
 
 proc initLocExpr(p: BProc, e: CgNode, result: var TLoc) =
   initLoc(result, locNone, e, OnUnknown)
@@ -848,7 +861,7 @@ proc genPartial*(p: BProc, n: CgNode) =
   ## is intended for CG IR that wasn't already available when calling
   ## `startProc`.
   synchronize(p.locals, p.body.locals)
-  genStmts(p, n)
+  gen(p, toInstrList(n, isFull=false), n)
 
 proc genProcPrototype(m: BModule, id: ProcedureId) =
   let sym = m.g.env[id]
diff --git a/compiler/backend/cgendata.nim b/compiler/backend/cgendata.nim
index 1141bf9637e..4ebb9262597 100644
--- a/compiler/backend/cgendata.nim
+++ b/compiler/backend/cgendata.nim
@@ -41,6 +41,7 @@ import
     pathutils
   ]
 
+import std/options as std_options
 
 type
   SymbolMap*[T] = object
@@ -136,15 +137,7 @@ type
   BModule* = ref TCGen
   BProc* = ref TCProc
   TBlock* = object
-    id*: int                  ## the ID of the label; positive means that it
-    blk*: int                 ## the ``BlockId`` + 1 of the block.
-                              ## '0' if the ``TBlock`` doesn't correspond to a
-                              ## ``cnkBlockStmt``
-    label*: Rope              ## generated text for the label
-                              ## nil if label is not used
     sections*: TCProcSections ## the code belonging
-    nestedTryStmts*: int16    ## how many try statements is it nested into
-    nestedExceptStmts*: int16 ## how many except statements is it nested into
     frameLen*: int16
 
   TCProcFlag* = enum
@@ -160,21 +153,18 @@ type
     flags*: set[TCProcFlag]
     lastLineInfo*: TLineInfo  ## to avoid generating excessive 'nimln' statements
     currLineInfo*: TLineInfo  ## AST codegen will make this superfluous
-    nestedTryStmts*: seq[tuple[fin: CgNode, inExcept: bool, label: Natural]]
-                              ## in how many nested try statements we are
-                              ## (the vars must be volatile then)
-                              ## bool is true when are in the except part of a try block
     labels*: Natural          ## for generating unique labels in the C proc
     blocks*: seq[TBlock]      ## nested blocks
     options*: TOptions        ## options that should be used for code
                               ## generation; this is the same as prc.options
                               ## unless prc == nil
     module*: BModule          ## used to prevent excessive parameter passing
-    withinLoop*: int          ## > 0 if we are within a loop
-    withinTryWithExcept*: int ## required for goto based exception handling
-    withinBlockLeaveActions*: int ## complex to explain
     sigConflicts*: CountTable[string]
 
+    specifier*: Option[uint32]
+    # XXX: `specifier` is a hack. Some parts of the code generator manually
+    #      emit gotos, and thus need a label specifier, but they shouldn't
+
     body*: Body               ## the procedure's full body
     locals*: OrdinalSeq[LocalId, TLoc]
       ## the locs for all locals of the procedure
@@ -319,7 +309,6 @@ proc newProc*(prc: PSym, module: BModule): BProc =
   result.options = if prc != nil: prc.options
                    else: module.config.options
   newSeq(result.blocks, 1)
-  result.nestedTryStmts = @[]
   result.sigConflicts = initCountTable[string]()
 
 proc newModuleList*(g: ModuleGraph): BModuleList =
diff --git a/compiler/backend/cgir.nim b/compiler/backend/cgir.nim
index 912a3ae19f4..2b489202d4f 100644
--- a/compiler/backend/cgir.nim
+++ b/compiler/backend/cgir.nim
@@ -43,6 +43,9 @@ type
     cnkMagic         ## name of a magic procedure. Only valid in the callee
                      ## slot of ``cnkCall`` and ``cnkCheckedCall`` nodes
 
+    cnkResume        ## leave the current procedure as part of exceptional
+                     ## control-flow
+
     cnkCall          ## a procedure call. The first operand is the procedure,
                      ## the following operands the arguments
     cnkCheckedCall   ## like ``cnkCall``, but the call might raise an exception
@@ -103,9 +106,8 @@ type
 
     cnkStmtList
     cnkStmtListExpr
-    # future direction: remove ``cnkStmtListExpr``. The code generators know
-    # based on the context a statement list appears in whether its an
-    # expression or not
+    # XXX: both stmtlist and stmtlistexpr are obsolete. They're only kept for
+    #      grouping the top-level statements under a single node
 
     cnkVoidStmt   ## discard the operand value (i.e., do nothing with it)
     cnkEmitStmt   ## an ``emit`` statement
@@ -115,23 +117,29 @@ type
                   ## evaluates to 'true'
     cnkRepeatStmt ## execute the body indefinitely
     cnkCaseStmt   ## a ``case`` statement
+    cnkBranch     ## the branch of a ``case`` statement
     cnkBlockStmt  ## an (optionally) labeled block
+    cnkTryStmt
 
+    cnkGotoStmt
+    cnkLoopStmt   ## jump back to a loop join point
     cnkBreakStmt  ## break out of labeled block, or, if no label is provided,
                   ## the closest ``repeat`` loop
     cnkRaiseStmt  ## raise(x) -- set the `x` as the current exception and start
                   ## exceptional control-flow. `x` can be ``cnkEmpty`` in which
                   ## case "set current exception" part is skipped
-    # future direction: lower the high-level raise statements (which means
-    # "set the current exception" + "start exceptional control-flow") into
-    # just "start exceptional control-flow"
     cnkReturnStmt
+    cnkContinueStmt## jump to the next target in the active jump list
 
-    cnkTryStmt
-    cnkExcept
+    cnkJoinStmt   ## join point for gotos
+    cnkLoopJoinStmt## join point for loops
+    cnkEnd        ## marks the end of a structured control-flow block
+                  ## (identified by the label)
+    cnkExcept     ## special join point, representing an exception handler
     cnkFinally
 
-    cnkBranch     ## the branch of a ``case`` statement
+    cnkTargetList ## an ordered list of jump target/actions
+    cnkLeave
 
     cnkDef        ## starts the lifetime of a local and optionally assigns an
                   ## initial value
@@ -147,12 +155,19 @@ const
   cnkWithOperand*  = {cnkConv, cnkHiddenConv, cnkDeref, cnkAddr, cnkHiddenAddr,
                       cnkDerefView, cnkObjDownConv, cnkObjUpConv, cnkCast,
                       cnkLvalueConv}
-  cnkAtoms*        = {cnkInvalid..cnkMagic, cnkReturnStmt}
+  cnkAtoms*        = {cnkInvalid..cnkResume, cnkReturnStmt}
     ## node kinds that denote leafs
   cnkWithItems*    = AllKinds - cnkWithOperand - cnkAtoms
     ## node kinds for which the ``items`` iterator is available
 
   cnkLiterals* = {cnkIntLit, cnkUIntLit, cnkFloatLit, cnkStrLit}
+  cnkLegacyNodes* = {cnkBlockStmt, cnkTryStmt, cnkReturnStmt, cnkBreakStmt,
+                     cnkRepeatStmt}
+    ## node kinds that belong to the legacy control-flow representation
+  cnkNewCfNodes* = {cnkGotoStmt, cnkJoinStmt, cnkLeave, cnkResume,
+                    cnkContinueStmt, cnkLoopStmt, cnkLoopJoinStmt,
+                    cnkEnd, cnkTargetList}
+    ## node kinds that belong to the new-style control-flow representation
 
 type
   Local* = object
@@ -184,7 +199,8 @@ type
     info*: TLineInfo
     typ*: PType
     case kind*: CgNodeKind
-    of cnkInvalid, cnkEmpty, cnkType, cnkNilLit, cnkReturnStmt: discard
+    of cnkInvalid, cnkEmpty, cnkType, cnkNilLit, cnkReturnStmt, cnkResume:
+      discard
     of cnkIntLit, cnkUIntLit:
       # future direction: use a ``BiggestUint`` for uint values
       intVal*: BiggestInt
@@ -281,18 +297,34 @@ proc merge*(dest: var Body, source: Body): CgNode =
   # merge the locals:
   let offset = dest.locals.merge(source.locals)
 
-  proc update(n: CgNode, offset: uint32) {.nimcall.} =
+  proc update(n: CgNode, offset, labelOffset: uint32) {.nimcall.} =
     ## Offsets the ID of all references-to-``Local`` in `n` by `offset`.
     case n.kind
     of cnkLocal:
       n.local.uint32 += offset
-    of cnkAtoms - {cnkLocal}:
+    of cnkLabel:
+      n.label.uint32 += labelOffset
+    of cnkAtoms - {cnkLocal, cnkLabel}:
+      discard "nothing to do"
+    of cnkWithOperand:
+      update(n.operand, offset, labelOffset)
+    of cnkWithItems:
+      for it in n.items:
+        update(it, offset, labelOffset)
+
+  proc computeNextLabel(n: CgNode, highest: var uint32) =
+    ## Computes the highest ID value used by labels within `n` and writes it
+    ## to `highest`.
+    case n.kind
+    of cnkLabel:
+      highest = max(n.label.uint32, highest)
+    of cnkAtoms - {cnkLabel}:
       discard "nothing to do"
     of cnkWithOperand:
-      update(n.operand, offset)
+      computeNextLabel(n.operand, highest)
     of cnkWithItems:
       for it in n.items:
-        update(it, offset)
+        computeNextLabel(it, highest)
 
   result = source.code
 
@@ -300,8 +332,10 @@ proc merge*(dest: var Body, source: Body): CgNode =
     # make things easier by supporting `dest` being uninitialized
     dest.code = source.code
   elif source.code.kind != cnkEmpty:
-    # update references to locals in source's code:
-    update(source.code, offset.get(LocalId(0)).uint32)
+    var labelOffset = 0'u32
+    computeNextLabel(dest.code, labelOffset)
+    # update references to locals and labels in source's code:
+    update(source.code, offset.get(LocalId(0)).uint32, labelOffset + 1)
 
     # merge the code fragments:
     case dest.code.kind
diff --git a/compiler/backend/cgirgen.nim b/compiler/backend/cgirgen.nim
index baa1a3b7de5..72963ea341c 100644
--- a/compiler/backend/cgirgen.nim
+++ b/compiler/backend/cgirgen.nim
@@ -41,10 +41,17 @@ import
     int128
   ]
 
+import std/options as std_options
+from std/sequtils import delete
+
 from compiler/ast/ast import newSym, newType, rawAddSon
 from compiler/sem/semdata import makeVarType
 
 type
+  NodeLabelPair = tuple
+    node: CgNode
+    target: LabelId
+
   TranslateCl = object
     graph: ModuleGraph
     idgen: IdGenerator
@@ -56,9 +63,25 @@ type
     localsMap: Table[int, LocalId]
       ## maps a sybmol ID to the corresponding local. Needed because normal
       ## local variables reach here as ``PSym``s
-    blocks: seq[LabelId]
+    blocks: seq[tuple[input, actual: LabelId]]
       ## the stack of enclosing blocks for the currently processed node
 
+    numLabels: int
+      ## incremented when a new label ID is allocated
+    exits: seq[NodeLabelPair]
+      ## non-exception goto-like statements that need patching when crossing
+      ## ``try``, ``finally``, or ``except`` boundaries
+    raiseExits: seq[NodeLabelPair]
+      ## similar to `exits`, but for exceptional control-flow statements/
+      ## nodes. The label doesn't matter, it's only there so that `raiseExits`
+      ## can be passed to the same procedures as `exits`
+    returnLabel: Option[LabelId]
+      ## the label to be placed after all other statements. A label is only
+      ## allocated if an ``mnkReturn`` appears somewhere in the MIR code
+    isActive: bool
+      ## whether translation of statements is enabled. Used to eliminate
+      ## unreachable code
+
     locals: Store[LocalId, Local]
       ## the in-progress list of all locals in the translated body
 
@@ -85,6 +108,12 @@ template isFilled(x: LocalId): bool =
   # temporaries, which can never map to the result variable
   x.int != 0
 
+func delete[T](s: var seq[T], a, b: int) =
+  ## Deletes the items at `a..<b`. XXX: workaround for ``sequtils.delete``
+  ## erroneously raising an IndexDefect when given an empty slice
+  if a < b:
+    sequtils.delete(s, a ..< b)
+
 func newMagicNode(magic: TMagic, info: TLineInfo): CgNode =
   CgNode(kind: cnkMagic, info: info, magic: magic)
 
@@ -94,6 +123,12 @@ func get(t: MirBody, cr: var TreeCursor): lent MirNode {.inline.} =
 
   inc cr.pos
 
+func skip(body: MirBody, cr: var TreeCursor) =
+  ## Moves the cursor past the node or sub-tree it currently points at.
+  let target = uint32(sibling(body.code, NodePosition(cr.pos)))
+  assert cr.pos < target
+  cr.pos = target
+
 func enter(t: MirBody, cr: var TreeCursor): lent MirNode {.inline.} =
   assert t.code[cr.pos].kind in SubTreeNodes, "not a sub-tree"
   result = get(t, cr)
@@ -212,17 +247,6 @@ func addIfNotEmpty(stmts: var seq[CgNode], n: sink CgNode) =
   if n.kind != cnkEmpty:
     stmts.add n
 
-func toSingleNode(stmts: sink seq[CgNode]): CgNode =
-  ## Creates a single ``CgNode`` from a list of *statements*
-  case stmts.len
-  of 0:
-    result = newEmpty()
-  of 1:
-    result = move stmts[0]
-  else:
-    result = newNode(cnkStmtList)
-    result.kids = stmts
-
 proc newDefaultCall(info: TLineInfo, typ: PType): CgNode =
   ## Produces the tree for a ``default`` magic call.
   newExpr(cnkCall, info, typ, [newMagicNode(mDefault, info)])
@@ -259,11 +283,28 @@ proc genObjConv(n: CgNode, a, b, t: PType): CgNode =
     if diff < 0: cnkObjUpConv else: cnkObjDownConv,
     n.info, t): n
 
+proc disable(cl: var TranslateCl) =
+  # consider the following MIR:
+  #   try:
+  #     return
+  #     def _1 = ...
+  #   finally:
+  #     =destroy(name _1)
+  #
+  # Although nonsense, this is currently both legal and possible MIR. If
+  # translation were disabled beyond the ``return``, then the temporary
+  # wouldn't be registered. Therefore, disable is a no-op when in an unscoped
+  # context (such as the above)
+  # XXX: eliminating unreachable code needs to happen much earlier, either in
+  #      ``mirgen`` or ``transf``
+  if not cl.inUnscoped:
+    cl.isActive = false
+
 # forward declarations:
 proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
-              cr: var TreeCursor): CgNode
+              cr: var TreeCursor, stmts: var seq[CgNode])
 proc scopeToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
-               cr: var TreeCursor, allowExpr=false): seq[CgNode]
+               cr: var TreeCursor, stmts: var seq[CgNode], allowExpr=false)
 
 proc handleSpecialConv(c: ConfigRef, n: CgNode, info: TLineInfo,
                        dest: PType): CgNode =
@@ -608,93 +649,279 @@ proc defToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
     unreachable()
 
 proc bodyToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
-              cr: var TreeCursor): CgNode =
+              cr: var TreeCursor, stmts: var seq[CgNode]) =
   ## Generates the ``CgNode`` tree for the body of a construct that implies
   ## some form of control-flow.
   let prev = cl.inUnscoped
   # assume the body is unscoped until stated otherwise
   cl.inUnscoped = true
-  result = stmtToIr(tree, env, cl, cr)
+  stmtToIr(tree, env, cl, cr, stmts)
   cl.inUnscoped = prev
 
 proc caseToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl, n: MirNode,
-              cr: var TreeCursor): CgNode
+              cr: var TreeCursor, stmts: var seq[CgNode])
+
+func newLabel(cl: var TranslateCl): LabelId =
+  ## Allocates a new label ID and returns it.
+  result = LabelId(cl.numLabels)
+  inc cl.numLabels
+
+func getReturnLabel(cl: var TranslateCl): LabelId =
+  ## Returns the label that points to the end of the current procedure.
+  if cl.returnLabel.isSome:
+    result = cl.returnLabel.unsafeGet()
+  else:
+    # allocate a new label first
+    result = newLabel(cl)
+    cl.returnLabel = some result
+
+func node(lbl: LabelId): CgNode =
+  newLabelNode(BlockId(lbl))
+
+proc patch(stmt: CgNode, target: sink CgNode) =
+  ## Appends `target` to the goto-like statement `stmt`, always wrapping
+  ## `target` in a ``cnkTargetList`` if there's none yet.
+  if stmt[^1] == nil:
+    stmt[^1] = newTree(cnkTargetList, unknownLineInfo, target)
+  else:
+    # a target list already exists
+    stmt[^1].kids.add target
+
+proc patchSingle(stmt: CgNode, target: sink CgNode) =
+  ## Appends `target` to the goto-like statement `stmt`.
+  if stmt[^1] == nil:
+    stmt[^1] = target
+  else:
+    stmt[^1].kids.add target
+
+proc patch(x: seq[NodeLabelPair], start: int, exit: LabelId) =
+  for i in start..<x.len:
+    patch(x[i].node, node(exit))
+
+proc patchLeave(x: seq[NodeLabelPair], start: int, exit: LabelId) =
+  for i in start..<x.len:
+    patch(x[i].node, newTree(cnkLeave, x[i].node.info, node(exit)))
+
+proc patchResume(x: seq[NodeLabelPair], start: int) =
+  for i in start..<x.len:
+    patch(x[i].node, newNode(cnkResume, x[i].node.info))
+
+proc join(stmts: var seq[CgNode], cl: var TranslateCl, info: TLineInfo,
+          target: LabelId, required: bool) =
+  ## Emits a join statement with label `target`, enabling translation
+  ## again if it's disabled and an exit targeting `target` exists.
+  ## If `required` is false and a join statement was immediately emitted
+  ## prior, no new join statement is emitted.
+  var label = target
+
+  # if allowed and possible, coalesce a join with the previous one:
+  if not required and stmts.len > 0 and stmts[^1].kind == cnkJoinStmt:
+    label = stmts[^1][0].label.LabelId
+
+  var
+    i = 0
+    found = false
+  # search for exits targeting `target`, update them with the correct label,
+  # and then remove them from the list
+  while i < cl.exits.len:
+    if cl.exits[i][1] == target:
+      patchSingle(cl.exits[i][0], node(label))
+      cl.exits.del(i)
+      # remember that at least one exit was found:
+      found = true
+    else:
+      inc i
+
+  # emit the join, but only if no coalescing took place and the label is
+  # actually targeted:
+  if label == target and (found or required):
+    stmts.add newTree(cnkJoinStmt, info, node(label))
+
+  if found or true:
+    # code is alive if following a join that is targeted by an alive goto
+    # XXX: translation has to be forcefully enabled at a join, even if not
+    #      within a scoped context: the surrounding scope might itself be
+    #      part of an unscoped context. This is a temporary workaround, see
+    #      `disable <#disable,TranslateCl>`_
+    cl.isActive = true
+
+template join(info: TLineInfo, lbl: LabelId; required = false) =
+  join(stmts, cl, info, lbl, required)
+
+template goto(kind: CgNodeKind, info: TLineInfo, target: LabelId) =
+  ## Emits a fixed goto-like statement targeting `target`.
+  stmts.add newStmt(kind, info, node(target))
+
+template exit(lbl: LabelId) =
+  ## Emits a goto statement and registers it with `lbl` as the target.
+  if cl.isActive:
+    let n = newStmt(cnkGotoStmt, unknownLineInfo, nil)
+    stmts.add n
+    cl.exits.add((n, lbl))
+    cl.disable()
+
+template guarded(lbl: LabelId, body: untyped) =
+  ## Updates all exits emitted as part of `body` with a leave instruction
+  ## targeting `lbl`.
+  let
+    raiseStart = cl.raiseExits.len
+    exitStart = cl.exits.len
+  body
+  patchLeave(cl.raiseExits, raiseStart, lbl)
+  patchLeave(cl.exits, exitStart, lbl)
 
 proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
-              cr: var TreeCursor): CgNode =
+              cr: var TreeCursor, stmts: var seq[CgNode]) =
+
+  # skip the statement if translation is disabled
+  if not cl.isActive:
+    tree.skip(cr)
+    return
+
   let n {.cursor.} = tree.get(cr)
   let info = cr.info ## the source information of `n`
 
-  template body(): CgNode =
-    bodyToIr(tree, env, cl, cr)
+  template body() =
+    bodyToIr(tree, env, cl, cr, stmts)
 
-  template to(kind: CgNodeKind, args: varargs[untyped]): CgNode =
+  template to(kind: CgNodeKind, args: varargs[untyped]) =
     let r = newStmt(kind, info, args)
     leave(tree, cr)
-    r
+    stmts.add r
 
-  template toList(k: CgNodeKind, body: untyped): CgNode =
+  template toList(k: CgNodeKind, body: untyped) =
     let res {.inject.} = newStmt(k, info)
     while tree[cr].kind != mnkEnd:
       body
     leave(tree, cr)
-    res
+    stmts.add res
 
   case n.kind
   of DefNodes:
-    defToIr(tree, env, cl, n, cr)
+    stmts.addIfNotEmpty defToIr(tree, env, cl, n, cr)
   of mnkAsgn, mnkInit, mnkSwitch:
     let
       dst = lvalueToIr(tree, cl, cr)
       (src, useFast) = sourceExprToIr(tree, cl, cr)
     to (if useFast: cnkFastAsgn else: cnkAsgn), dst, src
   of mnkRepeat:
-    to cnkRepeatStmt, body()
+    let label = newLabel(cl)
+    stmts.add newTree(cnkLoopJoinStmt, info, node(label))
+    body()
+    stmts.add newStmt(cnkLoopStmt, info, node(label))
+    leave(tree, cr)
   of mnkBlock:
-    cl.blocks.add n.label # push the label to the stack
-    let body = body()
-    cl.blocks.setLen(cl.blocks.len - 1) # pop block from the stack
-    to cnkBlockStmt, newLabelNode(cl.blocks.len.BlockId, info), body
+    cl.blocks.add (n.label, newLabel(cl))
+    body()
+    join info, cl.blocks.pop().actual
+    leave(tree, cr)
   of mnkTry:
-    let res = newStmt(cnkTryStmt, info, [body()])
     assert n.len <= 2
+    let
+      raiseExitStart = cl.raiseExits.len
+      exitStart      = cl.exits.len
+
+    body() # body of the try block
+    let target = newLabel(cl)
+    exit target # jump past the except and/or finally sections
 
     for _ in 0..<n.len:
       let it {.cursor.} = enter(tree, cr)
 
       case it.kind
       of mnkExcept:
-        for _ in 0..<it.len:
-          let br {.cursor.} = enter(tree, cr)
-          assert br.kind == mnkBranch
-
-          let excpt = newNode(cnkExcept, cr.info)
-          for j in 0..<br.len:
-            excpt.add tbExceptItem(tree, cl, cr)
-
-          excpt.add body()
-          res.add excpt
-
-          leave(tree, cr)
-
+        # only translate the except section if it's actually entered
+        if raiseExitStart < cl.raiseExits.len:
+          var next = newLabel(cl)
+            ## the label of the next except branch
+          for i in raiseExitStart..<cl.raiseExits.len:
+            patchSingle(cl.raiseExits[i][0], node(next))
+
+          # translating the handler could add new exceptional exits, so pop
+          # the raise exits first
+          cl.raiseExits.setLen(raiseExitStart)
+
+          for bIdx in 0..<it.len:
+            let br {.cursor.} = enter(tree, cr)
+            assert br.kind == mnkBranch
+
+            let
+              this = next ## label of the current except branch
+              excpt = newTree(cnkExcept, cr.info, node(this))
+            for j in 0..<br.len:
+              excpt.add tbExceptItem(tree, cl, cr)
+
+            # no filters mean that this is a catch-all branch
+            if br.len > 0:
+              if bIdx == it.len-1:
+                # last branch in the handler block
+                excpt.add nil
+                cl.raiseExits.add (excpt, LabelId(0))
+              else:
+                # setup the label for the follow-up handler
+                next = newLabel(cl)
+                excpt.add node(next)
+
+            stmts.add excpt
+            guarded this:
+              cl.isActive = true # each branch starts as active
+              body() # body of the handler
+              exit target # jump to after the try statement
+              stmts.add newStmt(cnkEnd, excpt.info, [node(this)])
+
+            leave(tree, cr)
+
+        else:
+          # skip all branches
+          for _ in 0..<it.len:
+            tree.skip(cr)
       of mnkFinally:
-        res.add newTree(cnkFinally, cr.info, body())
+        # only translate the finally if it's actually entered
+        if raiseExitStart < cl.raiseExits.len or exitStart < cl.exits.len:
+          let label = newLabel(cl)
+          # add the finalizer as an intermediate target
+          patch(cl.raiseExits, raiseExitStart, label)
+          patch(cl.exits, exitStart, label)
+
+          # remember the states prior to translating the body:
+          let
+            raiseExitStart2 = cl.raiseExits.len
+            exitStart2 = cl.exits.len
+
+          stmts.add newStmt(cnkFinally, info, node(label))
+          guarded label:
+            cl.isActive = true
+            body()
+
+          if not cl.isActive:
+            # the finally section has no structured exit. Discard all
+            # intercepted exits; their final target is the finally
+            cl.raiseExits.delete(raiseExitStart, raiseExitStart2)
+            cl.exits.delete(exitStart, exitStart2)
+
+          stmts.add newStmt(cnkContinueStmt, info, node(label))
+        else:
+          tree.skip(cr) # skip the body
+
       else:
         unreachable(it.kind)
 
       leave(tree, cr)
 
+    cl.disable()
+    # if structured control-flow exits the try statement, the join will enable
+    # translation again
+    join info, target
     leave(tree, cr)
-    res
   of mnkBreak:
     # find the stack index of the enclosing 'block' identified by the break's
-    # label; we use the index as the ID
+    # label
     var idx = cl.blocks.high
-    while idx >= 0 and cl.blocks[idx] != n.label:
+    while idx >= 0 and cl.blocks[idx].input != n.label:
       dec idx
-    newStmt(cnkBreakStmt, info, [newLabelNode(BlockId idx, info)])
+    exit cl.blocks[idx].actual
   of mnkReturn:
-    newNode(cnkReturnStmt, info)
+    exit getReturnLabel(cl)
   of mnkVoid:
     var res = exprToIr(tree, cl, cr)
     if res.typ.isEmptyType():
@@ -703,17 +930,32 @@ proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
     else:
       res = newStmt(cnkVoidStmt, info, [res])
     leave(tree, cr)
-    res
+    stmts.add res
   of mnkIf:
-    to cnkIfStmt, valueToIr(tree, cl, cr), body()
+    let label = newLabel(cl)
+    stmts.add newStmt(cnkIfStmt, info, [valueToIr(tree, cl, cr), node(label)])
+    body()
+    stmts.add newStmt(cnkEnd, info, [node(label)])
+    # if control-flow reaches the ``if`` itself, it also reaches the code
+    # following the ``if``
+    cl.isActive = true
+    leave(tree, cr)
   of mnkRaise:
     # the operand can either be empty or an lvalue expression
-    to cnkRaiseStmt:
-      case tree[cr].kind
-      of mnkNone: atomToIr(tree, cl, cr)
-      else:       lvalueToIr(tree, cl, cr)
+    let
+      arg {.cursor.} = tree.get(cr)
+      res = newStmt(cnkRaiseStmt, info):
+        case arg.kind
+        of mnkNone: newEmpty()
+        else:       lvalueToIr(tree, cl, arg, cr)
+
+    res.add nil # reserve a slot for the label
+    cl.raiseExits.add (res, LabelId(0))
+    stmts.add res
+    cl.disable()
+    leave(tree, cr)
   of mnkCase:
-    caseToIr(tree, env, cl, n, cr)
+    caseToIr(tree, env, cl, n, cr, stmts)
   of mnkAsm:
     toList cnkAsmStmt:
       res.add valueToIr(tree, cl, cr)
@@ -721,31 +963,55 @@ proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
     toList cnkEmitStmt:
       res.add valueToIr(tree, cl, cr)
   of mnkStmtList:
-    toList cnkStmtList:
-      res.kids.addIfNotEmpty stmtToIr(tree, env, cl, cr)
+    while tree[cr].kind != mnkEnd:
+      stmtToIr(tree, env, cl, cr, stmts)
+    leave(tree, cr)
   of mnkScope:
-    toSingleNode scopeToIr(tree, env, cl, cr)
+    scopeToIr(tree, env, cl, cr, stmts)
   of mnkDestroy:
     unreachable("a 'destroy' that wasn't lowered")
   of AllNodeKinds - StmtNodes:
     unreachable(n.kind)
 
 proc caseToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl, n: MirNode,
-              cr: var TreeCursor): CgNode =
+              cr: var TreeCursor, stmts: var seq[CgNode]) =
   assert n.kind == mnkCase
-  result = newStmt(cnkCaseStmt, cr.info, [valueToIr(tree, cl, cr)])
+  let
+    exit = newLabel(cl)
+    result = newStmt(cnkCaseStmt, cr.info, [valueToIr(tree, cl, cr)])
+  # whether the statement has a structured exit is computed manually
+  var doesExit = false
+
+  stmts.add result # add the case statement already
   for j in 0..<n.len:
     let br {.cursor.} = enter(tree, cr)
 
     result.add newTree(cnkBranch, cr.info)
-    if br.len > 0:
-      for x in 0..<br.len:
-        assert tree[cr].kind in {mnkConst, mnkLiteral}
-        result[^1].add atomToIr(tree, cl, cr)
+    for x in 0..<br.len:
+      assert tree[cr].kind in {mnkConst, mnkLiteral}
+      result[^1].add atomToIr(tree, cl, cr)
+
+    let label = newLabel(cl)
+    result[^1].add node(label)
+
+    # start each branch as active again:
+    cl.isActive = true
+
+    join cr.info, label, required=true
+    bodyToIr(tree, env, cl, cr, stmts)
+    if cl.isActive:
+      doesExit = true
+      goto cnkGotoStmt, result.info, exit
 
-    result[^1].add bodyToIr(tree, env, cl, cr)
     leave(tree, cr)
 
+  # we used manual gotos, so emission of a join statement has to be forced
+  join result.info, exit, required=true
+  if doesExit:
+    cl.isActive = true
+  else:
+    cl.disable()
+
   leave(tree, cr)
 
 proc exprToIr(tree: MirBody, cl: var TranslateCl,
@@ -810,8 +1076,13 @@ proc exprToIr(tree: MirBody, cl: var TranslateCl,
 
     treeOp kind:
       res.add argToIr(tree, cl, cr)[1]
-  of mnkCall, mnkCheckedCall:
+  of mnkCall:
     callToIr(tree, cl, n, cr)
+  of mnkCheckedCall:
+    let res = callToIr(tree, cl, n, cr)
+    res.kids.add nil # reserve the slot for the target
+    cl.raiseExits.add (res, LabelId(0))
+    res
   of UnaryOps:
     const Map = [mnkNeg: cnkNeg]
     treeOp Map[n.kind]:
@@ -840,53 +1111,59 @@ proc genDefFor(sym: sink CgNode): CgNode =
     unreachable()
 
 proc scopeToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
-               cr: var TreeCursor, allowExpr = false): seq[CgNode] =
+               cr: var TreeCursor, stmts: var seq[CgNode],
+               allowExpr = false) =
   let
     ends =
       if allowExpr: {mnkEnd} + Atoms
       else:         {mnkEnd}
     prev = cl.defs.len
     prevInUnscoped = cl.inUnscoped
+    start = stmts.len
 
   # a scope is entered, meaning that we're no longer in an unscoped context
   cl.inUnscoped = false
 
-  var stmts: seq[CgNode]
   # translate all statements:
   while cr.hasNext(tree) and tree[cr].kind notin ends:
-    stmts.addIfNotEmpty stmtToIr(tree, env, cl, cr)
+    stmtToIr(tree, env, cl, cr, stmts)
 
   if cr.hasNext(tree) and tree[cr].kind == mnkEnd:
     leave(tree, cr) # close the sub-tree
 
   if cl.defs.len > prev:
-    # insert all the lifted defs at the start
+    # insert all the lifted defs at the start of the scope
     for i in countdown(cl.defs.high, prev):
-      stmts.insert genDefFor(move cl.defs[i])
+      stmts.insert genDefFor(move cl.defs[i]), start
 
     # "pop" the elements that were added as part of this scope:
     cl.defs.setLen(prev)
 
   cl.inUnscoped = prevInUnscoped
 
-  result = stmts
-
 proc tb(tree: MirBody, env: MirEnv, cl: var TranslateCl,
         start: NodePosition): CgNode =
   ## Translate `tree` to the corresponding ``CgNode`` representation.
   var cr = TreeCursor(pos: start.uint32)
-  var nodes = scopeToIr(tree, env, cl, cr, allowExpr=true)
+  var stmts: seq[CgNode]
+  scopeToIr(tree, env, cl, cr, stmts, allowExpr=true)
+  if cl.raiseExits.len > 0:
+    # there's unhandled exceptional control-flow
+    patchResume(cl.raiseExits, 0)
+
+  # emit the join for the return label, if used
+  if cl.returnLabel.isSome:
+    join unknownLineInfo, cl.returnLabel.get()
+
   if cr.hasNext(tree):
     # the tree must be an expression; the last node is required to be an atom
     let x = atomToIr(tree, cl, cr)
-    if nodes.len == 0:
-      x
-    else:
-      nodes.add x
-      newExpr(cnkStmtListExpr, unknownLineInfo, nodes[^1].typ, nodes)
-  else:
-    # it's a statement list
-    toSingleNode nodes
+    stmts.add x
+
+  # XXX: the list of statements is still wrapped in a node for now, but
+  #      this needs to change once all code generators use the new CGIR
+  result = newStmt(cnkStmtList, unknownLineInfo)
+  result.kids = move stmts
 
 proc generateIR*(graph: ModuleGraph, idgen: IdGenerator, env: MirEnv,
                  owner: PSym,
@@ -920,6 +1197,9 @@ proc generateIR*(graph: ModuleGraph, idgen: IdGenerator, env: MirEnv,
       # environment parameter
       add(owner.ast[paramsPos][^1].sym)
 
+  # enable translation:
+  cl.isActive = true
+
   result = Body()
   result.code = tb(body, env, cl, NodePosition 0)
   result.locals = cl.locals
diff --git a/compiler/backend/cgirgen_legacy.nim b/compiler/backend/cgirgen_legacy.nim
new file mode 100644
index 00000000000..cb60ba0eae0
--- /dev/null
+++ b/compiler/backend/cgirgen_legacy.nim
@@ -0,0 +1,920 @@
+## Implements the translation from the MIR to the ``CgNode`` IR. All code
+## reaching the code generation phase passes through here.
+##
+## .. note::
+##   The `tb` prefix that's still used in some places is an abbreviation of
+##   "translate back"
+##
+## .. note::
+##   The ``CgNode`` IR is slated for removal, with the MIR intended to take
+##   its place as the code-generator input.
+
+import
+  std/[
+    tables
+  ],
+  compiler/ast/[
+    ast_types,
+    ast_idgen,
+    ast_query,
+    lineinfos,
+    types
+  ],
+  compiler/backend/[
+    cgir
+  ],
+  compiler/front/[
+    options
+  ],
+  compiler/mir/[
+    mirbodies,
+    mirenv,
+    mirtrees,
+    sourcemaps
+  ],
+  compiler/modules/[
+    modulegraphs
+  ],
+  compiler/utils/[
+    containers,
+    idioms,
+    int128
+  ]
+
+from compiler/ast/ast import newSym, newType, rawAddSon
+from compiler/sem/semdata import makeVarType
+
+type
+  TranslateCl = object
+    graph: ModuleGraph
+    idgen: IdGenerator
+
+    owner: PSym
+
+    tempMap: SeqMap[TempId, LocalId]
+      ## maps a ``TempId`` to the ID of the local created for it
+    localsMap: Table[int, LocalId]
+      ## maps a symbol ID to the corresponding local. Needed because normal
+      ## local variables reach here as ``PSym``s
+    blocks: seq[LabelId]
+      ## the stack of enclosing blocks for the currently processed node
+
+    locals: Store[LocalId, Local]
+      ## the in-progress list of all locals in the translated body
+
+    # a 'def' in the MIR means that the local starts to exist and that it
+    # is accessible in all connected basic blocks part of the enclosing
+    # ``mnkScope``. The ``CgNode`` IR doesn't use the same notion of scope,
+    # so for now, all 'def's (without the initial values) within nested
+    # control-flow-related trees are moved to the start of the enclosing
+    # ``mnkScope``.
+    inUnscoped: bool
+      ## whether the currently processed statement/expression is part of an
+      ## unscoped control-flow context
+    defs: seq[CgNode]
+      ## the stack of locals/globals for which the ``cnkDef``/assignment needs
+      ## to be inserted later
+
+  TreeCursor = object
+    ## A cursor into a ``MirBody``.
+    pos: uint32 ## the index of the currently pointed to node
+    origin {.cursor.}: PNode ## the source node
+
+func newMagicNode(magic: TMagic, info: TLineInfo): CgNode =
+  CgNode(kind: cnkMagic, info: info, magic: magic)
+
+func get(t: MirBody, cr: var TreeCursor): lent MirNode {.inline.} =
+  cr.origin = t.sourceFor(cr.pos.NodePosition)
+  result = t.code[cr.pos]
+
+  inc cr.pos
+
+func enter(t: MirBody, cr: var TreeCursor): lent MirNode {.inline.} =
+  assert t.code[cr.pos].kind in SubTreeNodes, "not a sub-tree"
+  result = get(t, cr)
+
+func leave(t: MirBody, cr: var TreeCursor) =
+  assert t.code[cr.pos].kind == mnkEnd, "not at the end of sub-tree"
+  inc cr.pos
+
+template info(cr: TreeCursor): TLineInfo =
+  cr.origin.info
+
+template `[]`(t: MirBody, cr: TreeCursor): untyped =
+  t.code[cr.pos]
+
+template hasNext(cr: TreeCursor, t: MirBody): bool =
+  cr.pos.int < t.code.len
+
+template `[]=`(x: CgNode, i: Natural, n: CgNode) =
+  x.kids[i] = n
+
+template `[]=`(x: CgNode, i: BackwardsIndex, n: CgNode) =
+  x.kids[i] = n
+
+template add(x: CgNode, y: CgNode) =
+  x.kids.add y
+
+proc copyTree(n: CgNode): CgNode =
+  case n.kind
+  of cnkAtoms:
+    new(result)
+    result[] = n[]
+  of cnkWithOperand:
+    result = CgNode(kind: n.kind, info: n.info, typ: n.typ)
+    result.operand = copyTree(n.operand)
+  of cnkWithItems:
+    result = CgNode(kind: n.kind, info: n.info, typ: n.typ)
+    result.kids.setLen(n.kids.len)
+    for i, it in n.pairs:
+      result[i] = copyTree(it)
+
+proc newEmpty(info = unknownLineInfo): CgNode =
+  CgNode(kind: cnkEmpty, info: info)
+
+proc newTree(kind: CgNodeKind, info: TLineInfo, kids: varargs[CgNode]): CgNode =
+  ## For node kinds that don't represent standalone statements.
+  result = CgNode(kind: kind, info: info)
+  result.kids = @kids
+
+func newTypeNode(info: TLineInfo, typ: PType): CgNode =
+  CgNode(kind: cnkType, info: info, typ: typ)
+
+func newFieldNode(s: PSym; info = unknownLineInfo): CgNode =
+  CgNode(kind: cnkField, info: info, typ: s.typ, field: s)
+
+func newLabelNode(blk: BlockId; info = unknownLineInfo): CgNode =
+  CgNode(kind: cnkLabel, info: info, label: blk)
+
+proc newExpr(kind: CgNodeKind, info: TLineInfo, typ: PType,
+             kids: sink seq[CgNode]): CgNode =
+  ## Variant of ``newExpr`` optimized for passing a pre-existing child
+  ## node sequence.
+  result = CgNode(kind: kind, info: info, typ: typ)
+  result.kids = kids
+
+proc translateLit*(val: PNode): CgNode =
+  ## Translates an ``mnkLiteral`` node to a ``CgNode``.
+  ## Note that the MIR not only uses ``mnkLiteral`` for "real" literals, but
+  ## also for pushing other raw ``PNode``s through the MIR phase.
+  template node(k: CgNodeKind, field, value: untyped): CgNode =
+    CgNode(kind: k, info: val.info, typ: val.typ, field: value)
+
+  case val.kind
+  of nkIntLiterals:
+    # use the type for deciding whether it's a signed or unsigned value
+    case val.typ.skipTypes(abstractRange + {tyEnum}).kind
+    of tyInt..tyInt64, tyBool:
+      node(cnkIntLit, intVal, val.intVal)
+    of tyUInt..tyUInt64, tyChar:
+      node(cnkUIntLit, intVal, val.intVal)
+    of tyPtr, tyPointer, tyProc:
+      # XXX: consider adding a dedicated node for pointer-like-literals
+      #      to both ``PNode`` and ``CgNode``
+      node(cnkUIntLit, intVal, val.intVal)
+    else:
+      unreachable(val.typ.skipTypes(abstractRange).kind)
+  of nkFloatLiterals:
+    case val.typ.skipTypes(abstractRange).kind
+    of tyFloat, tyFloat64:
+      node(cnkFloatLit, floatVal, val.floatVal)
+    of tyFloat32:
+      # all code-generators need to do this at one point, so we help them out
+      # by narrowing the value to a float32 value
+      node(cnkFloatLit, floatVal, val.floatVal.float32.float64)
+    else:
+      unreachable()
+  of nkStrKinds:
+    node(cnkStrLit, strVal, val.strVal)
+  of nkNilLit:
+    newNode(cnkNilLit, val.info, val.typ)
+  of nkNimNodeLit:
+    node(cnkAstLit, astLit, val[0])
+  of nkRange:
+    node(cnkRange, kids, @[translateLit(val[0]), translateLit(val[1])])
+  of nkSym:
+    # special case for raw symbols used with emit and asm statements
+    assert val.sym.kind == skField
+    node(cnkField, field, val.sym)
+  else:
+    unreachable("implement: " & $val.kind)
+
+func addIfNotEmpty(stmts: var seq[CgNode], n: sink CgNode) =
+  ## Only adds the node to the list if it's not an empty node. Used to prevent
+  ## the creation of statement-list expressions that only consist of empty
+  ## nodes + the result-expression (a statement-list expression is unnecessary
+  ## in that case)
+  if n.kind != cnkEmpty:
+    stmts.add n
+
+func toSingleNode(stmts: sink seq[CgNode]): CgNode =
+  ## Creates a single ``CgNode`` from a list of *statements*
+  case stmts.len
+  of 0:
+    result = newEmpty()
+  of 1:
+    result = move stmts[0]
+  else:
+    result = newNode(cnkStmtList)
+    result.kids = stmts
+
+proc newDefaultCall(info: TLineInfo, typ: PType): CgNode =
+  ## Produces the tree for a ``default`` magic call.
+  newExpr(cnkCall, info, typ, [newMagicNode(mDefault, info)])
+
+proc initLocal(s: PSym): Local =
+  ## Inits a ``Local`` with the data from `s`.
+  result = Local(typ: s.typ, flags: s.flags, isImmutable: (s.kind == skLet),
+                 name: s.name)
+  if s.kind in {skVar, skLet, skForVar}:
+    result.alignment = s.alignment.uint32
+
+proc wrapInHiddenAddr(cl: TranslateCl, n: CgNode): CgNode =
+  ## Restores the ``cnkHiddenAddr`` around lvalue expressions passed to ``var``
+  ## parameters. The code-generators operating on ``CgNode``-IR depend on the
+  ## hidden addr to be present
+  if n.typ.skipTypes(abstractInst).kind != tyVar:
+    newOp(cnkHiddenAddr, n.info, makeVarType(cl.owner, n.typ, cl.idgen), n)
+  else:
+    # XXX: is this case ever reached? It should not be. Raw ``var`` values
+    #      must never be passed directly to ``var`` parameters at the MIR
+    #      level
+    n
+
+proc genObjConv(n: CgNode, a, b, t: PType): CgNode =
+  ## Depending on the relationship between `a` and `b`, wraps `n` in either an
+  ## up- or down-conversion. `t` is the type to use for the resulting
+  ## expression
+  let diff = inheritanceDiff(b, a)
+  #echo "a: ", a.sym.name.s, "; b: ", b.sym.name.s
+  #assert diff != 0 and diff != high(int), "redundant or illegal conversion"
+  if diff == 0:
+    return nil
+  result = newOp(
+    if diff < 0: cnkObjUpConv else: cnkObjDownConv,
+    n.info, t): n
+
+# forward declarations:
+proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
+              cr: var TreeCursor): CgNode
+proc scopeToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
+               cr: var TreeCursor, allowExpr=false): seq[CgNode]
+
+proc handleSpecialConv(c: ConfigRef, n: CgNode, info: TLineInfo,
+                       dest: PType): CgNode =
+  ## Checks if a special conversion operator is required for a conversion
+  ## between the source type (i.e. that of `n`) and the destination type.
+  ## If it is, generates the conversion operation IR and returns it -- nil
+  ## otherwise
+  let
+    orig = dest
+    source = n.typ.skipTypes(abstractVarRange)
+    dest = dest.skipTypes(abstractVarRange)
+
+  case dest.kind
+  of tyObject:
+    assert source.kind == tyObject
+    genObjConv(n, source, dest, orig)
+  of tyRef, tyPtr, tyVar, tyLent:
+    assert source.kind == dest.kind
+    if source.base.kind == tyObject:
+      genObjConv(n, source.base, dest.base, orig)
+    else:
+      nil
+  else:
+    nil
+
+proc convToIr(cl: TranslateCl, n: CgNode, info: TLineInfo, dest: PType): CgNode =
+  ## Generates the ``CgNode`` IR for an ``mnkPathConv`` operation (handle
+  ## conversion).
+  result = handleSpecialConv(cl.graph.config, n, info, dest)
+  if result == nil:
+    # no special conversion is used
+    result = newOp(cnkLvalueConv, info, dest, n)
+
+proc atomToIr(n: MirNode, cl: TranslateCl, info: TLineInfo): CgNode =
+  case n.kind
+  of mnkProc:
+    CgNode(kind: cnkProc, info: info, typ: n.typ, prc: n.prc)
+  of mnkGlobal:
+    CgNode(kind: cnkGlobal, info: info, typ: n.typ, global: n.global)
+  of mnkConst:
+    CgNode(kind: cnkConst, info: info, typ: n.typ, cnst: n.cnst)
+  of mnkLocal, mnkParam:
+    # parameters are treated like locals in the code generators
+    assert n.sym.id in cl.localsMap
+    newLocalRef(cl.localsMap[n.sym.id], info, n.sym.typ)
+  of mnkTemp:
+    newLocalRef(cl.tempMap[n.temp], info, n.typ)
+  of mnkAlias:
+    # the type of the node doesn't match the real one
+    let
+      id = cl.tempMap[n.temp]
+      typ = cl.locals[id].typ
+    # the view is auto-dereferenced here for convenience
+    newOp(cnkDerefView, info, typ.base, newLocalRef(id, info, typ))
+  of mnkLiteral:
+    translateLit(n.lit)
+  of mnkType:
+    newTypeNode(info, n.typ)
+  of mnkNone:
+    # type arguments do use `mnkNone` in some situations, so keep
+    # the type
+    CgNode(kind: cnkEmpty, info: info, typ: n.typ)
+  else:
+    unreachable("not an atom: " & $n.kind)
+
+proc atomToIr(tree: MirBody, cl: var TranslateCl,
+              cr: var TreeCursor): CgNode {.inline.} =
+  atomToIr(get(tree, cr), cl, cr.info)
+
+proc tbExceptItem(tree: MirBody, cl: var TranslateCl, cr: var TreeCursor
+                 ): CgNode =
+  let n {.cursor.} = get(tree, cr)
+  case n.kind
+  of mnkLocal:
+    # the 'except' branch acts as a definition for the local
+    let id = cl.locals.add initLocal(n.sym)
+    cl.localsMap[n.sym.id] = id
+    newLocalRef(id, cr.info, n.typ)
+  of mnkType:  newTypeNode(cr.info, n.typ)
+  else:        unreachable()
+
+
+proc lvalueToIr(tree: MirBody, cl: var TranslateCl, n: MirNode,
+                cr: var TreeCursor; preferField = true): CgNode =
+  ## Translates a MIR lvalue expression to the corresponding CG IR.
+  ## Due to tagged unions (currently) not being addressable at the type-
+  ## representation level, the exact meaning of ``mnkPathVariant`` is
+  ## context-dependent -- `preferField` disambiguates whether it should be
+  ## turned into a field access rather than a (pseudo) access of the tagged
+  ## union.
+  let info = cr.info
+
+  template recurse(): CgNode =
+    lvalueToIr(tree, cl, tree.get(cr), cr, false)
+
+  case n.kind
+  of mnkLocal, mnkGlobal, mnkParam, mnkTemp, mnkAlias, mnkConst, mnkProc:
+    return atomToIr(n, cl, info)
+  of mnkPathNamed:
+    result = newExpr(cnkFieldAccess, info, n.typ,
+                     [recurse(), newFieldNode(n.field)])
+  of mnkPathVariant:
+    if preferField:
+      result = newExpr(cnkFieldAccess, cr.info, n.field.typ,
+                      [recurse(), newFieldNode(n.field)])
+    else:
+      # variant access itself has no ``CgNode`` counterpart at the moment
+      result = recurse()
+  of mnkPathPos:
+    result = newExpr(cnkTupleAccess, info, n.typ,
+                     [recurse(),
+                      CgNode(kind: cnkIntLit, intVal: n.position.BiggestInt)])
+  of mnkPathArray:
+    # special case in order to support string literal access
+    # XXX: this needs to be removed once there is a dedicated run-time-
+    #      sequence access operator
+    let arg =
+      if tree[cr].kind == mnkLiteral:
+        atomToIr(tree, cl, cr)
+      else:
+        recurse()
+
+    result = newExpr(cnkArrayAccess, info, n.typ, [arg, atomToIr(tree, cl, cr)])
+  of mnkPathConv:
+    result = convToIr(cl, recurse(), info, n.typ)
+  # dereferences are allowed at the end of a path tree
+  of mnkDeref:
+    result = newOp(cnkDeref, info, n.typ, atomToIr(tree, cl, cr))
+  of mnkDerefView:
+    result = newOp(cnkDerefView, info, n.typ, atomToIr(tree, cl, cr))
+  of AllNodeKinds - LvalueExprKinds - {mnkProc}:
+    unreachable(n.kind)
+
+  leave(tree, cr)
+
+proc lvalueToIr(tree: MirBody, cl: var TranslateCl,
+                cr: var TreeCursor; preferField=true): CgNode {.inline.} =
+  lvalueToIr(tree, cl, tree.get(cr), cr, preferField)
+
+proc valueToIr(tree: MirBody, cl: var TranslateCl,
+               cr: var TreeCursor): CgNode =
+  case tree[cr].kind
+  of mnkProc, mnkConst, mnkGlobal, mnkParam, mnkLocal, mnkTemp, mnkAlias,
+     mnkLiteral, mnkType:
+    atomToIr(tree, cl, cr)
+  of mnkPathPos, mnkPathNamed, mnkPathArray, mnkPathConv, mnkPathVariant,
+     mnkDeref, mnkDerefView:
+    lvalueToIr(tree, cl, cr)
+  else:
+    unreachable("not a value: " & $tree[cr].kind)
+
+proc argToIr(tree: MirBody, cl: var TranslateCl,
+             cr: var TreeCursor): (bool, CgNode) =
+  ## Translates a MIR argument tree to the corresponding CG IR tree.
+  ## Returns both the tree and whether the argument was wrapped in a tag
+  ## operator (which indicates that the parameter is a ``var`` parameter).
+  var n {.cursor.} = tree.get(cr)
+  assert n.kind in ArgumentNodes, "argument node expected: " & $n.kind
+  # the inner node may be a tag node
+  n = tree.get(cr)
+  case n.kind
+  of mnkTag:
+    # it is one, the expression must be an lvalue
+    result = (true, lvalueToIr(tree, cl, cr))
+    leave(tree, cr)
+  of mnkLiteral, mnkType, mnkProc, mnkNone:
+    # not a tag but an atom
+    result = (false, atomToIr(n, cl, cr.info))
+  of LvalueExprKinds:
+    result = (false, lvalueToIr(tree, cl, n, cr))
+  else:
+    unreachable("not a valid argument expression")
+
+  leave(tree, cr)
+
+proc callToIr(tree: MirBody, cl: var TranslateCl, n: MirNode,
+              cr: var TreeCursor): CgNode =
+  ## Translate a valid call-like tree to the CG IR.
+  let info = cr.info
+  result = newExpr((if n.kind == mnkCall: cnkCall else: cnkCheckedCall),
+                   info, n.typ)
+  result.add: # the callee
+    case tree[cr].kind
+    of mnkMagic: newMagicNode(tree.get(cr).magic, info)
+    else:        valueToIr(tree, cl, cr)
+
+  # the code generators currently require some magics to not have any
+  # arguments wrapped in ``cnkHiddenAddr`` nodes
+  let noAddr = result[0].kind == cnkMagic and
+               result[0].magic in FakeVarParams
+
+  # translate the arguments:
+  while tree[cr].kind != mnkEnd:
+    var (mutable, arg) = argToIr(tree, cl, cr)
+    if noAddr:
+      if arg.typ.kind == tyVar:
+        # auto-dereference the view
+        # XXX: prevent this case from happening
+        arg = newOp(cnkDerefView, arg.info, arg.typ.base, arg)
+    elif mutable:
+      arg = wrapInHiddenAddr(cl, arg)
+
+    result.add arg
+
+  leave(tree, cr)
+
+proc exprToIr(tree: MirBody, cl: var TranslateCl, cr: var TreeCursor): CgNode
+
+proc sourceExprToIr(tree: MirBody, cl: var TranslateCl,
+                    cr: var TreeCursor): tuple[n: CgNode, useFast: bool] =
+  ## Translates the MIR expression appearing in an assignment's source
+  ## slot. Assignment modifiers are dropped, and whether a fast assignment or
+  ## normal assignment should be used is computed and returned.
+  case tree[cr].kind
+  of mnkCopy, mnkSink:
+    # requires a full assignment
+    discard enter(tree, cr)
+    result = (valueToIr(tree, cl, cr), false)
+    leave(tree, cr)
+  of mnkMove:
+    # an ``x = move y`` assignment can be turned into a fast assignment
+    discard enter(tree, cr)
+    result = (valueToIr(tree, cl, cr), true)
+    leave(tree, cr)
+  of LvalueExprKinds:
+    # a fast assignment is correct for all raw lvalues
+    result = (lvalueToIr(tree, cl, cr), true)
+  else:
+    # rvalue expressions require a full assignment
+    result = (exprToIr(tree, cl, cr), false)
+
+proc defToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
+           n: MirNode, cr: var TreeCursor): CgNode =
+  ## Translates a 'def'-like construct
+  assert n.kind in DefNodes
+  let
+    entity {.cursor.} = get(tree, cr) # the name of the defined entity
+    info = cr.info
+
+  var def: CgNode
+
+  case entity.kind
+  of mnkLocal:
+    # translate the ``PSym`` to a ``Local`` and establish a mapping
+    let
+      sym = entity.sym
+      id = cl.locals.add initLocal(sym)
+
+    assert sym.id notin cl.localsMap, "re-definition of local"
+    cl.localsMap[sym.id] = id
+
+    def = newLocalRef(id, info, entity.typ)
+  of mnkParam:
+    # ignore 'def's for parameters
+    def = newEmpty()
+  of mnkGlobal:
+    def = CgNode(kind: cnkGlobal, info: info, typ: entity.typ,
+                 global: entity.global)
+  of mnkTemp:
+    # MIR temporaries are like normal locals, with the difference that they
+    # are created ad-hoc and don't have any extra information attached
+    assert entity.typ != nil
+    let tmp = cl.locals.add Local(typ: entity.typ)
+
+    assert entity.temp notin cl.tempMap, "re-definition of temporary"
+    cl.tempMap[entity.temp] = tmp
+
+    def = newLocalRef(tmp, info, entity.typ)
+  of mnkAlias:
+    # MIR aliases are translated to var/lent views
+    assert n.kind in {mnkBind, mnkBindMut}, "alias can only be defined by binds"
+    assert entity.typ != nil
+    let
+      typ = makeVarType(cl.owner, entity.typ, cl.idgen,
+                        if n.kind == mnkBind: tyLent else: tyVar)
+      tmp = cl.locals.add Local(typ: typ)
+
+    assert entity.temp notin cl.tempMap, "re-definition of temporary"
+    cl.tempMap[entity.temp] = tmp
+
+    def = newLocalRef(tmp, info, typ)
+  else:
+    unreachable()
+
+  var arg =
+    if n.kind in {mnkBind, mnkBindMut} and tree[cr].kind in LvalueExprKinds:
+      # don't use the field interpretation for variant access
+      lvalueToIr(tree, cl, cr, preferField=false)
+    else:
+      sourceExprToIr(tree, cl, cr)[0]
+  leave(tree, cr)
+  if n.kind in {mnkBind, mnkBindMut} and arg.typ.kind notin {tyVar, tyLent}:
+    # wrap the operand in an address-of operation
+    arg = newOp(cnkHiddenAddr, info, def.typ, arg)
+
+  let isLet = (entity.kind == mnkTemp and n.kind == mnkDefCursor) or
+              (entity.kind == mnkTemp and not hasDestructor(def.typ)) or
+              (entity.kind == mnkAlias)
+  # to reduce the pressure on the code generator, locals that never cross
+  # structured control-flow boundaries are not lifted. As a temporary
+  # measure, cursor temporaries and aliases are treated as such, but
+  # do note that this is not guaranteed and relies on how `mirgen`
+  # produces MIR code
+
+  case def.kind
+  of cnkLocal:
+    if cl.inUnscoped and not isLet:
+      # add the local to the list of moved definitions and only emit
+      # an assignment
+      cl.defs.add copyTree(def)
+      result =
+        case arg.kind
+        of cnkEmpty: arg
+        else:        newStmt(cnkAsgn, info, [def, arg])
+    else:
+      result = newStmt(cnkDef, info, [def, arg])
+  of cnkGlobal:
+    # there are no defs for globals in the ``CgNode`` IR, so we
+    # emit an assignment that has the equivalent behaviour (in
+    # terms of initialization)
+    case arg.kind
+    of cnkEmpty:
+      if sfImportc in env.globals[def.global].flags:
+        # for imported globals, the 'def' only means that the symbol becomes
+        # known to us, not that it starts its lifetime here -> don't
+        # initialize or move it
+        result = arg
+      elif cl.inUnscoped:
+        # move the default initialization to the start of the scope
+        cl.defs.add def
+        result = arg
+      else:
+        result = newStmt(cnkAsgn, info, [def, newDefaultCall(info, def.typ)])
+    else:
+      if sfImportc notin env.globals[def.global].flags and cl.inUnscoped:
+        # default initialization is required at the start of the scope
+        cl.defs.add def
+      result = newStmt(cnkAsgn, info, [def, arg])
+  of cnkEmpty:
+    result = def
+  else:
+    unreachable()
+
+proc bodyToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
+              cr: var TreeCursor): CgNode =
+  ## Generates the ``CgNode`` tree for the body of a construct that implies
+  ## some form of control-flow.
+  let prev = cl.inUnscoped
+  # assume the body is unscoped until stated otherwise
+  cl.inUnscoped = true
+  result = stmtToIr(tree, env, cl, cr)
+  cl.inUnscoped = prev
+
+proc caseToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl, n: MirNode,
+              cr: var TreeCursor): CgNode
+
+proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
+              cr: var TreeCursor): CgNode =
+  let n {.cursor.} = tree.get(cr)
+  let info = cr.info ## the source information of `n`
+
+  template body(): CgNode =
+    bodyToIr(tree, env, cl, cr)
+
+  template to(kind: CgNodeKind, args: varargs[untyped]): CgNode =
+    let r = newStmt(kind, info, args)
+    leave(tree, cr)
+    r
+
+  template toList(k: CgNodeKind, body: untyped): CgNode =
+    let res {.inject.} = newStmt(k, info)
+    while tree[cr].kind != mnkEnd:
+      body
+    leave(tree, cr)
+    res
+
+  case n.kind
+  of DefNodes:
+    defToIr(tree, env, cl, n, cr)
+  of mnkAsgn, mnkInit, mnkSwitch:
+    let
+      dst = lvalueToIr(tree, cl, cr)
+      (src, useFast) = sourceExprToIr(tree, cl, cr)
+    to (if useFast: cnkFastAsgn else: cnkAsgn), dst, src
+  of mnkRepeat:
+    to cnkRepeatStmt, body()
+  of mnkBlock:
+    cl.blocks.add n.label # push the label to the stack
+    let body = body()
+    cl.blocks.setLen(cl.blocks.len - 1) # pop block from the stack
+    to cnkBlockStmt, newLabelNode(cl.blocks.len.BlockId, info), body
+  of mnkTry:
+    let res = newStmt(cnkTryStmt, info, [body()])
+    assert n.len <= 2
+
+    for _ in 0..<n.len:
+      let it {.cursor.} = enter(tree, cr)
+
+      case it.kind
+      of mnkExcept:
+        for _ in 0..<it.len:
+          let br {.cursor.} = enter(tree, cr)
+          assert br.kind == mnkBranch
+
+          let excpt = newNode(cnkExcept, cr.info)
+          for j in 0..<br.len:
+            excpt.add tbExceptItem(tree, cl, cr)
+
+          excpt.add body()
+          res.add excpt
+
+          leave(tree, cr)
+
+      of mnkFinally:
+        res.add newTree(cnkFinally, cr.info, body())
+      else:
+        unreachable(it.kind)
+
+      leave(tree, cr)
+
+    leave(tree, cr)
+    res
+  of mnkBreak:
+    # find the stack index of the enclosing 'block' identified by the break's
+    # label; we use the index as the ID
+    var idx = cl.blocks.high
+    while idx >= 0 and cl.blocks[idx] != n.label:
+      dec idx
+    newStmt(cnkBreakStmt, info, [newLabelNode(BlockId idx, info)])
+  of mnkReturn:
+    newNode(cnkReturnStmt, info)
+  of mnkVoid:
+    var res = exprToIr(tree, cl, cr)
+    if res.typ.isEmptyType():
+      # a void expression doesn't need to be discarded
+      discard
+    else:
+      res = newStmt(cnkVoidStmt, info, [res])
+    leave(tree, cr)
+    res
+  of mnkIf:
+    to cnkIfStmt, valueToIr(tree, cl, cr), body()
+  of mnkRaise:
+    # the operand can either be empty or an lvalue expression
+    to cnkRaiseStmt:
+      case tree[cr].kind
+      of mnkNone: atomToIr(tree, cl, cr)
+      else:       lvalueToIr(tree, cl, cr)
+  of mnkCase:
+    caseToIr(tree, env, cl, n, cr)
+  of mnkAsm:
+    toList cnkAsmStmt:
+      res.add valueToIr(tree, cl, cr)
+  of mnkEmit:
+    toList cnkEmitStmt:
+      res.add valueToIr(tree, cl, cr)
+  of mnkStmtList:
+    toList cnkStmtList:
+      res.kids.addIfNotEmpty stmtToIr(tree, env, cl, cr)
+  of mnkScope:
+    toSingleNode scopeToIr(tree, env, cl, cr)
+  of mnkDestroy:
+    unreachable("a 'destroy' that wasn't lowered")
+  of AllNodeKinds - StmtNodes:
+    unreachable(n.kind)
+
+proc caseToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl, n: MirNode,
+              cr: var TreeCursor): CgNode =
+  assert n.kind == mnkCase
+  result = newStmt(cnkCaseStmt, cr.info, [valueToIr(tree, cl, cr)])
+  for j in 0..<n.len:
+    let br {.cursor.} = enter(tree, cr)
+
+    result.add newTree(cnkBranch, cr.info)
+    if br.len > 0:
+      for x in 0..<br.len:
+        assert tree[cr].kind in {mnkConst, mnkLiteral}
+        result[^1].add atomToIr(tree, cl, cr)
+
+    result[^1].add bodyToIr(tree, env, cl, cr)
+    leave(tree, cr)
+
+  leave(tree, cr)
+
+proc exprToIr(tree: MirBody, cl: var TranslateCl,
+              cr: var TreeCursor): CgNode =
+  ## Translates a MIR expression to the corresponding CG IR representation.
+  ## Moves the cursor to the next tree item.
+  let n {.cursor.} = get(tree, cr)
+  let info = cr.info
+
+  template op(kind: CgNodeKind, e: CgNode): CgNode =
+    let r = newOp(kind, info, n.typ, e)
+    leave(tree, cr)
+    r
+
+  template treeOp(k: CgNodeKind, body: untyped): CgNode =
+    let res {.inject.} = newExpr(k, info, n.typ)
+    while tree[cr].kind != mnkEnd:
+      body
+    leave(tree, cr)
+    res
+
+  case n.kind
+  of Atoms:
+    atomToIr(n, cl, info)
+  of mnkPathVariant, mnkPathArray, mnkPathConv, mnkPathNamed, mnkPathPos:
+    lvalueToIr(tree, cl, n, cr)
+  of mnkCast:
+    op cnkCast, valueToIr(tree, cl, cr)
+  of mnkConv:
+    op cnkConv, valueToIr(tree, cl, cr)
+  of mnkStdConv:
+    op cnkHiddenConv, valueToIr(tree, cl, cr)
+  of mnkToSlice:
+    treeOp cnkToSlice:
+      res.add valueToIr(tree, cl, cr)
+  of mnkAddr:
+    op cnkAddr, lvalueToIr(tree, cl, cr)
+  of mnkDeref:
+    op cnkDeref, atomToIr(tree, cl, cr)
+  of mnkView:
+    op cnkHiddenAddr, lvalueToIr(tree, cl, cr)
+  of mnkDerefView:
+    op cnkDerefView, atomToIr(tree, cl, cr)
+  of mnkObjConstr:
+    assert n.typ.skipTypes(abstractVarRange).kind in {tyObject, tyRef}
+    treeOp cnkObjConstr:
+      let f = newFieldNode(get(tree, cr).field)
+      res.add newTree(cnkBinding, cr.info, [f, argToIr(tree, cl, cr)[1]])
+  of mnkConstr:
+    let typ = n.typ.skipTypes(abstractVarRange)
+
+    let kind =
+      case typ.kind
+      of tySet:               cnkSetConstr
+      of tyArray, tySequence: cnkArrayConstr
+      of tyTuple:             cnkTupleConstr
+      of tyProc:
+        assert typ.callConv == ccClosure
+        cnkClosureConstr
+      else:
+        unreachable(typ.kind)
+
+    treeOp kind:
+      res.add argToIr(tree, cl, cr)[1]
+  of mnkCall, mnkCheckedCall:
+    callToIr(tree, cl, n, cr)
+  of UnaryOps:
+    const Map = [mnkNeg: cnkNeg]
+    treeOp Map[n.kind]:
+      res.add valueToIr(tree, cl, cr)
+  of BinaryOps:
+    const Map = [mnkAdd: cnkAdd, mnkSub: cnkSub,
+                 mnkMul: cnkMul, mnkDiv: cnkDiv, mnkModI: cnkModI]
+    treeOp Map[n.kind]:
+      res.kids = @[valueToIr(tree, cl, cr), valueToIr(tree, cl, cr)]
+  of mnkCopy, mnkMove, mnkSink:
+    # translation of assignments needs to handle all modifiers
+    unreachable("loose assignment modifier")
+  of AllNodeKinds - ExprKinds - {mnkNone}:
+    unreachable(n.kind)
+
+proc genDefFor(sym: sink CgNode): CgNode =
+  ## Produces the statement tree of a definition for the given symbol-like
+  ## node. Globals use an assignment.
+  case sym.kind
+  of cnkLocal:
+    newStmt(cnkDef, sym.info, [sym, newEmpty()])
+  of cnkGlobal:
+    # emulate the default-initialization behaviour
+    newStmt(cnkAsgn, sym.info, [sym, newDefaultCall(sym.info, sym.typ)])
+  else:
+    unreachable()
+
+proc scopeToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
+               cr: var TreeCursor, allowExpr = false): seq[CgNode] =
+  let
+    ends =
+      if allowExpr: {mnkEnd} + Atoms
+      else:         {mnkEnd}
+    prev = cl.defs.len
+    prevInUnscoped = cl.inUnscoped
+
+  # a scope is entered, meaning that we're no longer in an unscoped context
+  cl.inUnscoped = false
+
+  var stmts: seq[CgNode]
+  # translate all statements:
+  while cr.hasNext(tree) and tree[cr].kind notin ends:
+    stmts.addIfNotEmpty stmtToIr(tree, env, cl, cr)
+
+  if cr.hasNext(tree) and tree[cr].kind == mnkEnd:
+    leave(tree, cr) # close the sub-tree
+
+  if cl.defs.len > prev:
+    # insert all the lifted defs at the start
+    for i in countdown(cl.defs.high, prev):
+      stmts.insert genDefFor(move cl.defs[i])
+
+    # "pop" the elements that were added as part of this scope:
+    cl.defs.setLen(prev)
+
+  cl.inUnscoped = prevInUnscoped
+
+  result = stmts
+
+proc tb(tree: MirBody, env: MirEnv, cl: var TranslateCl,
+        start: NodePosition): CgNode =
+  ## Translate `tree` to the corresponding ``CgNode`` representation.
+  var cr = TreeCursor(pos: start.uint32)
+  var nodes = scopeToIr(tree, env, cl, cr, allowExpr=true)
+  if cr.hasNext(tree):
+    # the tree must be an expression; the last node is required to be an atom
+    let x = atomToIr(tree, cl, cr)
+    if nodes.len == 0:
+      x
+    else:
+      nodes.add x
+      newExpr(cnkStmtListExpr, unknownLineInfo, nodes[^1].typ, nodes)
+  else:
+    # it's a statement list
+    toSingleNode nodes
+
+proc generateIR*(graph: ModuleGraph, idgen: IdGenerator, env: MirEnv,
+                 owner: PSym,
+                 body: sink MirBody): Body =
+  ## Generates the ``CgNode`` IR corresponding to the input MIR `body`,
+  ## using `idgen` to provide new IDs when creating symbols.
+  var cl = TranslateCl(graph: graph, idgen: idgen, owner: owner)
+  if owner.kind in routineKinds:
+    # setup the locals and associated mappings for the parameters
+    template add(v: PSym) =
+      let s = v
+      cl.localsMap[s.id] = cl.locals.add initLocal(s)
+
+    let sig =
+      if owner.kind == skMacro: owner.internal
+      else:                     owner.typ
+
+    # result variable:
+    if sig[0].isEmptyType():
+      # always reserve a slot for the result variable, even if the latter is
+      # not present
+      discard cl.locals.add(Local())
+    else:
+      add(owner.ast[resultPos].sym)
+
+    # normal parameters:
+    for i in 1..<sig.len:
+      add(sig.n[i].sym)
+
+    if sig.callConv == ccClosure:
+      # environment parameter
+      add(owner.ast[paramsPos][^1].sym)
+
+  result = Body()
+  result.code = tb(body, env, cl, NodePosition 0)
+  result.locals = cl.locals
diff --git a/compiler/backend/cgirutils.nim b/compiler/backend/cgirutils.nim
index f68f8fbd214..b5f361b401f 100644
--- a/compiler/backend/cgirutils.nim
+++ b/compiler/backend/cgirutils.nim
@@ -59,7 +59,8 @@ proc treeRepr*(n: CgNode): string =
     of cnkMagic:
       result.add "magic: "
       result.add $n.magic
-    of cnkEmpty, cnkInvalid, cnkType, cnkAstLit, cnkNilLit, cnkReturnStmt:
+    of cnkEmpty, cnkInvalid, cnkType, cnkAstLit, cnkNilLit, cnkReturnStmt,
+       cnkResume:
       discard
     of cnkWithOperand:
       result.add "\n"
diff --git a/compiler/backend/compat.nim b/compiler/backend/compat.nim
index a0db57b1383..22f5f5def2e 100644
--- a/compiler/backend/compat.nim
+++ b/compiler/backend/compat.nim
@@ -205,3 +205,8 @@ proc pick*[T](n: CgNode, forInt, forFloat: T): T =
   of tyFloat..tyFloat64:       forFloat
   else:
     unreachable("not an integer or float type")
+
+func numArgs*(n: CgNode): int {.inline.} =
+  ## Returns the number of arguments for a call-like node. The callee
+  ## is excluded.
+  n.len - 1 - ord(n.kind == cnkCheckedCall)
diff --git a/compiler/backend/jsbackend.nim b/compiler/backend/jsbackend.nim
index 6c3cc7e1dbd..55069b22b5a 100644
--- a/compiler/backend/jsbackend.nim
+++ b/compiler/backend/jsbackend.nim
@@ -74,11 +74,11 @@ proc processEvent(g: PGlobals, graph: ModuleGraph, modules: BModuleList,
       p = startProc(g, bmod, evt.id, Body())
       partial[evt.sym.id] = p
 
-    let body = generateIR(graph, bmod.idgen, g.env, evt.sym, evt.body)
+    let body = generateIRLegacy(graph, bmod.idgen, g.env, evt.sym, evt.body)
     genPartial(p, merge(p.fullBody, body))
   of bekProcedure:
     let
-      body = generateIR(graph, bmod.idgen, g.env, evt.sym, evt.body)
+      body = generateIRLegacy(graph, bmod.idgen, g.env, evt.sym, evt.body)
       r = genProc(g, bmod, evt.id, body)
 
     if sfCompilerProc in evt.sym.flags:
@@ -115,7 +115,8 @@ proc generateCodeForMain(globals: PGlobals, graph: ModuleGraph, m: BModule,
 
   let owner = m.module
   genTopLevelStmt(globals, m):
-    canonicalize(graph, m.idgen, globals.env, owner, body, TranslationConfig())
+    canonicalize(graph, m.idgen, globals.env, owner, body, TranslationConfig(),
+                 legacy=true)
 
 proc generateCode*(graph: ModuleGraph, mlist: sink ModuleList) =
   ## Entry point into the JS backend. Generates the code for all modules and
diff --git a/compiler/backend/jsgen.nim b/compiler/backend/jsgen.nim
index 58e66953a1a..20a020ff7cc 100644
--- a/compiler/backend/jsgen.nim
+++ b/compiler/backend/jsgen.nim
@@ -2447,7 +2447,7 @@ proc gen(p: PProc, n: CgNode, r: var TCompRes) =
   of cnkTryStmt: genTry(p, n)
   of cnkRaiseStmt: genRaiseStmt(p, n)
   of cnkInvalid, cnkMagic, cnkRange, cnkBinding, cnkExcept, cnkFinally,
-     cnkBranch, cnkAstLit, cnkLabel, cnkStmtListExpr, cnkField:
+     cnkBranch, cnkAstLit, cnkLabel, cnkStmtListExpr, cnkField, cnkNewCfNodes:
     internalError(p.config, n.info, "gen: unknown node type: " & $n.kind)
 
 proc newModule*(g: ModuleGraph; module: PSym): BModule =
diff --git a/compiler/front/condsyms.nim b/compiler/front/condsyms.nim
index d50a5b440ed..8bad92d1f8d 100644
--- a/compiler/front/condsyms.nim
+++ b/compiler/front/condsyms.nim
@@ -74,3 +74,4 @@ proc initDefines*(symbols: StringTableRef) =
   defineSymbol("nimskullReworkStaticExec")
   defineSymbol("nimskullNoMagicNewAssign")
   defineSymbol("nimskullNoFloat128")
+  defineSymbol("nimskullNewExceptionRt")
diff --git a/compiler/mir/mirbridge.nim b/compiler/mir/mirbridge.nim
index 9660d81eacd..19b58d19467 100644
--- a/compiler/mir/mirbridge.nim
+++ b/compiler/mir/mirbridge.nim
@@ -10,6 +10,7 @@ import
   compiler/backend/[
     cgir,
     cgirgen,
+    cgirgen_legacy,
     cgirutils
   ],
   compiler/front/[
@@ -76,7 +77,8 @@ proc echoOutput*(config: ConfigRef, owner: PSym, body: Body) =
       config.writeln(treeRepr(body.code))
 
 proc canonicalize*(graph: ModuleGraph, idgen: IdGenerator, env: var MirEnv,
-                   owner: PSym, body: PNode, config: TranslationConfig): Body =
+                   owner: PSym, body: PNode, config: TranslationConfig;
+                   legacy=false): Body =
   ## Legacy routine. Translates the body `body` of the procedure `owner` to
   ## MIR code, and the MIR code to ``CgNode`` IR.
   echoInput(graph.config, owner, body)
@@ -85,5 +87,8 @@ proc canonicalize*(graph: ModuleGraph, idgen: IdGenerator, env: var MirEnv,
   echoMir(graph.config, owner, body)
 
   # step 2: generate the ``CgNode`` tree
-  result = generateIR(graph, idgen, env, owner, body)
+  if legacy:
+    result = cgirgen_legacy.generateIR(graph, idgen, env, owner, body)
+  else:
+    result = cgirgen.generateIR(graph, idgen, env, owner, body)
   echoOutput(graph.config, owner, result)
\ No newline at end of file
diff --git a/compiler/vm/vmbackend.nim b/compiler/vm/vmbackend.nim
index 4084bce8c8a..280cccafcab 100644
--- a/compiler/vm/vmbackend.nim
+++ b/compiler/vm/vmbackend.nim
@@ -126,7 +126,7 @@ proc generateCodeForProc(c: var CodeGenCtx, idgen: IdGenerator, s: PSym,
   ## Generates and the bytecode for the procedure `s` with body `body`. The
   ## resulting bytecode is emitted into the global bytecode section.
   let
-    body = generateIR(c.graph, idgen, c.env, s, body)
+    body = generateIRLegacy(c.graph, idgen, c.env, s, body)
     r    = genProc(c, s, body)
 
   if r.isOk:
@@ -181,7 +181,7 @@ proc processEvent(c: var GenCtx, mlist: ModuleList, discovery: var DiscoveryData
   of bekPartial:
     let p = addr mgetOrPut(partial, evt.id, PartialProc(sym: evt.sym))
     discard merge(p.body):
-      generateIR(c.graph, idgen, c.gen.env, evt.sym, evt.body)
+      generateIRLegacy(c.graph, idgen, c.gen.env, evt.sym, evt.body)
   of bekProcedure:
     # a complete procedure became available
     let r = generateCodeForProc(c.gen, idgen, evt.sym, evt.body)
diff --git a/compiler/vm/vmgen.nim b/compiler/vm/vmgen.nim
index 7d99e1cd1f1..8744d567cf2 100644
--- a/compiler/vm/vmgen.nim
+++ b/compiler/vm/vmgen.nim
@@ -3200,7 +3200,8 @@ proc gen(c: var TCtx; n: CgNode; dest: var TDest) =
   of cnkAsmStmt, cnkEmitStmt:
     unused(c, n, dest)
   of cnkInvalid, cnkMagic, cnkRange, cnkExcept, cnkFinally, cnkBranch,
-     cnkBinding, cnkLabel, cnkStmtListExpr, cnkField, cnkToSlice:
+     cnkBinding, cnkLabel, cnkStmtListExpr, cnkField, cnkToSlice,
+     cnkNewCfNodes:
     unreachable(n.kind)
 
 proc initProc(c: TCtx, owner: PSym, body: sink Body): BProc =
diff --git a/compiler/vm/vmjit.nim b/compiler/vm/vmjit.nim
index 1b9a96a6e11..3913cbf5bf2 100644
--- a/compiler/vm/vmjit.nim
+++ b/compiler/vm/vmjit.nim
@@ -154,7 +154,7 @@ proc generateMirCode(c: var TCtx, env: var MirEnv, n: PNode;
     result.code = finish(bu)
 
 proc generateIR(c: var TCtx, env: MirEnv, body: sink MirBody): Body =
-  backends.generateIR(c.graph, c.idgen, env, c.module, body)
+  backends.generateIRLegacy(c.graph, c.idgen, env, c.module, body)
 
 proc setupRootRef(c: var TCtx) =
   ## Sets up if the ``RootRef`` type for the type info cache. This
@@ -271,7 +271,7 @@ proc genProc(jit: var JitState, c: var TCtx, s: PSym): VmGenResult =
   for _ in discover(jit.gen.env, cp):
     discard "nothing to register"
 
-  let outBody = generateIR(c.graph, c.idgen, jit.gen.env, s, mirBody)
+  let outBody = generateIRLegacy(c.graph, c.idgen, jit.gen.env, s, mirBody)
   echoOutput(c.config, s, outBody)
 
   try:
diff --git a/doc/mir.rst b/doc/mir.rst
index ac7fff3ac45..df09c8c6b9d 100644
--- a/doc/mir.rst
+++ b/doc/mir.rst
@@ -48,6 +48,15 @@ Semantics
         | <Type>
         | LVALUE
 
+  INTERMEDIATE_TARGET = <Label>
+                      | Leave <Label>
+
+  TARGET = <Label>
+         | TargetList INTERMEDIATE_TARGET ... <Label>
+
+  EX_TARGET = TARGET
+            | TargetList INTERMEDIATE_TARGET ... Resume
+
   UNARY_OP = NegI VALUE
 
   BINARY_OP = AddI VALUE, VALUE
@@ -78,12 +87,17 @@ Semantics
                                          # one for which the behaviour cannot
                                          # be represented in the MIR)
 
-  # checked calls have the same shape as normal calls. The difference is that
-  # the call has an exceptional exit (i.e., it might raise an exception)
+  # (legacy) checked calls have the same shape as normal calls. The difference
+  # is that the call has an exceptional exit (i.e., it might raise an
+  # exception)
   CHECKED_CALL_EXPR = CheckedCall <Proc> CALL_ARG ...
                     | CheckedCall LVALUE CALL_ARG ...
                     | CheckedCall <Magic> CALL_ARG ...
 
+  CHECKED_CALL_EXPR = CheckedCall <Proc> CALL_ARG ...  EX_TARGET
+                    | CheckedCall LVALUE CALL_ARG ...  EX_TARGET
+                    | CheckedCall <Magic> CALL_ARG ... EX_TARGET
+
 
   RVALUE = UNARY_OP
          | BINARY_OP
@@ -150,7 +164,10 @@ Semantics
             | Switch LVALUE ASGN_SRC    # changes the active branch of a
                                         # variant. Unclear semantics.
             | If VALUE STATEMENT        # if the value evaluates to true
-                                        # execute the statement
+                                        # execute the statement (legacy)
+            | If VALUE <Label>          # fall through if the value evaluates
+                                        # to true, otherwise jump to the if's
+                                        # corresponding end
             | Case VALUE BRANCH_LIST    # dispatch to one of the branches based
                                         # on the value, where value must be
                                         # either of integer, float, or string
@@ -158,13 +175,16 @@ Semantics
             | Block <Label> STATEMENT   # run the wrapped statement and provide
                                         # a named exit. The label must be
                                         # unique across all blocks in the
-                                        # procedure
+                                        # procedure (legacy)
             | Break <Label>             # exit the enclosing block that has the
-                                        # given label
+                                        # given label (legacy)
             | Repeat STATEMENT          # unconditional loop. Repeat the
                                         # statement for an indefinite amount
-                                        # of times
-            | TRY_STMT
+                                        # of times (legacy)
+            | TRY_STMT                  # (legacy)
+            | Goto TARGET
+            | Loop <Label>              # unconditional jump back to the start
+                                        # of a loop
             | Raise LVALUE              # push the given exception to the
                                         # exception stack and start exceptional
                                         # control-flow. The `ref object` is
@@ -172,14 +192,27 @@ Semantics
             | Raise <None>              # re-raise the current exception
             | Return                    # exit the procedure, but execute all
                                         # enclosing finalizers first (from
-                                        # innermost to outermost)
+                                        # innermost to outermost) (legacy)
             | Destroy LVALUE
+            | Raise LVALUE EX_TARGET
+            | Raise <None> EX_TARGET
+            | Join <Label>              # join point for non-exceptional
+                                        # control-flow (e.g., goto)
+            | LoopJoin <Label>          # join point for `Loop`
+            | Except <Type> ... EX_TARGET
+            | Except <Local> EX_TARGET
+            | Except                    # catch-all handler
+            | Finally <Label>
+            | Continue <Label> (<Label> | Resume) ...
+            | End <Label>               # marks the end of an if, repeat, or
+                                        # except
             | Emit VALUE ...
             | Asm VALUE ...
 
   BRANCH_LABEL = <Literal>
                | <Const>
   BRANCH_LIST = (Branch BRANCH_LABEL ... STATEMENT) ... # a list of branches
+              | (Branch BRANCH_LABEL ... TARGET) ...
 
   EXCEPT_BRANCH = Branch <Type> ... STATEMENT # exception handler
                 | Branch <Local>    STATEMENT # exception handler for imported
@@ -219,6 +252,110 @@ be read from during execution of the procedure.
 This information is intended for use by data-flow analysis and code
 generators.
 
+
+Control Flow Representation
+===========================
+
+.. note:: This only covers the new control-flow primitives.
+
+Terminology:
+* *basic block*: a basic block is a region of statements that contains no
+  jumps and is not jumped into
+* *label*: identifies a control-flow-related construct
+* *terminator*: marks the end of a basic block
+
+A basic block is started by `Finally` and `Except`. Terminators are: `Case`,
+`Goto`, `Raise`, `Continue`, and `Loop`. `If`, `Join`, and `LoopJoin` act as
+both the start and end of a basic block. The nature of `End` depends on the
+associated construct:
+* for `If`, it acts as both a terminator and start of a basic block
+* for `Except`, it only marks the end of the section
+
+Except for `Loop`, all terminators only allow forward control-flow.
+
+Structured Constructs
+---------------------
+
+Each `If` and `Except` must be paired with exactly one `End`, each `LoopJoin`
+with a `Loop`, and each `Finally` with a `Continue`. These are the
+*structured* constructs, and they must not overlap each other, meaning
+that:
+
+.. code-block::
+
+  if x (L1)
+  if y (L2)
+  end L1
+  end L2
+
+is not allowed. However, much like in the high-level language, structured
+constructs can be nested.
+
+Target Lists
+------------
+
+`Goto`, `Raise`, `Except`, and `CheckedCall` support *target lists*. The
+target list specifies intermediate jump targets as well as which sections
+are exited. Take, for example:
+
+.. code-block::
+
+  goto [Leave L1, L2, Leave L3, L4]
+
+What this means is the following:
+1. leave the section (`Except` or `Finally`) identified by label L1
+2. enter the `Finally` section identified by label L2
+3. leave the section identified by label L3
+4. land at the `Finally` or `Join` identified by label L4
+
+An example of code that would result in such a `Goto`:
+
+.. code-block:: nim
+
+  block L4:
+    try:
+      ...
+    finally:
+      try:
+        try:
+          ...
+        finally:
+          break L4 # this would translate to the aforementioned goto
+      finally:
+        ...
+
+In the context of exceptional control-flow, the final target must be either
+a `Finally` or an `Except`, otherwise it must be either a `Finally` or `Join`.
+
+Resume
+------
+
+`Resume` is a special jump target that may only appear as the final target of
+`Raise`, `CheckedCall`, and `Except`. It specifies that unwinding/exception-
+handling *resumes* in the caller procedure.
+
+Exception Handler
+-----------------
+
+`Except` represents an exception handler. If types or a local is specified,
+the section is only entered if the run-time type of the active exception
+matches the section's filters. If there's a match, execution continues with
+the statement following the `Except`, otherwise it continues at the target
+specified by the `Except`.
+
+Finally Sections
+----------------
+
+A `Finally` section is used as an intermediate target in a jump chain. Where
+the `Continue` statement marking the end of the section jumps to depends on
+the *target list* the entered `Finally` is part of. For example, with
+`Goto [L1, L2]`, the `Continue` of the `Finally` section identified by L1
+would jump to L2.
+
+The `Continue` must be present even if it is never actually reached. In this
+case, the `Finally` section may only appear as the final target in a target
+list.
+
 Storage
 =======
 
diff --git a/lib/system/excpt.nim b/lib/system/excpt.nim
index 74da1d65c6b..8603fce28b7 100644
--- a/lib/system/excpt.nim
+++ b/lib/system/excpt.nim
@@ -67,6 +67,13 @@ type
     len: int
     prev: ptr GcFrameHeader
 
+  ExceptionFrame {.compilerproc.} = object
+    ## Represents an exception handler (i.e., an ``except`` section).
+    prev: ptr ExceptionFrame
+      ## previous frame, or nil
+    exc: ref Exception
+      ## always non-nil
+
 when NimStackTraceMsgs:
   var frameMsgBuf* {.threadvar.}: string
 var
@@ -74,6 +81,12 @@ var
   currException {.threadvar.}: ref Exception
   gcFramePtr {.threadvar.}: GcFrame
 
+  handlers {.threadvar.}: ptr ExceptionFrame
+    ## linked list of all active handlers in the current thread
+  activeException {.threadvar.}: ref Exception
+    ## stack of in-flight exceptions. An exception stops being in-flight once
+    ## an ``except`` section "catches" it.
+
 type
   FrameState = tuple[gcFramePtr: GcFrame, framePtr: PFrame,
                      currException: ref Exception]
@@ -118,11 +131,13 @@ proc pushGcFrame*(s: GcFrame) {.compilerRtl, inl.} =
   gcFramePtr = s
 
 proc pushCurrentException(e: sink(ref Exception)) {.compilerRtl, inl.} =
+  # XXX: legacy runtime procedure only used by the csources compiler
   e.up = currException
   currException = e
   #showErrorMessage2 "A"
 
 proc popCurrentException {.compilerRtl, inl.} =
+  # XXX: legacy runtime procedure only used by the csources compiler
   currException = currException.up
   #showErrorMessage2 "B"
 
@@ -412,6 +427,13 @@ when true:
       currException = nil
       quit(1)
 
+proc pushActiveException(e: sink(ref Exception)) =
+  e.up = activeException
+  activeException = e
+  # FIXME: don't set the current exception here; it's only done this way for
+  #        backwards compatibility
+  currException = e # set the current exception already
+
 proc raiseExceptionAux(e: sink(ref Exception)) {.nodestroy.} =
   when defined(nimPanics):
     # XXX: the compiler should reject raise being used with defects. User-code
@@ -425,7 +447,10 @@ proc raiseExceptionAux(e: sink(ref Exception)) {.nodestroy.} =
   if globalRaiseHook != nil:
     if not globalRaiseHook(e): return
 
-  pushCurrentException(e)
+  when defined(nimskullNewExceptionRt):
+    pushActiveException(e)
+  else:
+    pushCurrentException(e)
   inc nimInErrorMode
 
 proc prepareException(e: ref Exception, ename: cstring) {.compilerRtl.} =
@@ -467,10 +492,16 @@ proc raiseException(e: sink(ref Exception), ename: cstring) {.compilerRtl.} =
   raiseExceptionEx(e, ename, nil, nil, 0)
 
 proc reraiseException() {.compilerRtl.} =
-  if currException == nil:
-    sysFatal(ReraiseDefect, "no exception to reraise")
-  else:
+  when defined(nimskullNewExceptionRt):
+    # the compiler makes sure that a re-raise only takes place within an
+    # exception handler
+    pushActiveException(move handlers.exc)
     inc nimInErrorMode
+  else:
+    if currException == nil:
+      sysFatal(ReraiseDefect, "no exception to reraise")
+    else:
+      inc nimInErrorMode
 
 proc threadTrouble() =
   # also forward declared, it is 'raises: []' hence the try-except.
@@ -534,6 +565,71 @@ proc nimFrame(s: PFrame) {.compilerRtl, inl, raises: [].} =
   framePtr = s
   if s.calldepth == nimCallDepthLimit: callDepthLimitReached()
 
+# v2 exception handling runtime
+# -----------------------------
+
+{.push stacktrace: off, checks: off.}
+
+proc nimCatchException(frame: ptr ExceptionFrame) {.compilerproc.} =
+  ## Pops the top-most in-flight exception from the stack, stores it in
+  ## `frame`, and sets it as the current exception. `frame` is pushed to the
+  ## handler stack.
+  # zero-initialize the location first
+  nimZeroMem(frame, sizeof(ExceptionFrame))
+  frame.prev = handlers
+  frame.exc = activeException
+  # push to handler stack:
+  handlers = frame
+
+  currException = activeException
+  # "pop" the exception from the active stack. Moving from the up pointer
+  # makes sure the caught exception is properly disconnected:
+  activeException = move activeException.up
+
+proc restoreCurrentEx() =
+  # FIXME: don't consider active exceptions; it's only done this way for
+  #        backwards compatibility
+  if handlers.isNil or handlers.exc.isNil:
+    currException = activeException
+  elif handlers.exc.up == activeException:
+    # the active handler is more recent than the most-recent active exception
+    currException = handlers.exc
+  else:
+    # the active exception was raised after the most-recent handler was entered
+    currException = activeException
+
+proc nimLeaveExcept() {.compilerproc, inline.} =
+  ## Called when an exception handler is exited. Pops the top-most frame from
+  ## the handler stack. Supports being called during unwinding.
+  var wasInErrorMode = nimInErrorMode
+  nimInErrorMode = false
+  handlers.exc = nil # cleanup the ref
+  handlers = handlers.prev
+  restoreCurrentEx()
+  nimInErrorMode = wasInErrorMode
+
+proc nimAbortException() {.compilerproc.} =
+  ## Abort (i.e., discard) an in-flight exception. Must only be called if an
+  ## exception is actually in-flight.
+  var wasInErrorMode = nimInErrorMode
+  # disable error mode right away
+  nimInErrorMode = false
+
+  if wasInErrorMode:
+    # if an exception is aborted by raising another exception, don't pop the
+    # active exception; drop its parent
+    if activeException.up != nil:
+      activeException.up = activeException.up.up
+  else:
+    activeException = activeException.up
+
+  restoreCurrentEx()
+  nimInErrorMode = wasInErrorMode
+
+{.pop.}
+
+# -----
+
 when not defined(noSignalHandler) and not defined(useNimRtl):
   type Sighandler = proc (a: cint) {.noconv, benign.}
     # xxx factor with ansi_c.CSighandlerT, posix.Sighandler
diff --git a/tests/exception/tfinally6.nim b/tests/exception/tfinally6.nim
index 05c747645d0..2c731759df7 100644
--- a/tests/exception/tfinally6.nim
+++ b/tests/exception/tfinally6.nim
@@ -3,7 +3,7 @@ discard """
     Multiple tests regarding ``finally`` interaction with exception handlers
     and raised exceptions.
   '''
-  knownIssue.c js: "The current exception is not properly cleared"
+  knownIssue.js: "The current exception is not properly cleared"
 """
 
 var steps: seq[int]
diff --git a/tests/exception/tleave_except2.nim b/tests/exception/tleave_except2.nim
new file mode 100644
index 00000000000..63ee9496ae5
--- /dev/null
+++ b/tests/exception/tleave_except2.nim
@@ -0,0 +1,87 @@
+discard """
+  description: '''
+    Ensure that leaving an `except` section by raising an exception properly
+    updates the current exception.
+  '''
+  knownIssue.js vm: "The current exception is not reset properly"
+"""
+
+var steps: seq[string]
+
+type Ex = object of CatchableError
+
+proc `=destroy`(x: var Ex) =
+  steps.add x.msg
+
+template postcondition() =
+  # ensure that the exceptions were destroyed in the correct order
+  when defined(gcOrc) or defined(gcArc):
+    doAssert steps == ["1", "2"]
+
+# -------------
+# test case 1: local raise and local exception handler
+
+proc test1() =
+  try:
+    try:
+      raise Ex.newException("1")
+    except Ex as e:
+      doAssert getCurrentException() == e
+      doAssert e.msg == "1"
+      raise Ex.newException("2")
+  except Ex as e:
+    doAssert getCurrentException() == e
+    doAssert e.msg == "2"
+
+  doAssert getCurrentException() == nil
+
+test1()
+postcondition()
+
+# -------------
+# test case 2: indirect raise and local exception handler
+
+proc raiseEx() =
+  raise Ex.newException("2")
+
+proc test2() =
+  try:
+    try:
+      raise Ex.newException("1")
+    except Ex as e:
+      doAssert getCurrentException() == e
+      doAssert e.msg == "1"
+      raiseEx()
+  except Ex as e:
+    doAssert getCurrentException() == e
+    doAssert e.msg == "2"
+
+  doAssert getCurrentException() == nil
+
+steps = @[]
+test2()
+postcondition()
+
+# -------------
+# test case 3: indirect raise and non-local exception handler
+
+proc test3() =
+  proc inner() =
+    try:
+      raise Ex.newException("1")
+    except Ex as e:
+      doAssert getCurrentException() == e
+      doAssert e.msg == "1"
+      raiseEx()
+
+  try:
+    inner()
+  except Ex as e:
+    doAssert getCurrentException() == e
+    doAssert e.msg == "2"
+
+  doAssert getCurrentException() == nil
+
+steps = @[]
+test3()
+postcondition()
diff --git a/tests/exception/treraise2.nim b/tests/exception/treraise2.nim
new file mode 100644
index 00000000000..30216fe2887
--- /dev/null
+++ b/tests/exception/treraise2.nim
@@ -0,0 +1,58 @@
+discard """
+  description: '''
+    Ensure that raising a caught exception from within an exception handler
+    works
+  '''
+  knownIssue.js vm: "The current exception is not properly updated"
+"""
+
+proc manualReraise() =
+  # raising an already caught exception works and doesn't interfere with how
+  # the current exception is set
+  try:
+    raise CatchableError.newException("1")
+  except CatchableError as e:
+    raise e
+
+try:
+  manualReraise()
+except CatchableError as e:
+  doAssert e.msg == "1"
+
+doAssert getCurrentException() == nil
+
+# ---------------------------------------------------------------------------
+# more complex situation: re-raise an exception not caught by the most nested
+# handler
+
+# situation 1: catch within the original handler
+try:
+  raise CatchableError.newException("1")
+except CatchableError as e:
+  try:
+    try:
+      raise CatchableError.newException("2")
+    except CatchableError as e2:
+      raise e # raise the outer exception again
+  except CatchableError as e2:
+    doAssert e2.msg == "1"
+
+  # the current exception must still be the same as `e`
+  doAssert getCurrentException().msg == "1"
+
+doAssert getCurrentException() == nil
+
+# situation 2: catch outside the original handler
+try:
+  try:
+    raise CatchableError.newException("1")
+  except CatchableError as e:
+    try:
+      raise CatchableError.newException("2")
+    except CatchableError as e2:
+      raise e # raise the outer exception again
+  # the exception propagates outside the original handler
+except CatchableError as e:
+  doAssert e.msg == "1"
+
+doAssert getCurrentException() == nil
diff --git a/tests/lang_objects/destructor/tdestruction_in_unreachable.nim b/tests/lang_objects/destructor/tdestruction_in_unreachable.nim
new file mode 100644
index 00000000000..5efb1e3e846
--- /dev/null
+++ b/tests/lang_objects/destructor/tdestruction_in_unreachable.nim
@@ -0,0 +1,35 @@
+discard """
+  description: '''
+    Ensure that no destructor is called for a local defined in an unreachable
+    part of the code, even if the scope is left via unstructured control-flow.
+  '''
+  targets: "c js vm"
+"""
+
+type Object = object
+
+var wasDestroyed = false
+
+proc `=destroy`(x: var Object) =
+  wasDestroyed = true
+
+proc test(cond: bool) =
+  block:
+    if cond:
+      return
+    else:
+      raise CatchableError.newException("")
+
+  # everything beyond this point is statically unreachable code
+  var o = Object()
+  if cond:
+    # introduce an unstructured exit of the scope
+    return
+
+  discard o
+
+test(true)
+
+# XXX: wasDestroyed must be false, but it currently isn't. Testing the inverse
+#      makes sure that the test at least compiles
+doAssert wasDestroyed, "the behaviour is correct now"
\ No newline at end of file

From d53c9a31f1e8d12307383de8fa2f83b0f8821094 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sun, 3 Mar 2024 23:31:09 +0100
Subject: [PATCH 019/169] refactor(mir): split `mirchangesets` into two modules
 (#1217)

## Summary

Split `mirchangesets` into two modules: one for the changesets
concerning only `MirTree`s and one for `MirBody` changesets. This
breaks up unnecessary module dependencies and prepares for future
extension of the `MirBody` changesets.

## Details

* the existing `Changeset` type is renamed to `TreeChangeset`
  * it only records changes for trees, and no longer has direct
    integration with `MirBuilder`
  * `insert` and `replaceMulti` provide the raw node storage
* the `MirBody`-focused API providing `MirBuilder` instances is part
  of the new `newchangesets` module
  * inheritance (i.e., `TreeChangeset = object of RootObj`) is decided
    against because it doesn't work with `prepare(sink TreeChangeset)`
  * instead, `Changeset` stores an instance of `TreeChangeset`, with
    the `TreeChangeset` API being made available through proxy templates
* the `tmir_changesets` test is updated and renamed to
  `ttreechangesets`

`Changeset` needs to be coupled more with `MirBody` in the future.
Splitting the `MirTree`-only part into a separate type and module
makes it possible to keep using changesets where only a `MirTree` but
no `MirBody` exists. One such case is going to be transforming/
modifying MIR constant expressions.
---
 compiler/mir/injecthooks.nim                  |  6 +-
 compiler/mir/mirpasses.nim                    |  6 +-
 compiler/mir/newchangesets.nim                | 92 +++++++++++++++++++
 .../{mirchangesets.nim => treechangesets.nim} | 72 +++++----------
 compiler/sem/injectdestructors.nim            | 14 +--
 ...mir_changesets.nim => ttreechangesets.nim} |  8 +-
 6 files changed, 133 insertions(+), 65 deletions(-)
 create mode 100644 compiler/mir/newchangesets.nim
 rename compiler/mir/{mirchangesets.nim => treechangesets.nim} (79%)
 rename tests/compiler/{tmir_changesets.nim => ttreechangesets.nim} (95%)

diff --git a/compiler/mir/injecthooks.nim b/compiler/mir/injecthooks.nim
index 6f7d3b08b44..201ae64db01 100644
--- a/compiler/mir/injecthooks.nim
+++ b/compiler/mir/injecthooks.nim
@@ -19,7 +19,7 @@ import
   ],
   compiler/mir/[
     mirbodies,
-    mirchangesets,
+    newchangesets,
     mirconstr,
     mirenv,
     mirtrees
@@ -292,6 +292,6 @@ proc injectHooks*(body: var MirBody, graph: ModuleGraph, env: var MirEnv,
                   owner: PSym) =
   ## Adapter for the legacy pass-application pipeline. Once possible, the pass
   ## needs to be treated as just another MIR pass.
-  var c = initChangeset(body.code)
+  var c = initChangeset(body)
   injectHooks(body, graph, env, owner, c)
-  apply(body.code, prepare(c))
+  body.apply(c)
diff --git a/compiler/mir/mirpasses.nim b/compiler/mir/mirpasses.nim
index a561fda2b4c..c7ab7420a11 100644
--- a/compiler/mir/mirpasses.nim
+++ b/compiler/mir/mirpasses.nim
@@ -19,7 +19,7 @@ import
     datatables,
     mirbodies,
     mirenv,
-    mirchangesets,
+    newchangesets,
     mirconstr,
     mirtrees,
     sourcemaps
@@ -465,9 +465,9 @@ proc applyPasses*(body: var MirBody, prc: PSym, env: var MirEnv,
   ## certain passes. Passes may register new entities with `env`.
   template batch(b: untyped) =
     block:
-      var c {.inject.} = initChangeset(body.code)
+      var c {.inject.} = initChangeset(body)
       b
-      apply(body.code, prepare(c))
+      apply(body, c)
 
   if target == targetC:
     batch:
diff --git a/compiler/mir/newchangesets.nim b/compiler/mir/newchangesets.nim
new file mode 100644
index 00000000000..ed038118479
--- /dev/null
+++ b/compiler/mir/newchangesets.nim
@@ -0,0 +1,92 @@
+## Implements the `Changeset <#Changeset>`_ type, which is a changeset for
+## `MirBody <mirbodies.html#MirBody>`_. It builds upon/extends
+## `TreeChangeset <treechangesets.html#TreeChangeset>`_.
+
+import
+  compiler/mir/[
+    mirbodies,
+    mirconstr,
+    mirtrees,
+    sourcemaps,
+    treechangesets
+  ]
+
+type
+  Changeset* = object
+    ## Represents a set of changes to be applied to a ``MirBody``.
+    inner: TreeChangeset
+    numTemps: uint32
+      ## keeps track of the number of temporaries. Exchanged with
+      ## the created builder, where it's used for allocating new IDs
+
+# ----------------------------------------
+# proxy routines
+
+template replace*(c: var Changeset, tree: MirTree, at: NodePosition,
+                  with: MirNode) =
+  ## Same as `replace <treechangesets.html#replace,TreeChangeset,MirTree,NodePosition,sinkMirNode>`_.
+  replace(c.inner, tree, at, with)
+
+template changeTree*(c: var Changeset, tree: MirTree, at: NodePosition,
+                     with: MirNode) =
+  ## Same as `changeTree <treechangesets.html#changeTree,TreeChangeset,MirTree,NodePosition,sinkMirNode>`_.
+  changeTree(c.inner, tree, at, with)
+
+template insert*(c: var Changeset, at: NodePosition, n: MirNode) =
+  ## Same as `insert <treechangesets.html#insert,TreeChangeset,NodePosition,sinkMirNode>`_.
+  insert(c.inner, at, n)
+
+template remove*(c: var Changeset, tree: MirTree, at: NodePosition) =
+  ## Same as `remove <treechangesets.html#remove,TreeChangeset,MirTree,NodePosition>`_.
+  remove(c.inner, tree, at)
+
+# ----------------------------------------
+# `Changeset`-specific routines
+
+func initChangeset*(body: MirBody): Changeset =
+  ## Sets up a changeset for `body`. The changeset either needs to be
+  ## discarded, or applied to the same ``MirBody`` instance it was created for.
+  # compute the next ID to use for new temporaries:
+  for i, n in body.code.pairs:
+    if n.kind in DefNodes and
+       (let ent = body.code[i, 0]; ent.kind in {mnkTemp, mnkAlias}):
+      result.numTemps = max(ent.temp.uint32 + 1, result.numTemps)
+
+func initBuilder(c: var Changeset, buffer: var MirNodeSeq,
+                 info: SourceId): MirBuilder =
+  ## Internal routine for setting up a builder. Must be paired with a
+  ## ``finishBuilder`` call.
+  result = initBuilder(info, move buffer)
+  swap(c.numTemps, result.numTemps)
+
+func finishBuilder(c: var Changeset, buffer: var MirNodeSeq,
+                   bu: sink MirBuilder) =
+  # move the ID counter and buffer back into the changeset
+  swap(c.numTemps, bu.numTemps)
+  buffer = finish(bu)
+
+template insert*(c: var Changeset, tree: MirTree, at, source: NodePosition,
+                 name: untyped, body: untyped) =
+  ## Records an insertion at the `at` position. For building the new tree,
+  ## a ``MirBuilder`` instance is made available to the provided `body` via
+  ## an injected local of name `name`. `source` identifies the node to
+  ## inherit source information from.
+  insert(c.inner, at, bufferTmp):
+    var name = initBuilder(c, bufferTmp, tree[source].info)
+    body
+    finishBuilder(c, bufferTmp, name)
+
+template replaceMulti*(c: var Changeset, tree: MirTree, at: NodePosition,
+                       name, body: untyped) =
+  ## Records a replacement of the node or sub-tree at the `at` position. For
+  ## building the replacement tree, a ``MirBuilder`` instance is made
+  ## available to the provided `body` via an injected local of name `name`.
+  let pos = at
+  replaceMulti(c.inner, tree, pos, bufferTmp):
+    var name = initBuilder(c, bufferTmp, tree[pos].info)
+    body
+    finishBuilder(c, bufferTmp, name)
+
+func apply*(body: var MirBody, c: sink Changeset) =
+  ## Applies the changeset `c` to `body`.
+  apply(body.code, prepare(move c.inner))
diff --git a/compiler/mir/mirchangesets.nim b/compiler/mir/treechangesets.nim
similarity index 79%
rename from compiler/mir/mirchangesets.nim
rename to compiler/mir/treechangesets.nim
index e360fe7645c..fcfae9b2ab2 100644
--- a/compiler/mir/mirchangesets.nim
+++ b/compiler/mir/treechangesets.nim
@@ -1,19 +1,19 @@
-## This module implements the ``Changeset`` API, which is the main way of
-## applying changes to a ``MirTree``.
+## This module implements the `TreeChangeset <#TreeChangeset>`_ API, which is
+## the main way of modifying a ``MirTree`` after its initial construction.
 ##
 ## Instead of modifying a ``MirTree`` directly, the changes (which can be
 ## insertions, replacements, or removals) are first recorded into a
-## ``Changeset``. This allows for recording changes independent of each other
-## concurrently and later apply the changes all at once.
+## ``TreeChangeset``. This allows for recording changes independent of each
+## other concurrently and later applying the changes all at once.
 ##
-## Before applying a ``Changeset`` to a ``MirTree``, it has to be prepared via
-## a call to ``prepare`` first, after which the ``Changeset`` is sealed an no
-## further changes can be recorded. ``prepare`` is responsible from normalizing
-## the internal representation of the ``Changeset`` and is required for the
-## later application to work.
+## Before applying a ``TreeChangeset`` to a ``MirTree``, it has to be prepared
+## via a call to ``prepare`` first, after which the ``TreeChangeset`` is sealed
+## and no further changes can be recorded. ``prepare`` is responsible for
+## normalizing the internal representation of the ``TreeChangeset`` and is
+## required for the later application to work.
 ##
 ## Applying the ``PreparedChangeset`` is done via ``apply``. This integrates
-## all recorded changes into the applied to tree,.
+## all recorded changes into the applied-to tree.
 ##
 ## Order of application
 ## --------------------
@@ -32,9 +32,7 @@ import
     algorithm
   ],
   compiler/mir/[
-    mirtrees,
-    mirconstr,
-    sourcemaps
+    mirtrees
   ],
   compiler/utils/[
     idioms
@@ -50,13 +48,11 @@ type
     orig: HOslice[NodeIndex] ## the slice of nodes this change affects
     src:  HOslice[NodeIndex] ## a slice in the buffer of staged nodes
 
-  Changeset* = object
+  TreeChangeset* = object
     ## Represents a set of changes to be applied to a ``MirTree``.
     nodes: seq[MirNode]
     rows: seq[Row]
 
-    numTemps: uint32 ## the number of existing temporaries
-
   PreparedChangeset* = object
     nodes: seq[MirNode]
     rows: seq[Row]
@@ -65,6 +61,9 @@ type
     stagingSize: int ## the minimum amount of nodes the working area must be
                      ## able to hold
 
+  # use a local alias for convenience:
+  Changeset = TreeChangeset
+
 func single[T](x: T): HOslice[T] {.inline.} =
   ## Utility for creating a slice with a single item
   HOslice[T](a: x, b: succ(x))
@@ -84,16 +83,6 @@ func addSingle(s: var MirNodeSeq, n: sink MirNode): HOslice[NodeIndex] =
   s.add n
   result = single(s.high.NodeIndex)
 
-func initChangeset*(tree: MirTree): Changeset =
-  ## Initializes a new ``Changeset`` instance. Until the resulting
-  ## ``Changeset`` is applied, the associated tree must not be modified.
-
-  # count the number of existing temporaries:
-  for i, n in tree.pairs:
-    if n.kind in DefNodes and
-       (let ent = tree[i, 0]; ent.kind in {mnkTemp, mnkAlias}):
-      result.numTemps = max(ent.temp.uint32 + 1, result.numTemps)
-
 func replace*(c: var Changeset, tree: MirTree, at: NodePosition,
               with: sink MirNode) =
   ## Records replacing the node or sub-tree at `at` with `with`. The origin
@@ -121,19 +110,8 @@ func insert*(c: var Changeset, at: NodePosition, n: sink MirNode) =
   ## is not modified.
   c.rows.add row(at, at, c.nodes.addSingle(n))
 
-func initBuilder(c: var Changeset, info: SourceId): MirBuilder =
-  ## Internal routines for setting up a builder. Must be paired with a
-  ## ``finishBuilder`` call.
-  result = initBuilder(info, move c.nodes)
-  swap(c.numTemps, result.numTemps)
-
-func finishBuilder(c: var Changeset, bu: sink MirBuilder) =
-  # move the ID counter and buffer back into the changeset
-  swap(c.numTemps, bu.numTemps)
-  c.nodes = finish(bu)
-
-template insert*(c: var Changeset, tree: MirTree, at, source: NodePosition,
-                 name: untyped, body: untyped) =
+template insert*(c: var Changeset, at: NodePosition, name: untyped,
+                 body: untyped) =
   ## Records an insertion at the `at` position, providing direct
   ## access to the internal node buffer inside `body` via an injected variable
   ## of the name `name`. `source` is the node to inherit the source/origin
@@ -141,14 +119,14 @@ template insert*(c: var Changeset, tree: MirTree, at, source: NodePosition,
   block:
     let
       start = c.nodes.len.NodeIndex
-      # evaluate `at` and `source` before `body`, as the latter might change
-      # what `source` evaluates to:
+      # evaluate `at` before `body`, as the latter might change
+      # what `at` evaluates to:
       pos = at
-      info = tree[source].info
 
-    var name = initBuilder(c, info)
+    var name: MirNodeSeq
+    swap(name, c.nodes)
     body
-    finishBuilder(c, name)
+    swap(name, c.nodes)
 
     c.rows.add row(pos, pos, span(start, c.nodes.len.NodeIndex))
 
@@ -161,12 +139,12 @@ template replaceMulti*(c: var Changeset, tree: MirTree, at: NodePosition,
     let
       start = c.nodes.len.NodeIndex
       pos = at # prevent double evaluation
-      info = tree[pos].info
       next = sibling(tree, pos)
 
-    var name = initBuilder(c, info)
+    var name: MirNodeSeq
+    swap(name, c.nodes)
     body
-    finishBuilder(c, name)
+    swap(name, c.nodes)
 
     c.rows.add row(pos, next, span(start, c.nodes.len.NodeIndex))
 
diff --git a/compiler/sem/injectdestructors.nim b/compiler/sem/injectdestructors.nim
index fa48d3d6c6f..e34cd3ae505 100644
--- a/compiler/sem/injectdestructors.nim
+++ b/compiler/sem/injectdestructors.nim
@@ -112,7 +112,7 @@ import
   compiler/mir/[
     analysis,
     mirbodies,
-    mirchangesets,
+    newchangesets,
     mirconstr,
     mirenv,
     mirtrees,
@@ -880,13 +880,9 @@ proc injectDestructorCalls*(g: ModuleGraph, idgen: IdGenerator,
   ## For now, semantic errors and other diagnostics related to lifetime-hook
   ## usage are also reported here.
 
-  template apply(c: Changeset) =
-    ## Applies the changeset `c` to `body`.
-    apply(body.code, prepare(c))
-
   # apply the first batch of passes:
   block:
-    var changes = initChangeset(body.code)
+    var changes = initChangeset(body)
     # the VM implements branch switching itself - performing the lowering for
     # code meant to run in it would be harmful
     # FIXME: discriminant assignment lowering also needs to be disabled for
@@ -903,12 +899,12 @@ proc injectDestructorCalls*(g: ModuleGraph, idgen: IdGenerator,
           changes.replaceMulti(body.code, i, buf):
             lowerBranchSwitch(buf, body.code, g, idgen, env, i)
 
-    apply(changes)
+    body.apply(changes)
 
   # apply the second batch of passes:
   block:
     var
-      changes = initChangeset(body.code)
+      changes = initChangeset(body)
       actx = AnalyseCtx(graph: g, cfg: computeDfg(body.code))
 
     let
@@ -926,4 +922,4 @@ proc injectDestructorCalls*(g: ModuleGraph, idgen: IdGenerator,
 
     injectDestructors(body.code, g, destructors, env, changes)
 
-    apply(changes)
+    body.apply(changes)
diff --git a/tests/compiler/tmir_changesets.nim b/tests/compiler/ttreechangesets.nim
similarity index 95%
rename from tests/compiler/tmir_changesets.nim
rename to tests/compiler/ttreechangesets.nim
index d74c93deaec..10ed10d98fb 100644
--- a/tests/compiler/tmir_changesets.nim
+++ b/tests/compiler/ttreechangesets.nim
@@ -1,5 +1,5 @@
 discard """
-  description: "Tests for the MIR ``Changeset`` API"
+  description: "Tests for the MIR ``TreeChangeset`` API"
   targets: native
 """
 
@@ -7,9 +7,11 @@ discard """
 
 import
   compiler/ast/ast_types,
-  compiler/mir/[mirtrees, mirchangesets, mirconstr, sourcemaps],
+  compiler/mir/[mirtrees, treechangesets, mirconstr, sourcemaps],
   compiler/utils/containers
 
+type Changeset = TreeChangeset
+
 proc temp(x: int): MirNode =
   MirNode(kind: mnkTemp, temp: x.TempId)
 
@@ -42,7 +44,7 @@ template test(input, output: typed, body: untyped) =
       tree =
         when input is array: @input
         else:                input
-      c {.inject.} = initChangeset(tree)
+      c {.inject.}: Changeset
       sourceMap = setupSourceMap(tree)
 
     template replace(c: Changeset, i: int, n: MirNode) {.inject.} =

From c40038fa906ca10a91bcb82ad19f92a9c4420497 Mon Sep 17 00:00:00 2001
From: Adam Sherwood <43248857+theSherwood@users.noreply.github.com>
Date: Mon, 4 Mar 2024 20:17:41 +0000
Subject: [PATCH 020/169] export `.dynlib` procs to WASM when using Emscripten
 (#1218)

## Summary
* The  `dynlib`  pragma now ensures that the procedure is exported to
WASM when compiling with Emscripten

## Details
*  `N_LIB_EXPORT`  now expands to
`__attribute__((used, visibility("default")))`  when  `__EMSCRIPTEN__`
is defined.
* Compiling to wasm with emscripten won't export symbols without
`__attribute__((used))` .

Replaces https://github.com/nim-works/nimskull/pull/1216 (where I merged
some changes that didn't belong)

---------

Co-authored-by: zerbina <100542850+zerbina@users.noreply.github.com>
---
 lib/nimbase.h | 13 +++++++++++--
 1 file changed, 11 insertions(+), 2 deletions(-)

diff --git a/lib/nimbase.h b/lib/nimbase.h
index 8ec14d58a53..4720b251c5d 100644
--- a/lib/nimbase.h
+++ b/lib/nimbase.h
@@ -18,6 +18,7 @@ __POCC__
 __TINYC__
 __clang__
 __AVR__
+__EMSCRIPTEN__
 */
 
 
@@ -220,8 +221,16 @@ __AVR__
 #    define N_FASTCALL_PTR(rettype, name) rettype (*name)
 #    define N_SAFECALL_PTR(rettype, name) rettype (*name)
 #  endif
-#  define N_LIB_EXPORT NIM_EXTERNC __attribute__((visibility("default")))
-#  define N_LIB_EXPORT_VAR  __attribute__((visibility("default")))
+#  ifdef __EMSCRIPTEN__
+//   Emscripten uses an EMSCRIPTEN_KEEPALIVE macro to mark exports, but also
+//   requires an <emscripten.h> include. The macro expands to __attribute__((used)).
+//   With the following, we cut out the middleman and avoid that include:
+#    define N_LIB_EXPORT  NIM_EXTERNC __attribute__((used, visibility("default")))
+#    define N_LIB_EXPORT_VAR  __attribute__((used, visibility("default")))
+#  else
+#    define N_LIB_EXPORT  NIM_EXTERNC __attribute__((visibility("default")))
+#    define N_LIB_EXPORT_VAR  __attribute__((visibility("default")))
+#  endif
 #  define N_LIB_IMPORT  extern
 #endif
 

From edeee65787e9d46351f659c0f0d3faaa2562396e Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Tue, 5 Mar 2024 17:22:17 +0100
Subject: [PATCH 021/169] fix(cgirgen): compiler crash with unreachable code
 (#1219)

## Summary

Fix elimination of unreachable code in the MIR-to-CGIR translation
leading to the compiler crashing in some cases.

## Details

With how the current forward translation of MIR-to-CGIR works,
definitions of locals/globals in unscoped contexts need to always be
translated, otherwise they won't be moved to the start of their scope.

The previous approach was to only disable translation following
terminal statements when in scoped contexts, and always enabling
translation after join-like statements, but this doesn't catch the
following:
```
scope:
  try:
    scope:
      raise
    def _1 = ...
  finally:
    =destroy(name _1)
```

Since the `raise` terminal statement is in a scoped context, translation
is disabled, but due to the lack of a join-like statement following it,
it isn't enabled again for the `def` statement. Since the `_1` local is
then not registered with the CGIR body, either translation or code
generation for the (reachable) `=destroy(name _1)` crashes due to the
unknown local.

### The Solution

A different approach to mitigating the current problem with unscoped
locals is used: no special handling is applied when setting the
`cl.isActive` flag. Instead, the flag is ignored when within unscoped
contexts. This is both simpler and more robust than the previous
workaround.

A regression test that produces MIR akin to the above example is added.
---
 compiler/backend/cgirgen.nim                  | 41 ++++++++-----------
 .../tdestruction_in_unreachable.nim           | 21 ++++++++++
 2 files changed, 39 insertions(+), 23 deletions(-)

diff --git a/compiler/backend/cgirgen.nim b/compiler/backend/cgirgen.nim
index 72963ea341c..753574c224e 100644
--- a/compiler/backend/cgirgen.nim
+++ b/compiler/backend/cgirgen.nim
@@ -283,22 +283,8 @@ proc genObjConv(n: CgNode, a, b, t: PType): CgNode =
     if diff < 0: cnkObjUpConv else: cnkObjDownConv,
     n.info, t): n
 
-proc disable(cl: var TranslateCl) =
-  # consider the following MIR:
-  #   try:
-  #     return
-  #     def _1 = ...
-  #   finally:
-  #     =destroy(name _1)
-  #
-  # Although nonesense, this is currently both legal and possible MIR. If
-  # translation would be disabled beyond the ``return``, then the temporary
-  # wouldn't be registered. Therefore, disable is a no-op when in an unscoped
-  # contexts (such as the above)
-  # XXX: eliminating unreachable code needs to happen much earlier, either in
-  #      ``mirgen`` or ``transf``
-  if not cl.inUnscoped:
-    cl.isActive = false
+func disable(cl: var TranslateCl) {.inline.} =
+  cl.isActive = false
 
 # forward declarations:
 proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
@@ -737,12 +723,8 @@ proc join(stmts: var seq[CgNode], cl: var TranslateCl, info: TLineInfo,
   if label == target and (found or required):
     stmts.add newTree(cnkJoinStmt, info, node(label))
 
-  if found or true:
+  if found:
     # code is alive if following a join that is targeted by an alive goto
-    # XXX: translation has to be forcefully enabled at a join, even if not
-    #      within a scoped context: the surrounding scope might itself be
-    #      part of an unscoped context. This is a temporary workaround, see
-    #      `disable <#disable,TranslateCl>`_
     cl.isActive = true
 
 template join(info: TLineInfo, lbl: LabelId; required = false) =
@@ -773,8 +755,21 @@ template guarded(lbl: LabelId, body: untyped) =
 proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
               cr: var TreeCursor, stmts: var seq[CgNode]) =
 
-  # skip the statement if translation is disabled
-  if not cl.isActive:
+  # skip the statement if translation is disabled, but with a caveat. Consider
+  # the following MIR:
+  #   try:
+  #     return
+  #     def _1 = ...
+  #   finally:
+  #     =destroy(name _1)
+  #
+  # Although nonesense, this is currently both legal and possible MIR. If
+  # translation would be disabled beyond the ``return``, then the temporary
+  # wouldn't be registered. Therefore, translation is always enabled in unscoped
+  # contexts (such as the above)
+  # XXX: eliminating unreachable code needs to happen much earlier, either in
+  #      ``mirgen`` or ``transf``
+  if not cl.isActive and not cl.inUnscoped:
     tree.skip(cr)
     return
 
diff --git a/tests/lang_objects/destructor/tdestruction_in_unreachable.nim b/tests/lang_objects/destructor/tdestruction_in_unreachable.nim
index 5efb1e3e846..ab12209fb0e 100644
--- a/tests/lang_objects/destructor/tdestruction_in_unreachable.nim
+++ b/tests/lang_objects/destructor/tdestruction_in_unreachable.nim
@@ -32,4 +32,25 @@ test(true)
 
 # XXX: wasDestroy must be false, but it currently isn't. Testing the inverse
 #      makes sure that the test at least compiles
+doAssert wasDestroyed, "the behaviour is correct now"
+
+# ------------------------------
+# test without if/else statement
+
+proc test2(cond: bool) =
+  block:
+    # the return is within its own scope. Using a raise would have the same
+    # compile-time effect, but would result in an unhandled exception at
+    # run-time
+    return
+
+  var o = Object()
+  if cond:
+    # introduce an unstructured exit of the scope (which currently
+    # forces destruction within a finally)
+    return
+  discard o
+
+test2(true)
+# XXX: same comment as for the assertion above
 doAssert wasDestroyed, "the behaviour is correct now"
\ No newline at end of file

From 924dcaf0ae0285a93ca084c05837a75dcec34278 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Tue, 5 Mar 2024 17:30:57 +0100
Subject: [PATCH 022/169] refactor: rename `newchangesets` module (#1220)

## Summary

Rename the `newchangesets` module to `mirchangesets`. A temporary name
was used so that Git history of the original `mirchangesets` module
(now `treechangesets`) is kept intact.
---
 compiler/mir/injecthooks.nim                          | 2 +-
 compiler/mir/{newchangesets.nim => mirchangesets.nim} | 0
 compiler/mir/mirpasses.nim                            | 2 +-
 compiler/sem/injectdestructors.nim                    | 2 +-
 4 files changed, 3 insertions(+), 3 deletions(-)
 rename compiler/mir/{newchangesets.nim => mirchangesets.nim} (100%)

diff --git a/compiler/mir/injecthooks.nim b/compiler/mir/injecthooks.nim
index 201ae64db01..eefcc5f5178 100644
--- a/compiler/mir/injecthooks.nim
+++ b/compiler/mir/injecthooks.nim
@@ -19,7 +19,7 @@ import
   ],
   compiler/mir/[
     mirbodies,
-    newchangesets,
+    mirchangesets,
     mirconstr,
     mirenv,
     mirtrees
diff --git a/compiler/mir/newchangesets.nim b/compiler/mir/mirchangesets.nim
similarity index 100%
rename from compiler/mir/newchangesets.nim
rename to compiler/mir/mirchangesets.nim
diff --git a/compiler/mir/mirpasses.nim b/compiler/mir/mirpasses.nim
index c7ab7420a11..74ba5c7076c 100644
--- a/compiler/mir/mirpasses.nim
+++ b/compiler/mir/mirpasses.nim
@@ -19,7 +19,7 @@ import
     datatables,
     mirbodies,
     mirenv,
-    newchangesets,
+    mirchangesets,
     mirconstr,
     mirtrees,
     sourcemaps
diff --git a/compiler/sem/injectdestructors.nim b/compiler/sem/injectdestructors.nim
index e34cd3ae505..b51ff3643cb 100644
--- a/compiler/sem/injectdestructors.nim
+++ b/compiler/sem/injectdestructors.nim
@@ -112,7 +112,7 @@ import
   compiler/mir/[
     analysis,
     mirbodies,
-    newchangesets,
+    mirchangesets,
     mirconstr,
     mirenv,
     mirtrees,

From 5aca007cd7ef41a1128fbe6d6eb667ce612f847c Mon Sep 17 00:00:00 2001
From: Clyybber <darkmine956@gmail.com>
Date: Wed, 6 Mar 2024 19:54:12 +0100
Subject: [PATCH 023/169] Remove nkStmtListType and nkBlockType nodes (#1221)

## Summary
* Remove the `nkStmtListType` and `nkBlockType` node kinds and replace
the remaining usages of `nkStmtListType` with `nkStmtListExpr`

## Details
* `not nil` is implemented as a `TypeTrait` magic and no longer
reaches mirgen
* A workaround for untyped AST in sempass2 has been added to the check
introduced in cef64c469f167d4eeb3edda85c78040ccc95bfe9, along with a
`knownIssue` test case for the underlying issue

---------

Co-authored-by: zerbina <100542850+zerbina@users.noreply.github.com>
---
 compiler/ast/ast_query.nim                    |  2 --
 compiler/ast/ast_types.nim                    |  3 --
 compiler/ast/renderer.nim                     |  8 ++---
 compiler/front/condsyms.nim                   |  1 +
 compiler/mir/mirgen.nim                       | 20 +----------
 compiler/sem/sem.nim                          |  2 +-
 compiler/sem/semexprs.nim                     |  3 --
 compiler/sem/semfold.nim                      |  6 ++--
 compiler/sem/semgnrc.nim                      |  2 +-
 compiler/sem/semmagic.nim                     |  8 ++++-
 compiler/sem/sempass2.nim                     |  9 ++---
 compiler/sem/semtempl.nim                     |  2 +-
 compiler/sem/semtypes.nim                     | 23 ++++---------
 lib/core/macros.nim                           |  4 +--
 lib/system.nim                                |  3 ++
 .../lang_objects/metatype/ttyped_type_ast.nim | 33 +++++++++++++++++++
 16 files changed, 67 insertions(+), 62 deletions(-)
 create mode 100644 tests/lang_objects/metatype/ttyped_type_ast.nim

diff --git a/compiler/ast/ast_query.nim b/compiler/ast/ast_query.nim
index 57533b37bbe..bfe706246ca 100644
--- a/compiler/ast/ast_query.nim
+++ b/compiler/ast/ast_query.nim
@@ -123,8 +123,6 @@ const
     nkIteratorTy,
     nkSharedTy,
     nkEnumTy,
-    nkStmtListType,
-    nkBlockType
   }
 
   # TODO: replace with `nk*Literals`, see above
diff --git a/compiler/ast/ast_types.nim b/compiler/ast/ast_types.nim
index b214870ab14..1f0730c04c0 100644
--- a/compiler/ast/ast_types.nim
+++ b/compiler/ast/ast_types.nim
@@ -201,9 +201,6 @@ type
     nkBlockExpr           ## a statement block ending in an expr; this is used
                           ## to allow powerful multi-line templates that open a
                           ## temporary scope
-    nkStmtListType        ## a statement list ending in a type; for macros
-    nkBlockType           ## a statement block ending in a type; for macros
-                          ## types as syntactic trees:
 
     nkWith                ## distinct with `foo`
     nkWithout             ## distinct without `foo`
diff --git a/compiler/ast/renderer.nim b/compiler/ast/renderer.nim
index d59a9dadd75..991c0113756 100644
--- a/compiler/ast/renderer.nim
+++ b/compiler/ast/renderer.nim
@@ -633,14 +633,14 @@ proc longMode(g: TSrcGen; n: PNode, start: int = 0, theEnd: int = - 1): bool =
 
 proc gstmts(g: var TSrcGen, n: PNode, c: TContext, doIndent=true) =
   if n.kind == nkEmpty: return
-  if n.kind in {nkStmtList, nkStmtListExpr, nkStmtListType}:
+  if n.kind in {nkStmtList, nkStmtListExpr}:
     if doIndent: indentNL(g)
     for i in 0..<n.len:
       if i > 0:
         optNL(g, n[i-1], n[i])
       else:
         optNL(g)
-      if n[i].kind in {nkStmtList, nkStmtListExpr, nkStmtListType}:
+      if n[i].kind in {nkStmtList, nkStmtListExpr}:
         gstmts(g, n[i], c, doIndent=false)
       else:
         gsub(g, n[i], fromStmtList = true)
@@ -1421,7 +1421,7 @@ proc gsub(g: var TSrcGen, n: PNode, c: TContext, fromStmtList = false) =
     put(g, tkSpaces, Space)
     putWithSpace(g, tkEquals, "=")
     gsub(g, n, 1)
-  of nkStmtList, nkStmtListExpr, nkStmtListType:
+  of nkStmtList, nkStmtListExpr:
     if n.len == 1 and n[0].kind == nkDiscardStmt:
       put(g, tkParLe, "(")
       gsub(g, n[0])
@@ -1654,7 +1654,7 @@ proc renderTree*(n: PNode, renderFlags: TRenderFlags = {}): string =
   # do not indent the initial statement list so that
   # writeFile("file.nim", repr n)
   # produces working Nim code:
-  if n.kind in {nkStmtList, nkStmtListExpr, nkStmtListType}:
+  if n.kind in {nkStmtList, nkStmtListExpr}:
     gstmts(g, n, emptyContext, doIndent = false)
   else:
     gsub(g, n)
diff --git a/compiler/front/condsyms.nim b/compiler/front/condsyms.nim
index 8bad92d1f8d..1af4b0141cb 100644
--- a/compiler/front/condsyms.nim
+++ b/compiler/front/condsyms.nim
@@ -75,3 +75,4 @@ proc initDefines*(symbols: StringTableRef) =
   defineSymbol("nimskullNoMagicNewAssign")
   defineSymbol("nimskullNoFloat128")
   defineSymbol("nimskullNewExceptionRt")
+  defineSymbol("nimskullNoNkStmtListTypeAndNkBlockType")
diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index b1498f11023..9c573881729 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -547,28 +547,10 @@ proc genTypeExpr(c: var TCtx, n: PNode): Value =
   assert n.typ.kind == tyTypeDesc
   c.builder.useSource(c.sp, n)
   case n.kind
-  of nkStmtListType, nkStmtListExpr:
+  of nkStmtListExpr:
     # FIXME: a ``nkStmtListExpr`` shouldn't reach here, but it does. See
     #        ``tests/lang_callable/generics/t18859.nim`` for a case where it
     #        does
-    if n[^1].typ.kind == tyTypeDesc:
-      genTypeExpr(c, n.lastSon)
-    else:
-      # HACK: this is big hack. Consider the following case:
-      #
-      #       .. code-block:: nim
-      #
-      #         type Obj[T] = object
-      #           p: T not nil
-      #
-      #         var x: Obj[ref int]
-      #
-      #       The ``T not nil`` is a ``nkStmtListType`` node with a single
-      #       ``nkInfix`` sub-node, where the latter doesn't use a
-      #       ``tyTypeDesc`` type but a ``tyRef`` instead. For now, we work
-      #       around this by using the type of the ``nkStmtListType``
-      typeLit(n.typ)
-  of nkBlockType:
     genTypeExpr(c, n.lastSon)
   of nkSym:
     case n.sym.kind
diff --git a/compiler/sem/sem.nim b/compiler/sem/sem.nim
index a96c96221a1..3d98df006e9 100644
--- a/compiler/sem/sem.nim
+++ b/compiler/sem/sem.nim
@@ -730,7 +730,7 @@ proc semAfterMacroCall(c: PContext, call, macroResult: PNode,
       # More restrictive version.
       result = semExprWithType(c, result, flags)
     of tyTypeDesc:
-      if result.kind == nkStmtList: result.transitionSonsKind(nkStmtListType)
+      if result.kind == nkStmtList: result.transitionSonsKind(nkStmtListExpr)
       result = semTypeNode2(c, result, nil)
       if result.kind != nkError:
         result.typ = makeTypeDesc(c, result.typ)
diff --git a/compiler/sem/semexprs.nim b/compiler/sem/semexprs.nim
index dcafe9b8fcb..39ed98b095a 100644
--- a/compiler/sem/semexprs.nim
+++ b/compiler/sem/semexprs.nim
@@ -3623,9 +3623,6 @@ proc semExpr(c: PContext, n: PNode, flags: TExprFlags = {}): PNode =
     result = semTypeNode2(c, n, nil)
     # a type expression is of type ``typeDesc[T]``
     result.typ = makeTypeDesc(c, result.typ.skipTypes({tyTypeDesc}))
-  of nkStmtListType:
-    result = semTypeNode2(c, n, nil)
-    result.typ = makeTypeDesc(c, result.typ)
   of nkCall, nkInfix, nkPrefix, nkPostfix, nkCommand, nkCallStrLit:
     # check if it is an expression macro:
     checkMinSonsLen(n, 1, c.config)
diff --git a/compiler/sem/semfold.nim b/compiler/sem/semfold.nim
index 81df1f7097e..66b5e4468f4 100644
--- a/compiler/sem/semfold.nim
+++ b/compiler/sem/semfold.nim
@@ -844,14 +844,14 @@ proc foldConstExprAux(m: PSym, n: PNode, idgen: IdGenerator, g: ModuleGraph): Fo
     return
   of nkSym:
     discard "may be folded away"
-  of nkTypeExprs - {nkStmtListType, nkBlockType}:
+  of nkTypeExprs:
     result.node = newNodeIT(nkType, n.info, n.typ)
   of nkBracket, nkCurly, nkTupleConstr, nkRange, nkAddr, nkHiddenAddr,
      nkHiddenDeref, nkDerefExpr, nkBracketExpr, nkCallKinds, nkIfExpr,
      nkElifExpr, nkElseExpr, nkElse, nkElifBranch:
     for it in n.items:
       result.add foldConstExprAux(m, it, idgen, g)
-  of nkCast, nkConv, nkHiddenStdConv, nkHiddenSubConv, nkBlockExpr, nkBlockType:
+  of nkCast, nkConv, nkHiddenStdConv, nkHiddenSubConv, nkBlockExpr:
     # the first slot only holds the type/label, which we don't need to traverse
     # into / fold
     result.add n[0]
@@ -875,7 +875,7 @@ proc foldConstExprAux(m: PSym, n: PNode, idgen: IdGenerator, g: ModuleGraph): Fo
     result.add n[0] # skip the type slot
     for i in 1..<n.len:
       result.add foldConstExprAux(m, n[i], idgen, g)
-  of nkStmtListExpr, nkStmtListType:
+  of nkStmtListExpr:
     for i in 0..<n.len-1:
       result.add foldInAstAux(m, n[i], idgen, g)
     # the last node is an expression
diff --git a/compiler/sem/semgnrc.nim b/compiler/sem/semgnrc.nim
index d9eb91c0880..eaa4596cb53 100644
--- a/compiler/sem/semgnrc.nim
+++ b/compiler/sem/semgnrc.nim
@@ -432,7 +432,7 @@ proc semGenericStmt(c: PContext, n: PNode,
       n[^1] = checkError semGenericStmt(c, n[^1], flags, ctx)
       closeScope(c)
       closeScope(c)
-  of nkBlockStmt, nkBlockExpr, nkBlockType:
+  of nkBlockStmt, nkBlockExpr:
     checkSonsLen(n, 2, c.config)
     openScope(c)
     if n[0].kind != nkEmpty:
diff --git a/compiler/sem/semmagic.nim b/compiler/sem/semmagic.nim
index 2ed006a579a..0fbb1d84380 100644
--- a/compiler/sem/semmagic.nim
+++ b/compiler/sem/semmagic.nim
@@ -175,7 +175,13 @@ proc evalTypeTrait(c: PContext; traitCall: PNode, operand: PType, context: PSym)
   of "and":
     return typeWithSonsResult(tyAnd, @[operand, operand2])
   of "not":
-    return typeWithSonsResult(tyNot, @[operand])
+    if traitCall.len == 3:
+      c.config.internalAssert traitCall[2].kind == nkNilLit
+      # the operand is not generic anymore, let ``semTypeNode`` produce a
+      # type with the not-nil modifier applied
+      return makeTypeDesc(c, semTypeNode(c, traitCall, nil)).toNode(traitCall.info)
+    else:
+      return typeWithSonsResult(tyNot, @[operand])
   of "typeToString":
     var prefer = preferTypeName
     if traitCall.len >= 2:
diff --git a/compiler/sem/sempass2.nim b/compiler/sem/sempass2.nim
index 0df51198755..713154ac4b5 100644
--- a/compiler/sem/sempass2.nim
+++ b/compiler/sem/sempass2.nim
@@ -1313,8 +1313,10 @@ proc track(tracked: PEffects, n: PNode) =
       if iterCall[1].typ != nil and
          iterCall[1].typ.skipTypes(abstractVar).kind notin {tyVarargs, tyOpenArray}:
         createTypeBoundOps(tracked, iterCall[1].typ, iterCall[1].info)
-    
+
     if tracked.owner.kind != skMacro and iterCall.kind in nkCallKinds and
+       iterCall[0].typ != nil and # XXX: untyped AST can reach here due to
+                                  # semTypeNode discarding the typed AST
        iterCall[0].typ.skipTypes(abstractInst).callConv == ccClosure:
       # the loop is a for-loop over a closure iterator. Lift the hooks for
       # the iterator
@@ -1438,11 +1440,6 @@ proc track(tracked: PEffects, n: PNode) =
       track(tracked, n[i])
 
     inc tracked.leftPartOfAsgn
-  of nkBlockType, nkStmtListType:
-    # TODO: it's a minor breaking change (macros can observe it via
-    #       `getImpl`), but these nodes should instead be folded into
-    #        ``nkType`` nodes by ``semfold``
-    discard
   of nkBindStmt, nkMixinStmt, nkImportStmt, nkImportExceptStmt, nkExportStmt,
      nkExportExceptStmt, nkFromStmt:
     # a declarative statement that is not relevant to the analysis. Report
diff --git a/compiler/sem/semtempl.nim b/compiler/sem/semtempl.nim
index be499f5cb9d..e8f86c3e2a1 100644
--- a/compiler/sem/semtempl.nim
+++ b/compiler/sem/semtempl.nim
@@ -720,7 +720,7 @@ proc semTemplBody(c: var TemplCtx, n: PNode): PNode =
       hasError = true
 
     closeScope(c)
-  of nkBlockStmt, nkBlockExpr, nkBlockType:
+  of nkBlockStmt, nkBlockExpr:
     checkSonsLen(n, 2, c.c.config)
     openScope(c)
     case n[0].kind
diff --git a/compiler/sem/semtypes.nim b/compiler/sem/semtypes.nim
index 0e572663b9b..9076eb9d078 100644
--- a/compiler/sem/semtypes.nim
+++ b/compiler/sem/semtypes.nim
@@ -1675,18 +1675,6 @@ proc semStmtListType(c: PContext, n: PNode, prev: PType): PType =
   else:
     result = nil
 
-proc semBlockType(c: PContext, n: PNode, prev: PType): PType =
-  inc(c.execCon.nestedBlockCounter)
-  checkSonsLen(n, 2, c.config)
-  openScope(c)
-  if n[0].kind notin {nkEmpty, nkSym}:
-    addDecl(c, newSymS(skLabel, n[0], c))
-  result = semStmtListType(c, n[1], prev)
-  n[1].typ = result
-  n.typ = result
-  closeScope(c)
-  dec(c.execCon.nestedBlockCounter)
-
 proc semGenericParamInInvocation(c: PContext, n: PNode): PType =
   result = semTypeNode(c, n, nil)
   n.typ = makeTypeDesc(c, result)
@@ -2124,7 +2112,11 @@ proc semTypeNode(c: PContext, n: PNode, prev: PType): PType =
             # I suggest revisiting this once the language decides on whether
             # `not nil` should be the default. We can then map nilable refs
             # to other types such as `Option[T]`.
-            result = makeTypeFromExpr(c, newTree(nkStmtListType, n.copyTree))
+            var copyN = n.copyTree
+            # the `not` procedure expects a typedesc, so make sure the
+            # operand is a `tyTypeDesc`
+            copyN[1].typ = makeTypeDesc(c, result)
+            result = makeTypeFromExpr(c, copyN)
           of NilableTypes + {tyGenericInvocation, tyForward}:
             result = freshType(c, result, prev)
             result.flags.incl(tfNotNil)
@@ -2162,7 +2154,7 @@ proc semTypeNode(c: PContext, n: PNode, prev: PType): PType =
   of nkWhenStmt:
     var whenResult = semWhen(c, n, false)
     if whenResult.kind == nkStmtList:
-      whenResult.transitionSonsKind(nkStmtListType)
+      whenResult.transitionSonsKind(nkStmtListExpr)
     result = semTypeNode(c, whenResult, prev)
   of nkBracketExpr:
     checkMinSonsLen(n, 2, c.config)
@@ -2312,8 +2304,7 @@ proc semTypeNode(c: PContext, n: PNode, prev: PType): PType =
     else:
       result = semProcTypeWithScope(c, n, prev, skProc)
   of nkEnumTy: result = semEnum(c, n, prev)
-  of nkStmtListType: result = semStmtListType(c, n, prev)
-  of nkBlockType: result = semBlockType(c, n, prev)
+  of nkStmtListExpr: result = semStmtListType(c, n, prev)
   of nkError:
     localReport(c.config, n, reportSem rsemTypeExpected)
     result = newOrPrevType(tyError, prev, c)
diff --git a/lib/core/macros.nim b/lib/core/macros.nim
index a16058ba786..f5a731cb857 100644
--- a/lib/core/macros.nim
+++ b/lib/core/macros.nim
@@ -92,8 +92,8 @@ type
     nnkIncludeStmt,
     nnkBindStmt, nnkMixinStmt, nnkUsingStmt,
     nnkCommentStmt, nnkStmtListExpr, nnkBlockExpr,
-    nnkStmtListType, nnkBlockType,
-    nnkWith, nnkWithout,
+    nnkWith = skipEnumValue(nimskullNoNkStmtListTypeAndNkBlockType, nnkBlockExpr, 2),
+    nnkWithout,
     nnkTypeOfExpr, nnkObjectTy,
     nnkTupleTy, nnkTupleClassTy, nnkTypeClassTy, nnkStaticTy,
     nnkRecList, nnkRecCase, nnkRecWhen,
diff --git a/lib/system.nim b/lib/system.nim
index f7f5b269c75..550b60ac13c 100644
--- a/lib/system.nim
+++ b/lib/system.nim
@@ -3043,3 +3043,6 @@ when defined(nimDebugUtils):
     {.define(nimCompilerDebug).}
     n
     {.undef(nimCompilerDebug).}
+
+proc `not`*[T: ref or ptr](a: typedesc[T], b: typeof(nil)): typedesc {.magic: "TypeTrait", noSideEffect.}
+  ## Constructs a `not nil` type.
diff --git a/tests/lang_objects/metatype/ttyped_type_ast.nim b/tests/lang_objects/metatype/ttyped_type_ast.nim
new file mode 100644
index 00000000000..e89ffc92139
--- /dev/null
+++ b/tests/lang_objects/metatype/ttyped_type_ast.nim
@@ -0,0 +1,33 @@
+discard """
+  description: "Ensure no untyped AST slips through to later compiler stages"
+  action: compile
+  knownIssue: '''When the typeof is analyzed by semTypeNode due to elementType
+having a typedesc return type, the typed AST is discarded because semTypeNode
+only returns a PType and thus the AST passed to isTyped stays untyped.
+  '''
+"""
+
+import macros
+
+template elementType*(a: untyped): typedesc =
+  typeof(block: (for ai in a: ai))
+
+iterator myiter3(): int = yield 10
+
+proc collectSyms(n: NimNode): seq[NimNode] =
+  if n.kind == nnkSym:
+    result = @[n]
+  else:
+    for c in n:
+      result.add collectSyms(c)
+
+macro isTyped(a: typed): bool =
+  newLit(collectSyms(a).len == 3)
+
+static:
+  assert: isTyped:
+    typeof(block: (for ai in myiter3(): ai))
+
+  # knownIssue; see above
+  assert: isTyped:
+    elementType(myiter3())

From 1854db10bf8b35214222d69dbf90c21d7e8caf5f Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Thu, 7 Mar 2024 04:16:48 +0100
Subject: [PATCH 024/169] std/asyncjs: value passed to `catch` is always
 `Error` (#1224)

## Summary

* NimSkull exceptions leaving an `.async` procedure are automatically
  turned into JavaScript `Error`s
* errors retrieved by `catch` that were originally NimSkull exceptions
  always use only the original exception's message (no "uncaught
  exception" prefix)

## Details

* the `.async` macro wraps the body in a `try`/`except` that turns
  catchable errors into `Error`s
* depending on whether a procedure is called within a `try` (at
  run-time), `raise` either raises a NimSkull exception or a JavaScript
  error
* the `tasyncjs_pragma` test is updated to not rely on the transformed
  body being a statement list
---
 lib/js/asyncjs.nim           | 12 ++++++++++++
 tests/js/tasyncjs.nim        | 21 ++++++++++++++++++++-
 tests/js/tasyncjs_bad.nim    |  2 +-
 tests/js/tasyncjs_pragma.nim |  3 +--
 4 files changed, 34 insertions(+), 4 deletions(-)

diff --git a/lib/js/asyncjs.nim b/lib/js/asyncjs.nim
index 7193beff9db..ac61c1a34c1 100644
--- a/lib/js/asyncjs.nim
+++ b/lib/js/asyncjs.nim
@@ -73,6 +73,8 @@ type
   PromiseJs* {.importjs: "Promise".} = ref object
   ## A JavaScript Promise.
 
+proc reraise(e: ref CatchableError) {.asmNoStackFrame, noreturn.} =
+  {.emit: ["throw new Error(", cstring(e.msg), ");"].}
 
 proc replaceReturn(node: var NimNode) =
   var z = 0
@@ -136,6 +138,16 @@ proc generateJsasync(arg: NimNode): NimNode =
       return `jsResolve`()
     result.body.add(voidFix)
 
+  if len(code) > 0:
+    # turn |NimSkull| outgoing exceptions into JavaScript errors
+    let body = result.body
+    result.body = quote:
+      try:
+        `body`
+      except CatchableError as e:
+        # use .noreturn call to make sure `body` being an expression works
+        reraise(e)
+
   let asyncPragma = quote:
     {.codegenDecl: "async function $2($3)".}
 
diff --git a/tests/js/tasyncjs.nim b/tests/js/tasyncjs.nim
index 00753a16c8c..e5be781c5a9 100644
--- a/tests/js/tasyncjs.nim
+++ b/tests/js/tasyncjs.nim
@@ -91,7 +91,26 @@ proc main() {.async.} =
     await fn(7).then((a: int) => (discard)).catch((r: Error) => (reason = r))
     doAssert reason != nil
     doAssert reason.name == "Error"
-    doAssert "foobar: 7" in $reason.message
+    doAssert "foobar: 7" == $reason.message
+
+  block async_within_try:
+    # make sure the object passed to the catch callback is an ``Error`` for
+    # futures created within try scopes
+    var
+      reason: Error
+      promise: Future[int]
+    try:
+      # the try should have no effect on the exception object the ``catch``
+      # gets
+      promise = fn(7)
+    except:
+      doAssert false, "unreachable"
+
+    await promise.catch((r: Error) => (reason = r))
+    doAssert reason != nil
+    doAssert reason.name == "Error"
+    doAssert "foobar: 7" == $reason.message
+
   echo "done" # justified here to make sure we're running this, since it's inside `async`
 
 discard main()
diff --git a/tests/js/tasyncjs_bad.nim b/tests/js/tasyncjs_bad.nim
index b1e5a7bc33f..1817fe3e68d 100644
--- a/tests/js/tasyncjs_bad.nim
+++ b/tests/js/tasyncjs_bad.nim
@@ -1,6 +1,6 @@
 discard """
   exitCode: 1
- outputsub: "Error: unhandled exception: foobar: 13"
+ outputsub: "foobar: 13"
 """
 
 # note: this needs `--unhandled-rejections=strict`, see D20210217T215950
diff --git a/tests/js/tasyncjs_pragma.nim b/tests/js/tasyncjs_pragma.nim
index 2b6f32e92bf..1d54b76b1a8 100644
--- a/tests/js/tasyncjs_pragma.nim
+++ b/tests/js/tasyncjs_pragma.nim
@@ -15,8 +15,7 @@ macro f*(a: untyped): untyped =
   let call = quote:
     echo 0
   result.body.add(call)
-  for child in a.body:
-    result.body.add(child)
+  result.body.add(a.body)
   #echo result.body.repr
 
 proc t* {.async, f.} =

From d8da140afee771dcd1fa89b3196908f686787334 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Fri, 8 Mar 2024 15:39:33 +0100
Subject: [PATCH 025/169] vmgen: use the new-style CGIR (#1225)

## Summary

Use the goto-using version of the CGIR for VM code generation,
removing another usage of the legacy variant. This also fixes the
current exception (`getCurrentException`) being incorrect after
raising from within an `except`, on the VM backend.

## Details

### VM changes

To accommodate the code generator, two small changes are made to the
instruction interface:
* instead of the instruction position from where to extract the
  register, the register index is directly encoded in `ehoLeave` EH
  instructions
* `opcBranch` must now be followed by a `opcTJmp` (jump if true)
  instead of a `opcFJmp` (jump if false)

### Code generator changes

The CGIR's control-flow representation translates more or less directly
to the VM's control-flow instructions, so code generation for it is
straightforward.

* the new-style CGIR is enabled in both `vmbackend` and `vmjit`
* no pre-pass over the CGIR - like the one used by the C code
  generator - is needed
* registers for locals are freed at the end of structured blocks
  (`cnkIf`, `cnkFinally`, `cnkExcept`, and loops)
* EH instructions are emitted as the jump actions are processed
* jump actions for exceptional exits (e.g., `cnkCheckedCall`,
  `cnkRaise`, etc.) are usually the same for regions of code, so a
  caching mechanism is used to prevent repeated EH instruction
  sequences in that case. (not required for correctness)

---------

Co-authored-by: Clyybber <darkmine956@gmail.com>
---
 compiler/vm/vm.nim                 |  12 +-
 compiler/vm/vmbackend.nim          |   4 +-
 compiler/vm/vmgen.nim              | 617 ++++++++++++++---------------
 compiler/vm/vmjit.nim              |   4 +-
 tests/exception/tleave_except2.nim |   2 +-
 tests/exception/treraise2.nim      |   2 +-
 6 files changed, 313 insertions(+), 328 deletions(-)

diff --git a/compiler/vm/vm.nim b/compiler/vm/vm.nim
index f3be5b14b99..f3646516021 100644
--- a/compiler/vm/vm.nim
+++ b/compiler/vm/vm.nim
@@ -605,10 +605,8 @@ proc runEh(t: var VmThread, c: var TCtx): Result[PrgCtr, VmException] =
         t.ehStack.setLen(t.ehStack.len - 1)
       of 1:
         # discard the parent thread if it's associated with the provided
-        # ``finally``
-        let instr = c.code[instr.b]
-        vmAssert instr.opcode == opcFinallyEnd
-        let (fromEh, b) = decodeControl(t.getReg(instr.regA).intVal)
+        # control register
+        let (fromEh, b) = decodeControl(t.getReg(instr.b.TRegister).intVal)
         if fromEh:
           vmAssert b.int == t.ehStack.high - 1
           swap(tos, t.ehStack[^2])
@@ -2072,7 +2070,7 @@ proc rawExecute(c: var TCtx, t: var VmThread, pc: var int): YieldReason =
       inc pc, rbx
       handleJmpBack()
     of opcBranch:
-      # we know the next instruction is a 'fjmp':
+      # we know the next instruction is a 'tjmp':
       let value = c.constants[instr.regBx-wordExcess]
 
       checkHandle(regs[ra])
@@ -2090,11 +2088,11 @@ proc rawExecute(c: var TCtx, t: var VmThread, pc: var int): YieldReason =
       else:
         unreachable(value.kind)
 
-      assert c.code[pc+1].opcode == opcFJmp
+      assert c.code[pc+1].opcode == opcTJmp
       inc pc
       # we skip this instruction so that the final 'inc(pc)' skips
       # the following jump
-      if not cond:
+      if cond:
         let instr2 = c.code[pc]
         let rbx = instr2.regBx - wordExcess - 1 # -1 for the following 'inc pc'
         inc pc, rbx
diff --git a/compiler/vm/vmbackend.nim b/compiler/vm/vmbackend.nim
index 280cccafcab..4084bce8c8a 100644
--- a/compiler/vm/vmbackend.nim
+++ b/compiler/vm/vmbackend.nim
@@ -126,7 +126,7 @@ proc generateCodeForProc(c: var CodeGenCtx, idgen: IdGenerator, s: PSym,
   ## Generates and the bytecode for the procedure `s` with body `body`. The
   ## resulting bytecode is emitted into the global bytecode section.
   let
-    body = generateIRLegacy(c.graph, idgen, c.env, s, body)
+    body = generateIR(c.graph, idgen, c.env, s, body)
     r    = genProc(c, s, body)
 
   if r.isOk:
@@ -181,7 +181,7 @@ proc processEvent(c: var GenCtx, mlist: ModuleList, discovery: var DiscoveryData
   of bekPartial:
     let p = addr mgetOrPut(partial, evt.id, PartialProc(sym: evt.sym))
     discard merge(p.body):
-      generateIRLegacy(c.graph, idgen, c.gen.env, evt.sym, evt.body)
+      generateIR(c.graph, idgen, c.gen.env, evt.sym, evt.body)
   of bekProcedure:
     # a complete procedure became available
     let r = generateCodeForProc(c.gen, idgen, evt.sym, evt.body)
diff --git a/compiler/vm/vmgen.nim b/compiler/vm/vmgen.nim
index 8744d567cf2..8aeafa6d87a 100644
--- a/compiler/vm/vmgen.nim
+++ b/compiler/vm/vmgen.nim
@@ -76,7 +76,7 @@ import
 import std/options as std_options
 
 from compiler/backend/compat import getInt, isOfBranch, skipConv, lastSon,
-  getMagic, pick
+  getMagic, pick, numArgs
 
 from std/bitops import bitor
 
@@ -127,15 +127,25 @@ type
 
   BlockKind = enum
     bkBlock   ## labeled block
-    bkTry     ## the ``try`` and ``except`` clause of a ``finally``-having
-              ## try statement
     bkExcept  ## ``except`` clause
     bkFinally ## ``finally`` clause
 
+  BlockInfo = object
+    oldRegisterCount: int
+      ## upper bound of allocated registers at the beginning of the block
+    label: BlockId
+    case kind: BlockKind
+    of bkBlock, bkFinally:
+      start: TPosition
+    of bkExcept:
+      discard
+
   BProc = object
-    blocks: seq[tuple[kind: BlockKind, exits: seq[TPosition], cr: TRegister]]
-      ## for each block, the jump instructions targeting the block's exit.
-      ## These need to be patched once the code for the block is generated
+    blocks: seq[BlockInfo]
+      ## information about each block-like construct. Forms a stack
+    exits: seq[tuple[label: BlockId, pos: TPosition]]
+      ## jump instructions that need patching once the target instruction is
+      ## known
     sym: PSym
     body: Body
       ## the full body of the current procedure/statement/expression
@@ -151,12 +161,12 @@ type
     baseOffset: TPosition
       ## the bytecode position that instruction-to-EH mappings need to be
       ## relative to
-    hasEh: int
-      ## > 0 when some form of exception handling exists for the current
-      ## node
-    raiseExits: int
-      ## used to establish a relation between two points during code
-      ## generation (e.g., "are there new exceptional exits since X?")
+    ehExits: seq[tuple[label: BlockId, pos: uint32]]
+      ## EH instructions that need patching once position and type of the
+      ## target EH instruction is known
+    lastPath: CgNode
+      ## the path corresponding to the previously emitted EH instruction
+      ## sequence, or nil. Prevents excessive EH code duplication
 
   CodeGenCtx* = object
     ## Bundles all input, output, and other contextual data needed for the
@@ -438,14 +448,65 @@ proc patchSetEh(c: var TCtx, p: TPosition) =
   # opcode and regA stay the same, only regB is updated:
   c.code[p] = TInstr(instr.TInstrType or TInstrType(fin shl regBShift))
 
-proc registerEh(c: var TCtx) =
-  ## If a jump-list designated for exception handling is active, associates it
-  ## with the next-emitted instruction.
-  if c.prc.hasEh > 0:
-    inc c.prc.raiseExits
-    let pos = c.code.len
-    c.ehTable.add:
-      (uint32(pos - c.prc.baseOffset.int), c.ehCode.len.uint32)
+proc genEhCode(c: var TCtx, n: CgNode)
+
+proc registerEh(c: var TCtx, n: CgNode) =
+  ## Emits an exception-handling table entry for the instruction at the head
+  ## of the instruction list (i.e., the one emitted next). `n` must be either
+  ## a label or target list.
+  proc isEqual(a, b: CgNode): bool =
+    ## Compares two label-like nodes for equality.
+    if a.kind != b.kind:
+      return false
+
+    case a.kind
+    of cnkLeave:  a[0].label == b[0].label
+    of cnkLabel:  a.label == b.label
+    of cnkResume: true
+    else:
+      unreachable()
+
+  proc comparePaths(a, b: CgNode): int =
+    ## Returns the number of actions `a` and `b` share at the end. 0
+    ## means that both share no trailing actions.
+    let (a, b) =
+      if a.kind == cnkTargetList: (a, b)
+      else:                       (b, a)
+    # because of the above swap, if `a` is not a list of targets, then neither
+    # is `b`
+    if a.kind == cnkTargetList:
+      if b.kind == cnkLabel:
+        result = if isEqual(a[^1], b): 1 else: 0
+      else:
+        result = min(a.len, b.len)
+        for i in 1..result:
+          if not isEqual(a[^i], b[^i]):
+            return i - 1
+        # one target list is a subset of the other
+    else:
+      result = if isEqual(a, b): 1 else: 0
+
+  let pos = uint32(c.code.len - c.prc.baseOffset.int)
+  case n.kind
+  of cnkLabel:
+    # un-intercepted jump
+    if c.prc.lastPath == nil or comparePaths(c.prc.lastPath, n) == 0:
+      genEhCode(c, n)
+
+    c.ehTable.add (pos, uint32(c.ehCode.len - 1))
+  of cnkTargetList:
+    if n.len == 1 and n[0].kind == cnkResume:
+      # if there's nothing responding to the exception within the current
+      # procedure, no EH code needs to be associated with the instruction
+      return
+
+    if c.prc.lastPath == nil or comparePaths(n, c.prc.lastPath) < n.len:
+      # cannot re-use the previous instruction sequence
+      genEhCode(c, n)
+
+    c.ehTable.add (pos, uint32(c.ehCode.len - n.len))
+  else:
+    unreachable(n.kind)
 
 proc getSlotKind(t: PType): TSlotKind =
   case t.skipTypes(IrrelevantTypes+{tyRange}).kind
@@ -633,33 +694,17 @@ proc whichAsgnOpc(t: PType): TOpcode {.used.} =
   else:
     opcAsgnComplex
 
-proc genRepeat(c: var TCtx; n: CgNode) =
-  # lab1:
-  #   body
-  #   jmp lab1
-  # lab2:
-  let lab1 = c.genLabel
-  c.gen(n[0])
-  c.jmpBack(n, lab1)
-
-func initBlock(kind: BlockKind, cr = TRegister(0)): typeof(BProc().blocks[0]) =
-  ## NOTE: this procedure is a workaround for a bug of the current csources
-  ## compiler. `isTry` being a literal bool value would lead to run-time
-  ## crashes.
-  result = (kind, @[], cr)
-
-proc genBlock(c: var TCtx; n: CgNode) =
-  let oldRegisterCount = c.prc.regInfo.len
-
-  c.prc.blocks.add initBlock(bkBlock) # push a new block
-  c.gen(n[1])
-  # fixup the jumps:
-  for pos in c.prc.blocks[^1].exits.items:
-    c.patch(pos)
-  # pop the block again:
-  c.prc.blocks.setLen(c.prc.blocks.len - 1)
-
-  for i in oldRegisterCount..<c.prc.regInfo.len:
+func pushBlock(c: var TCtx, blk: sink BlockInfo) =
+  blk.oldRegisterCount = c.prc.regInfo.len
+  # XXX: ^^ the register list only grows, meaning that its length doesn't
+  #      represent the allocated upper bound... Freeing register used for
+  #      locals is broken in general
+  c.prc.blocks.add blk
+
+proc popBlock(c: var TCtx) =
+  let blk = c.prc.blocks.pop()
+  # free all register allocated for locals part of the block:
+  for i in blk.oldRegisterCount..<c.prc.regInfo.len:
       when not defined(release):
         if c.prc.regInfo[i].inUse and c.prc.regInfo[i].kind in {slotTempUnknown,
                                   slotTempInt,
@@ -670,36 +715,62 @@ proc genBlock(c: var TCtx; n: CgNode) =
           doAssert false, "leaking temporary " & $i & " " & $c.prc.regInfo[i].kind
       c.prc.regInfo[i] = RegInfo(kind: slotEmpty)
 
-proc blockLeaveActions(c: var TCtx, info: CgNode, target: Natural) =
-  ## Emits the bytecode for leaving a block. `target` is the index of the
-  ## block to exit.
-  # perform the leave actions from innermost to outermost
-  for i in countdown(c.prc.blocks.high, target):
-    case c.prc.blocks[i].kind
-    of bkBlock:
-      discard "no leave action to perfrom"
-    of bkTry:
-      # enter the finally clause
-      c.prc.blocks[i].exits.add c.xjmp(info, opcEnter)
-    of bkExcept:
-      # leave the except clause
-      c.gABI(info, opcLeave, 0, 0, 0)
-    of bkFinally:
-      # leave the finally clause
-      c.gABI(info, opcLeave, c.prc.blocks[i].cr, 0, 1)
+func controlReg(c: TCtx, blk: BlockInfo): TRegister =
+  c.code[blk.start.int].regA
+
+proc genGoto(c: var TCtx; n: CgNode) =
+  ## Generates and emits the code for a ``cnkGoto``. Depending on whether it's
+  ## an intercepted jump, the goto can translate to more than one instruction.
+  let
+    target = n[0]
+    info = n.info
+  case target.kind
+  of cnkLabel:
+    c.prc.exits.add (target.label, c.xjmp(n, opcJmp))
+  of cnkTargetList:
+    # there are some leave actions
+    for i in 0..<target.len-1:
+      let it = target[i]
+      case it.kind
+      of cnkLabel:
+        # enter the finally section:
+        c.prc.exits.add (it.label, c.xjmp(n, opcEnter))
+      of cnkLeave:
+        # leave the except or finally section:
+        for blk in c.prc.blocks.items:
+          if blk.label == it[0].label:
+            case blk.kind
+            of bkExcept:
+              c.gABI(info, opcLeave, 0, 0, 0)
+            of bkFinally:
+              c.gABI(info, opcLeave, c.controlReg(blk), 0, 1)
+            else:
+              unreachable()
+            break
+      else:
+        unreachable()
+
+    # the jump to the final destination
+    c.prc.exits.add (target[^1].label, c.xjmp(n, opcJmp))
+  else:
+    unreachable()
 
-proc genBreak(c: var TCtx; n: CgNode) =
-  # find the labeled block corresponding to the block ID:
-  var i, b = 0
-  while b < n[0].label.int or c.prc.blocks[i].kind != bkBlock:
-    b += ord(c.prc.blocks[i].kind == bkBlock)
-    inc i
 
-  blockLeaveActions(c, n, i)
+iterator take[T](s: var seq[T], label: BlockId): lent T =
+  ## Returns all items with `label` and removes them afterwards.
+  var i = 0
+  while i < s.len:
+    if s[i].label == label:
+      yield s[i]
+      # remove the item from the list (order within the list doesn't
+      # matter)
+      s.del(i)
+    else:
+      inc i
 
-  # emit the actual jump to the end of targeted labeled block:
-  let label = c.xjmp(n, opcJmp)
-  c.prc.blocks[i].exits.add label
+proc patch(c: var TCtx, label: BlockId) =
+  for it in take(c.prc.exits, label):
+    c.patch(it.pos)
 
 proc genIf(c: var TCtx, n: CgNode) =
   #  if (!expr1) goto lab1;
@@ -708,16 +779,16 @@ proc genIf(c: var TCtx, n: CgNode) =
   block:
       let it = n
       withDest(tmp):
-        var elsePos: TPosition
+        var start: TPosition
         if isNotOpr(c.env, it[0]):
           c.gen(it[0][1], tmp)
-          elsePos = c.xjmp(it[0][1], opcTJmp, tmp) # if true
+          start = c.xjmp(it[0][1], opcTJmp, tmp) # if true
         else:
           c.gen(it[0], tmp)
-          elsePos = c.xjmp(it[0], opcFJmp, tmp) # if false
+          start = c.xjmp(it[0], opcFJmp, tmp) # if false
 
-      c.gen(it[1]) # then part
-      c.patch(elsePos)
+      # the 'if' opens a block, which the corresponding 'end' closes
+      pushBlock(c): BlockInfo(kind: bkBlock, label: it[1].label, start: start)
 
 # XXX `rawGenLiteral` should be a func, but can't due to `internalAssert`
 proc rawGenLiteral(c: var TCtx, val: sink VmConstant): int =
@@ -858,18 +929,7 @@ proc unused(c: TCtx; n: CgNode; x: TDest) {.inline.} =
     fail(n.info, vmGenDiagNotUnused, PNode(nil))
 
 proc genCase(c: var TCtx; n: CgNode) =
-  #  if (!expr1) goto lab1;
-  #    thenPart
-  #    goto LEnd
-  #  lab1:
-  #  if (!expr2) goto lab2;
-  #    thenPart2
-  #    goto LEnd
-  #  lab2:
-  #    elsePart
-  #  Lend:
   let selType = n[0].typ.skipTypes(abstractVarRange)
-  var endings: seq[TPosition] = @[]
   withDest(tmp):
     c.gen(n[0], tmp)
 
@@ -877,15 +937,12 @@ proc genCase(c: var TCtx; n: CgNode) =
     for i in 1..<n.len:
       let branch = n[i]
       if isOfBranch(branch):
-        var elsePos: TPosition
         if selType.kind == tyString:
           # special handling for string case statements: generate a sequence
           # of comparisons
           let
             cond = c.getTemp(slotTempInt)
-            # we re-use the `endings` list for collecting the jumps to the
-            # body:
-            start = endings.len
+            exit = branch[^1].label
 
           for j in 0..<branch.len - 1:
             let
@@ -893,31 +950,20 @@ proc genCase(c: var TCtx; n: CgNode) =
               val = c.genx(it)
             # generate: ``if tmp == label: goto body``
             c.gABC(it, opcEqStr, cond, tmp, val)
-            endings.add c.xjmp(it, opcTJmp, cond)
+            c.prc.exits.add (exit, c.xjmp(it, opcTJmp, cond))
             c.freeTemp(val)
 
           c.freeTemp(cond)
-          # emit a jump to the next branch:
-          elsePos = c.xjmp(branch.lastSon, opcJmp)
-          # patch the jumps to the body:
-          for j in start..<endings.len:
-            c.patch(endings[j])
-          endings.setLen(start)
         else:
           # branch tmp, codeIdx
-          # fjmp   elseLabel
+          # tjmp   thenLabel
           let b = genBranchLit(c, branch, selType)
           c.gABx(branch, opcBranch, tmp, b)
-          elsePos = c.xjmp(branch.lastSon, opcFJmp, tmp)
+          c.prc.exits.add (branch[^1].label, c.xjmp(branch, opcTJmp, tmp))
 
-        c.gen(branch.lastSon)
-        if i < n.len-1:
-          endings.add(c.xjmp(branch.lastSon, opcJmp, 0))
-        c.patch(elsePos)
       else:
         # else stmt:
-        c.gen(branch[0])
-  for endPos in endings: c.patch(endPos)
+        c.prc.exits.add (branch[0].label, c.xjmp(branch.lastSon, opcJmp))
 
 proc genType(c: var TCtx; typ: PType; noClosure = false): int =
   ## Returns the ID of `typ`'s corresponding `VmType` as an `int`. The
@@ -942,179 +988,104 @@ proc genTypeInfo(c: var TCtx, typ: PType): int =
 
   internalAssert(c.config, result <= regBxMax, "")
 
-proc genExcept(c: var TCtx, n: CgNode, firstExit: int) =
-  ## Emits the code and EH code for the 'except' branches of a ``cnkTry``
-  ## statement (`n`).
-  let startEh = c.ehCode.len.uint32
-  c.prc.raiseExits = firstExit # treat all open exceptional exits as handled
-
-  # for a simpler implementation, two passes are used. First emit the
-  # EH instructions
-  let last = n.len - 1 - ord(n[^1].kind == cnkFinally)
-  for i in 1..last:
-    let it = n[i]
-    if it.len > 1:
-      # exception handler with filter
-      for j in 0..<it.len - 1:
-        assert it[j].kind == cnkType
-        let typ = c.genType(it[j].typ.skipTypes(abstractPtrs))
-        c.ehCode.add (ehoExceptWithFilter, uint16 typ, 0'u32)
-    else:
-      # catch-all exception handler
-      c.ehCode.add (ehoExcept, 0'u16, 0'u32)
-
-  # closing the chain, if necessary, is done once the finally section is
-  # generated
-
-  # second pass: emit the actual exception handler bodies
-  var
-    instr = startEh
-    hasRaiseExits = false
-    exits: seq[TPosition]
-
-  for i in 1..last:
-    let start = c.genLabel()
-    # patch the 'Except'/'ExceptWithFilter' targets
-    for _ in 0..<max(n[i].len-1, 1):
-      c.ehCode[instr].b = uint32 start
-      inc instr
-
-    # body:
-    c.prc.blocks.add initBlock(bkExcept)
-    c.gen(n[i][^1])
-    c.gABI(n[i], opcLeave, 0, 0, 0) # pop the exception
-    c.prc.blocks.setLen(c.prc.blocks.len - 1)
-
-    if c.prc.raiseExits > firstExit:
-      # all exceptional exits from within the ``except`` need to close the
-      # thread that entered it
-      c.ehCode.add (ehoNext, 0'u16, 2'u32)
-      c.ehCode.add (ehoLeave, 0'u16, 0'u32)
-      c.prc.raiseExits = firstExit
-      hasRaiseExits = true
-
-    if i < last:
-      # emit a jump past the following handlers
-      exits.add c.xjmp(n[i], opcJmp)
-
-  for endPos in exits.items:
-    c.patch(endPos)
-
-  if n[last].len > 1 or hasRaiseExits:
-    # exceptional control-flow possibly leaves the handler section (because
-    # there's no catch-all handler), OR one of the handlers potentially
-    # raises
-    inc c.prc.raiseExits
-
-proc genFinally(c: var TCtx, n: CgNode, firstExit: int) =
-  ## Generates and emits the code for a ``cnkFinally`` clause.
-  let
-    enteredViaExcept = c.prc.raiseExits > firstExit
-    startEh = c.ehCode.len
-
-  # patch the 'Enter' instructions entering the finalizer and then pop the
-  # block
-  for pos in c.prc.blocks[^1].exits.items:
-    c.patch(pos)
-  c.prc.blocks.setLen(c.prc.blocks.len - 1)
-
-  # omit the EH 'Finally' instruction if there are no exceptional exits
-  if enteredViaExcept:
-    c.ehCode.add (ehoFinally, 0'u16, uint32 c.genLabel())
-    # add a tentative 'Next' instruction; it's removed again if not needed
+proc genEhCodeAux(c: var TCtx, n: CgNode) =
+  ## Emits the EH instruction for a single action of a jump target list.
+  case n.kind
+  of cnkLeave:
+    let label = n[0].label
+    # which except or finally block?
+    for it in c.prc.blocks.items:
+      if it.label == label:
+        case it.kind
+        of bkExcept:
+          c.ehCode.add (ehoLeave, 0'u16, 0'u32)
+        of bkFinally:
+          c.ehCode.add (ehoLeave, 1'u16, uint32 c.controlReg(it))
+        else:
+          unreachable()
+        break
+  of cnkLabel:
+    # we don't know yet whether this is a finally or exception handler; the
+    # instruction is patched later
+    c.prc.ehExits.add (n.label, c.ehCode.len.uint32)
     c.ehCode.add (ehoNext, 0'u16, 0'u32)
-    # all exceptional threads are handled
-    c.prc.raiseExits = firstExit
+  of cnkResume:
+    # resume means to resume exception handling in the caller (if possible at
+    # run-time)
+    c.ehCode.add (ehoEnd, 0'u16, 0'u32)
+  else:
+    unreachable()
 
-  let
-    control = c.getTemp(slotTempInt)
-    start = c.xjmp(n, opcFinally, control)
-
-  # generate the code for the body
-  c.prc.blocks.add initBlock(bkFinally, control)
-  c.prc.hasEh += ord(enteredViaExcept)
-  c.gen(n[0])
-  c.prc.hasEh -= ord(enteredViaExcept)
-  c.prc.blocks.setLen(c.prc.blocks.len - 1)
-
-  if enteredViaExcept:
-    if c.prc.raiseExits > firstExit:
-      # the 'finally' could be part of an active exceptional thread, and
-      # the 'finally' clause has an exceptional exit. Patch the earlier
-      # 'Next' instruction to point *past* the 'Leave'
-      c.ehCode[startEh + 1].b = uint32(c.ehCode.len - (startEh+1) + 1)
-      c.ehCode.add (ehoLeave, 1'u16, uint32 c.genLabel())
-    else:
-      # remove the unneeded 'Next'
-      c.ehCode.setLen(startEh + 1)
+proc genEhCode(c: var TCtx, n: CgNode) =
+  ## Emits the EH instruction sequence for a jump action description.
+  case n.kind
+  of cnkLabel:
+    genEhCodeAux(c, n)
+  of cnkTargetList:
+    for i in 0..<n.len:
+      genEhCodeAux(c, n[i])
+  else:
+    unreachable()
+  # remember the jump target description the EH code sequence came from
+  c.prc.lastPath = n
+
+proc genExcept(c: var TCtx, n: CgNode) =
+  ## Emits the EH code for a ``cnkExcept``.
+
+  # simple but high-impact optimization: if the last EH exit we need to patch
+  # is the preceding EH instruction, eliminate the instruction (it'd just be
+  # a single instruction jump)
+  if c.prc.ehExits.len > 0 and
+     c.prc.ehExits[^1] == (n[0].label, c.ehCode.high.uint32):
+    c.ehCode.setLen(c.ehCode.len - 1)
+    c.prc.ehExits.setLen(c.prc.ehExits.len - 1)
+
+  # patch all EH instructions targeting the handler:
+  for it in take(c.prc.ehExits, n[0].label):
+    c.ehCode[it.pos] = (ehoNext, 0'u16, c.ehCode.len.uint32 - it.pos)
+
+  pushBlock(c): BlockInfo(kind: bkExcept, label: n[0].label)
+
+  let pc = uint32 c.genLabel()
+  if n.len > 1:
+    # exception handler with filter
+    for i in 1..<n.len-1:
+      let it = n[i]
+      assert it.kind == cnkType
+      let typ = c.genType(it.typ.skipTypes(abstractPtrs))
+      c.ehCode.add (ehoExceptWithFilter, uint16 typ, pc)
+
+    # emit the follow-up EH code
+    genEhCode(c, n[^1])
+  else:
+    # catch-all exception handler
+    c.ehCode.add (ehoExcept, 0'u16, pc)
+    # new EH code was emitted, invalidating the cached path:
+    c.prc.lastPath = nil
 
-    # continue the exceptional control-flow
-    inc c.prc.raiseExits
+proc genFinally(c: var TCtx, n: CgNode) =
+  let pc = c.genLabel()
 
-  c.gABx(n, opcFinallyEnd, control, 0)
-  c.patch(start)
-  c.freeTemp(control)
+  # update all EH instructions targeting the finally:
+  for it in take(c.prc.ehExits, n[0].label):
+    c.ehCode[it.pos] = (ehoFinally, 0'u16, uint32 pc)
 
-proc genTry(c: var TCtx; n: CgNode) =
-  let
-    hasExcept = n[1].kind == cnkExcept
-    hasFinally = n[^1].kind == cnkFinally
-    startEh = c.ehCode.len
-    firstExit = c.prc.raiseExits
-    needsSkip = firstExit > 0 and c.ehCode[^1].opcode != ehoNext
-
-  if needsSkip:
-    # an unclosed EH chain on the same level exists, e.g.:
-    #   try:
-    #     try: ... finally: ... # <- this is the unclosed chain
-    #     try: ... finally: ...
-    #   except: ...
-    #
-    # make sure the new chain doesn't enter the finally/except clauses emitted
-    # for the current 'try'
-    c.ehCode.add (ehoNext, 0'u16, 0'u32)
+  pushBlock(c): BlockInfo(kind: bkFinally, label: n[0].label, start: pc)
 
-  if hasFinally:
-    c.prc.blocks.add initBlock(bkTry)
-
-  # emit the bytecode for the 'try' body:
-  inc c.prc.hasEh
-  c.gen(n[0])
-  dec c.prc.hasEh
-
-  # omit the exception handlers if there are no exceptional exits from within
-  # the try clause
-  if hasExcept and c.prc.raiseExits > firstExit:
-    let eh = c.xjmp(n, opcJmp) # jump past the exception handling
-    c.prc.hasEh += ord(hasFinally)
-    genExcept(c, n, firstExit)
-    c.prc.hasEh -= ord(hasFinally)
-    c.patch(eh)
-
-  if hasFinally:
-    genFinally(c, n[^1], firstExit)
-
-  if needsSkip:
-    # patch the 'Next' instruction skipping the handler chain
-    c.ehCode[startEh].b = uint32(c.ehCode.len - startEh)
-
-  if c.prc.hasEh == 0:
-    # end the EH chain if there are no more applicable handlers within the
-    # current procedure
-    assert firstExit == 0
-    c.ehCode.add (ehoEnd, 0'u16, 0'u32)
-    c.prc.raiseExits = firstExit
-    # echo "emit: end"
+  let control = c.getTemp(slotTempInt)
+  c.patch(n[0].label) # patch the jumps targeting the finally
+  c.gABC(n, opcFinally, control)
+  # the control register is freed at the end of the finally section
 
 proc genRaise(c: var TCtx; n: CgNode) =
   if n[0].kind != cnkEmpty:
     let dest = c.genx(n[0])
-    c.registerEh()
+    c.registerEh(n[^1])
     c.gABI(n, opcRaise, dest, 0, imm=0)
     c.freeTemp(dest)
   else:
     # reraise
-    c.registerEh()
+    c.registerEh(n[^1])
     c.gABI(n, opcRaise, 0, 0, imm=1)
 
 proc writeBackResult(c: var TCtx, info: CgNode) =
@@ -1133,11 +1104,6 @@ proc writeBackResult(c: var TCtx, info: CgNode) =
       c.gABC(info, opcFastAsgnComplex, dest, tmp)
       c.freeTemp(tmp)
 
-proc genReturn(c: var TCtx; n: CgNode) =
-  blockLeaveActions(c, n, 0)
-  writeBackResult(c, n)
-  c.gABC(n, opcRet)
-
 proc genLit(c: var TCtx; n: CgNode; lit: int; dest: var TDest) =
   ## `lit` is the index of a constant as returned by `genLiteral`
   # load the literal into the *register*
@@ -1174,7 +1140,8 @@ proc genCall(c: var TCtx; n: CgNode; dest: var TDest) =
 
   let
     fntyp = skipTypes(n[0].typ, abstractInst)
-    regCount = n.len + ord(fntyp.callConv == ccClosure)
+    operands = numArgs(n) + 1
+    regCount = operands + ord(fntyp.callConv == ccClosure)
     x = c.prc.getTempRange(regCount, slotTempUnknown)
 
   # generate the code for the callee:
@@ -1187,7 +1154,7 @@ proc genCall(c: var TCtx; n: CgNode; dest: var TDest) =
       # the respective registers directly
       # XXX: dead code, but should be restored
       c.gen(n[0][0], x+0)
-      c.gen(n[0][1], x+n.len)
+      c.gen(n[0][1], x+operands)
     else:
       let
         tmp = c.genx(n[0])
@@ -1196,14 +1163,14 @@ proc genCall(c: var TCtx; n: CgNode; dest: var TDest) =
       # use a full assignment in order for the environment to stay alive during
       # the call
       c.gABC(n[0], opcLdObj, tmp2, tmp, 1)
-      c.gABC(n[0], opcAsgnComplex, x+n.len, tmp2)
+      c.gABC(n[0], opcAsgnComplex, x+operands, tmp2)
       c.freeTemp(tmp2)
       c.freeTemp(tmp)
   else:
     c.gen(n[0], x+0)
 
   # varargs need 'opcSetType' for the FFI support:
-  for i in 1..<n.len:
+  for i in 1..<operands:
     # skip empty arguments (i.e. arguments to compile-time parameters that
     # were omitted):
     if n[i].kind == cnkEmpty:
@@ -1230,11 +1197,13 @@ proc genCall(c: var TCtx; n: CgNode; dest: var TDest) =
       internalAssert(c.config, tfVarargs in fntyp.flags)
       c.gABx(n, opcSetType, r, c.genType(n[i].typ))
 
-  c.registerEh()
+  if n.kind == cnkCheckedCall:
+    c.registerEh(n[^1])
+
   if res.isUnset:
-    c.gABC(n, opcIndCall, 0, x, n.len)
+    c.gABC(n, opcIndCall, 0, x, operands)
   else:
-    c.gABC(n, opcIndCallAsgn, res, x, n.len)
+    c.gABC(n, opcIndCallAsgn, res, x, operands)
 
   if res != dest:
     if dest.isUnset:
@@ -2092,7 +2061,7 @@ proc genMagic(c: var TCtx; n: CgNode; dest: var TDest; m: TMagic) =
   of mEcho:
     unused(c, n, dest)
     let
-      numArgs = n.len - 2
+      numArgs = numArgs(n)-1 # the extra type argument is ignored
       x = c.prc.getTempRange(numArgs, slotTempUnknown)
     for i in 0..<numArgs:
       var r: TRegister = x+i
@@ -2377,28 +2346,27 @@ proc genDiscrVal(c: var TCtx, discr, n: CgNode, oty: PType): TRegister =
     var endings: seq[TPosition] = @[]
     let bIReg = c.getTemp(discr.typ)
     let tmp = c.getTemp(discr.typ)
-    # XXX: this is mostly just copied from `genCase`
     c.gen(n, tmp)
     # branch tmp, codeIdx
-    # fjmp   elseLabel
-
-    # iterate of/else branches
-    for i in 1..<recCase.len:
-      let branch = recCase[i]
-      let bI = i - 1
-      assert bI <= int(high(uint16))
-      if branch.len == 1:
-        # else branch:
-        c.gABx(n, opcLdImmInt, bIReg, bI)
-      else:
-        # of branch
+    # tjmp   target
+
+    # iterate of/else branches and emit the dispatcher:
+    for i, branch in branches(recCase):
+      case branch.kind
+      of nkElse:
+        endings.add c.xjmp(n, opcJmp)
+      of nkOfBranch:
         let b = genBranchLit(c, branch)
         c.gABx(n, opcBranch, tmp, b)
-        let elsePos = c.xjmp(n, opcFJmp, tmp)
-        c.gABx(n, opcLdImmInt, bIReg, bI)
-        if i < recCase.len-1:
-          endings.add(c.xjmp(n, opcJmp, 0))
-        c.patch(elsePos)
+        endings.add c.xjmp(n, opcTJmp)
+      else:
+        unreachable()
+
+    # emit the bodies:
+    for i, branch in branches(recCase):
+      c.patch(endings[i])
+      c.gABx(n, opcLdImmInt, bIReg, i)
+      endings[i] = c.xjmp(n, opcJmp) # jump past the other branches
 
     for endPos in endings: c.patch(endPos)
 
@@ -3153,27 +3121,46 @@ proc gen(c: var TCtx; n: CgNode; dest: var TDest) =
   of cnkCaseStmt:
     unused(c, n, dest)
     genCase(c, n)
-  of cnkRepeatStmt:
-    unused(c, n, dest)
-    genRepeat(c, n)
-  of cnkBlockStmt:
-    unused(c, n, dest)
-    genBlock(c, n)
-  of cnkReturnStmt:
-    genReturn(c, n)
   of cnkRaiseStmt:
     genRaise(c, n)
-  of cnkBreakStmt:
-    genBreak(c, n)
-  of cnkTryStmt:
-    unused(c, n, dest)
-    genTry(c, n)
+  of cnkGotoStmt:
+    genGoto(c, n)
   of cnkStmtList:
+    # XXX: supported for a transition period (``cgir.merge`` creates nested
+    #      statement lists)
     unused(c, n, dest)
     for x in n: gen(c, x)
   of cnkVoidStmt:
     unused(c, n, dest)
     gen(c, n[0])
+  of cnkContinueStmt:
+    # marks the end of a finally section
+    let
+      blk {.cursor.} = c.prc.blocks[^1]
+      control = c.controlReg(blk)
+    # patch the ``opcFinally`` instruction:
+    c.patch(blk.start)
+    c.gABx(n, opcFinallyEnd, control, 0)
+    # now free the control register
+    c.freeTemp(control)
+    popBlock(c)
+  of cnkJoinStmt:
+    c.patch(n[0].label)
+  of cnkLoopJoinStmt:
+    # loops count as blocks too
+    pushBlock(c):
+      BlockInfo(kind: bkBlock, label: n[0].label, start: c.genLabel())
+  of cnkLoopStmt:
+    c.jmpBack(n, c.prc.blocks[^1].start)
+    popBlock(c)
+  of cnkExcept:
+    genExcept(c, n)
+  of cnkFinally:
+    genFinally(c, n)
+  of cnkEnd:
+    if c.prc.blocks[^1].kind == bkBlock:
+      c.patch(c.prc.blocks[^1].start)
+    popBlock(c)
   of cnkHiddenConv, cnkConv:
     genConv(c, n, n.operand, dest)
   of cnkLvalueConv:
@@ -3199,9 +3186,9 @@ proc gen(c: var TCtx; n: CgNode; dest: var TDest) =
     genTypeLit(c, n, n.typ, dest)
   of cnkAsmStmt, cnkEmitStmt:
     unused(c, n, dest)
-  of cnkInvalid, cnkMagic, cnkRange, cnkExcept, cnkFinally, cnkBranch,
+  of cnkInvalid, cnkMagic, cnkRange, cnkBranch,
      cnkBinding, cnkLabel, cnkStmtListExpr, cnkField, cnkToSlice,
-     cnkNewCfNodes:
+     cnkLegacyNodes, cnkResume, cnkTargetList, cnkLeave:
     unreachable(n.kind)
 
 proc initProc(c: TCtx, owner: PSym, body: sink Body): BProc =
@@ -3239,7 +3226,7 @@ proc genExpr*(c: var TCtx; body: sink Body): Result[int, VmGenDiag] =
   var d: TDest = -1
   try:
     let eh = genSetEh(c, n.info)
-    if n.kind == cnkStmtListExpr:
+    if n.kind == cnkStmtList:
       # special case the expression here so that ``gen`` doesn't have to
       for i in 0..<n.len-1:
         c.gen(n[i])
diff --git a/compiler/vm/vmjit.nim b/compiler/vm/vmjit.nim
index 3913cbf5bf2..1b9a96a6e11 100644
--- a/compiler/vm/vmjit.nim
+++ b/compiler/vm/vmjit.nim
@@ -154,7 +154,7 @@ proc generateMirCode(c: var TCtx, env: var MirEnv, n: PNode;
     result.code = finish(bu)
 
 proc generateIR(c: var TCtx, env: MirEnv, body: sink MirBody): Body =
-  backends.generateIRLegacy(c.graph, c.idgen, env, c.module, body)
+  backends.generateIR(c.graph, c.idgen, env, c.module, body)
 
 proc setupRootRef(c: var TCtx) =
   ## Sets up if the ``RootRef`` type for the type info cache. This
@@ -271,7 +271,7 @@ proc genProc(jit: var JitState, c: var TCtx, s: PSym): VmGenResult =
   for _ in discover(jit.gen.env, cp):
     discard "nothing to register"
 
-  let outBody = generateIRLegacy(c.graph, c.idgen, jit.gen.env, s, mirBody)
+  let outBody = generateIR(c.graph, c.idgen, jit.gen.env, s, mirBody)
   echoOutput(c.config, s, outBody)
 
   try:
diff --git a/tests/exception/tleave_except2.nim b/tests/exception/tleave_except2.nim
index 63ee9496ae5..66262b80fd9 100644
--- a/tests/exception/tleave_except2.nim
+++ b/tests/exception/tleave_except2.nim
@@ -3,7 +3,7 @@ discard """
     Ensure that leaving an `except` section by raising an exception properly
     updates the current exception.
   '''
-  knownIssue.js vm: "The current exception is not reset properly"
+  knownIssue.js: "The current exception is not reset properly"
 """
 
 var steps: seq[string]
diff --git a/tests/exception/treraise2.nim b/tests/exception/treraise2.nim
index 30216fe2887..9fd0a841095 100644
--- a/tests/exception/treraise2.nim
+++ b/tests/exception/treraise2.nim
@@ -3,7 +3,7 @@ discard """
     Ensure that raising a caught exception from within an exception handler
     works
   '''
-  knownIssue.js vm: "The current exception is not properly updated"
+  knownIssue.js: "The current exception is not properly updated"
 """
 
 proc manualReraise() =

From 24ba843ac9b41922adcc5f92b4b7881cbfb8a2f1 Mon Sep 17 00:00:00 2001
From: Clyybber <darkmine956@gmail.com>
Date: Sun, 10 Mar 2024 02:43:51 +0100
Subject: [PATCH 026/169] Use more node kind sets (#1226)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

## Summary
* Move `nkLiterals` and its more specific literal subsets to
`ast_types`, and include `nkNilLit` in `nkLiterals`
* Introduce the node kind sets `nkSIntLiterals` and `nkUIntLiterals` for
signed and unsigned integer literals
* Make more use of node kind set constants across the compiler and make
some case statements exhaustive
* Fix a few minor bugs along the way and add tests for them

## Details
* Fix a bug that made `astrepr.cyclicTreeAux` ignore the children of
non-error nodes (only used by the `astrepr.treeRepr` debugging
facility)
* Fix the assertion failures encountered when running the `ic` tests
with a debug or release compiler
* Fix the `locks` pragma erroneously accepting unsigned integers and
char literals (see `tests/pragmas/tlocks.nim`)
* Fix unsigned integers and char literals causing crashes with term
rewriting macros (see
`tests/lang_experimental/trmacros/trmacros_various2.nim`)
* Fix the VM crashing when trying to access the non-existent sons of a
`nnkCommentStmt` node (see `tests/errmsgs/tnnodeindexkind.nim`)

---------

Co-authored-by: zerbina <100542850+zerbina@users.noreply.github.com>
Co-authored-by: Saem Ghani <saemghani+github@gmail.com>
---
 compiler/ast/ast.nim                          |  2 +-
 compiler/ast/ast_query.nim                    | 30 +++++-------
 compiler/ast/ast_types.nim                    | 20 +++++---
 compiler/ast/astalgo.nim                      | 26 +++++-----
 compiler/ast/errorhandling.nim                | 10 ++--
 compiler/ast/filters.nim                      | 20 ++++----
 compiler/ast/trees.nim                        | 42 +++++++++-------
 compiler/ast/treetab.nim                      | 20 ++++----
 compiler/ast/types.nim                        | 16 +++----
 compiler/ast/typesrenderer.nim                |  6 +--
 compiler/front/sexp_reporter.nim              |  6 +--
 compiler/ic/dce.nim                           |  7 ++-
 compiler/ic/ic.nim                            | 24 +++++-----
 compiler/ic/integrity.nim                     |  4 +-
 compiler/ic/packed_ast.nim                    | 25 +++-------
 compiler/mir/mirgen.nim                       |  2 +-
 compiler/mir/proto_mir.nim                    |  2 +-
 compiler/sem/closureiters.nim                 |  6 +--
 compiler/sem/dfa.nim                          |  2 +-
 compiler/sem/evaltempl.nim                    |  2 +-
 compiler/sem/guards.nim                       | 48 ++++++++++---------
 compiler/sem/isolation_check.nim              |  2 +-
 compiler/sem/lookups.nim                      |  4 +-
 compiler/sem/nilcheck.nim                     |  8 ++--
 compiler/sem/parampatterns.nim                |  4 +-
 compiler/sem/patterns.nim                     | 32 ++++++++-----
 compiler/sem/pragmas.nim                      | 19 ++++----
 compiler/sem/semdata.nim                      |  4 +-
 compiler/sem/semexprs.nim                     | 20 ++++----
 compiler/sem/semfields.nim                    |  5 +-
 compiler/sem/semfold.nim                      | 22 ++++-----
 compiler/sem/semgnrc.nim                      |  2 +-
 compiler/sem/semmagic.nim                     |  2 +-
 compiler/sem/semobjconstr.nim                 |  2 +-
 compiler/sem/sempass2.nim                     | 15 +++---
 compiler/sem/semstmts.nim                     |  2 +-
 compiler/sem/semtempl.nim                     |  8 ++--
 compiler/sem/semtypes.nim                     | 16 +++----
 compiler/sem/semtypinst.nim                   |  2 +-
 compiler/sem/sighashes.nim                    | 29 ++++++-----
 compiler/sem/transf.nim                       | 14 +++---
 compiler/sem/typeallowed.nim                  |  4 +-
 compiler/sem/varpartitions.nim                |  8 ++--
 compiler/tools/docgen.nim                     |  2 +-
 compiler/utils/astrepr.nim                    | 18 +++----
 compiler/vm/packed_env.nim                    |  6 +--
 compiler/vm/vm.nim                            | 20 ++++----
 tests/errmsgs/tnnodeindexkind.nim             | 13 ++++-
 .../trmacros/trmacros_various2.nim            | 12 +++++
 tests/pragmas/tlocks.nim                      | 10 ++++
 50 files changed, 337 insertions(+), 288 deletions(-)

diff --git a/compiler/ast/ast.nim b/compiler/ast/ast.nim
index 2c1371263a4..58f01eaf313 100644
--- a/compiler/ast/ast.nim
+++ b/compiler/ast/ast.nim
@@ -482,7 +482,7 @@ template copyNodeImpl(dst, src, processSonsStmt) =
     dst.floatLitBase = src.floatLitBase
   of nkSym: dst.sym = src.sym
   of nkIdent: dst.ident = src.ident
-  of nkStrLit..nkTripleStrLit: dst.strVal = src.strVal
+  of nkStrLiterals: dst.strVal = src.strVal
   of nkEmpty, nkNone, nkNilLit, nkType, nkCommentStmt: discard "no children"
   of nkError: dst.diag = src.diag # do cheap copies
   of nkWithSons: processSonsStmt
diff --git a/compiler/ast/ast_query.nim b/compiler/ast/ast_query.nim
index bfe706246ca..8b613c6c876 100644
--- a/compiler/ast/ast_query.nim
+++ b/compiler/ast/ast_query.nim
@@ -89,12 +89,6 @@ const
 
   nkPragmaCallKinds* = {nkExprColonExpr, nkCall, nkCallStrLit}
 
-  nkIntLiterals*   = {nkCharLit..nkUInt64Lit}
-  nkFloatLiterals* = {nkFloatLit..nkFloat64Lit}
-  nkStrLiterals*   = {nkStrLit..nkTripleStrLit}
-  # TODO: include `nkNilLit` as it's a literal, not the same as `nnkLiterals`
-  nkLiterals*      = nkIntLiterals + nkFloatLiterals + nkStrLiterals
-  
   nkLambdaKinds* = {nkLambda, nkDo}
   declarativeDefs* = {nkProcDef, nkFuncDef, nkMethodDef, nkIteratorDef, nkConverterDef}
   routineDefs* = declarativeDefs + {nkMacroDef, nkTemplateDef}
@@ -357,17 +351,17 @@ proc containsNode*(n: PNode, kinds: TNodeKinds): bool =
   if n == nil: return
   case n.kind
   of nkWithoutSons: result = n.kind in kinds
-  else:
+  of nkWithSons:
     for i in 0..<n.len:
       if n.kind in kinds or containsNode(n[i], kinds): return true
 
 proc hasSubnodeWith*(n: PNode, kind: TNodeKind): bool =
   case n.kind
-  of nkEmpty..nkNilLit, nkFormalParams, nkCommentStmt:
+  of nkWithoutSons - nkError, nkFormalParams:
     result = n.kind == kind
   of nkError:
     result = hasSubnodeWith(n.diag.wrongNode, kind)
-  else:
+  of nkWithSons - nkFormalParams:
     for i in 0..<n.len:
       if (n[i].kind == kind) or hasSubnodeWith(n[i], kind):
         return true
@@ -375,11 +369,9 @@ proc hasSubnodeWith*(n: PNode, kind: TNodeKind): bool =
 
 proc getInt*(a: PNode): Int128 =
   case a.kind
-  of nkCharLit, nkUIntLit..nkUInt64Lit:
+  of nkUIntLiterals:
     result = toInt128(cast[uint64](a.intVal))
-  of nkInt8Lit..nkInt64Lit:
-    result = toInt128(a.intVal)
-  of nkIntLit:
+  of nkSIntLiterals:
     # XXX: enable this assert
     # assert a.typ.kind notin {tyChar, tyUint..tyUInt64}
     result = toInt128(a.intVal)
@@ -388,7 +380,7 @@ proc getInt*(a: PNode): Int128 =
 
 proc getInt64*(a: PNode): int64 {.deprecated: "use getInt".} =
   case a.kind
-  of nkCharLit, nkUIntLit..nkUInt64Lit, nkIntLit..nkInt64Lit:
+  of nkIntLiterals:
     result = a.intVal
   else:
     raiseRecoverableError("cannot extract number from invalid AST node")
@@ -396,7 +388,7 @@ proc getInt64*(a: PNode): int64 {.deprecated: "use getInt".} =
 proc getFloat*(a: PNode): BiggestFloat =
   case a.kind
   of nkFloatLiterals: result = a.floatVal
-  of nkCharLit, nkUIntLit..nkUInt64Lit, nkIntLit..nkInt64Lit:
+  of nkIntLiterals:
     result = BiggestFloat a.intVal
   else:
     raiseRecoverableError("cannot extract number from invalid AST node")
@@ -406,7 +398,7 @@ proc getFloat*(a: PNode): BiggestFloat =
 
 proc getStr*(a: PNode): string =
   case a.kind
-  of nkStrLit..nkTripleStrLit: result = a.strVal
+  of nkStrLiterals: result = a.strVal
   of nkNilLit:
     # let's hope this fixes more problems than it creates:
     result = ""
@@ -418,8 +410,8 @@ proc getStr*(a: PNode): string =
 
 proc getStrOrChar*(a: PNode): string =
   case a.kind
-  of nkStrLit..nkTripleStrLit: result = a.strVal
-  of nkCharLit..nkUInt64Lit: result = $chr(int(a.intVal))
+  of nkStrLiterals: result = a.strVal
+  of nkIntLiterals: result = $chr(int(a.intVal))
   else:
     raiseRecoverableError("cannot extract string from invalid AST node")
     #doAssert false, "getStrOrChar"
@@ -561,7 +553,7 @@ iterator pairs*(n: PNode): tuple[i: int, n: PNode] =
   for i in 0..<n.safeLen: yield (i, n[i])
 
 proc isAtom*(n: PNode): bool {.inline.} =
-  n.kind in nkNone..nkNilLit or n.kind == nkCommentStmt
+  n.kind in nkWithoutSons - nkError
 
 proc isEmptyType*(t: PType): bool {.inline.} =
   ## 'void' and 'typed' types are often equivalent to 'nil' these days:
diff --git a/compiler/ast/ast_types.nim b/compiler/ast/ast_types.nim
index 1f0730c04c0..86be02e8ffa 100644
--- a/compiler/ast/ast_types.nim
+++ b/compiler/ast/ast_types.nim
@@ -244,14 +244,20 @@ type
   TNodeKinds* = set[TNodeKind]
 
 const
+  nkUIntLiterals*  = {nkCharLit, nkUIntLit..nkUInt64Lit}
+    ## Unsigned int literals
+  nkSIntLiterals*  = {nkIntLit..nkInt64Lit}
+    ## Signed int literals
+  nkIntLiterals*   = nkUIntLiterals + nkSIntLiterals
+  nkFloatLiterals* = {nkFloatLit..nkFloat64Lit}
+  nkStrLiterals*   = {nkStrLit..nkTripleStrLit}
+  nkLiterals*      = nkIntLiterals + nkFloatLiterals + nkStrLiterals + nkNilLit
+
   nkWithoutSons* =
     {nkEmpty, nkNone} +
     {nkIdent, nkSym} +
     {nkType} +
-    {nkCharLit..nkUInt64Lit} +
-    {nkFloatLit..nkFloat64Lit} +
-    {nkStrLit..nkTripleStrLit} +
-    {nkNilLit} +
+    nkLiterals +
     {nkError} +
     {nkCommentStmt}
 
@@ -1572,15 +1578,15 @@ type
     info*: TLineInfo
     flags*: TNodeFlags
     case kind*: TNodeKind
-    of nkCharLit..nkUInt64Lit:
+    of nkIntLiterals:
       intVal*: BiggestInt
       intLitBase*: NumericalBase
-    of nkFloatLit..nkFloat64Lit:
+    of nkFloatLiterals:
       floatVal*: BiggestFloat
       floatLitBase*: NumericalBase
         # Once case branches can share fields this can be unified with
         # intLitBase above
-    of nkStrLit..nkTripleStrLit:
+    of nkStrLiterals:
       strVal*: string
     of nkSym:
       sym*: PSym
diff --git a/compiler/ast/astalgo.nim b/compiler/ast/astalgo.nim
index ed20ab768da..7c28ef0f070 100644
--- a/compiler/ast/astalgo.nim
+++ b/compiler/ast/astalgo.nim
@@ -75,12 +75,12 @@ proc skipConvCastAndClosure*(n: PNode): PNode =
 proc sameValue*(a, b: PNode): bool =
   result = false
   case a.kind
-  of nkCharLit..nkUInt64Lit:
-    if b.kind in {nkCharLit..nkUInt64Lit}: result = getInt(a) == getInt(b)
-  of nkFloatLit..nkFloat64Lit:
-    if b.kind in {nkFloatLit..nkFloat64Lit}: result = a.floatVal == b.floatVal
-  of nkStrLit..nkTripleStrLit:
-    if b.kind in {nkStrLit..nkTripleStrLit}: result = a.strVal == b.strVal
+  of nkIntLiterals:
+    if b.kind in nkIntLiterals: result = getInt(a) == getInt(b)
+  of nkFloatLiterals:
+    if b.kind in nkFloatLiterals: result = a.floatVal == b.floatVal
+  of nkStrLiterals:
+    if b.kind in nkStrLiterals: result = a.strVal == b.strVal
   else:
     # don't raise an internal error for 'nim check':
     #InternalError(a.info, "SameValue")
@@ -90,19 +90,19 @@ proc leValue*(a, b: PNode): bool =
   # a <= b?
   result = false
   case a.kind
-  of nkCharLit..nkUInt64Lit:
-    if b.kind in {nkCharLit..nkUInt64Lit}: result = getInt(a) <= getInt(b)
-  of nkFloatLit..nkFloat64Lit:
-    if b.kind in {nkFloatLit..nkFloat64Lit}: result = a.floatVal <= b.floatVal
-  of nkStrLit..nkTripleStrLit:
-    if b.kind in {nkStrLit..nkTripleStrLit}: result = a.strVal <= b.strVal
+  of nkIntLiterals:
+    if b.kind in nkIntLiterals: result = getInt(a) <= getInt(b)
+  of nkFloatLiterals:
+    if b.kind in nkFloatLiterals: result = a.floatVal <= b.floatVal
+  of nkStrLiterals:
+    if b.kind in nkStrLiterals: result = a.strVal <= b.strVal
   else:
     # don't raise an internal error for 'nim check':
     #InternalError(a.info, "leValue")
     discard
 
 proc weakLeValue*(a, b: PNode): TImplication =
-  if a.kind notin nkLiterals or b.kind notin nkLiterals:
+  if a.kind notin nkLiterals - nkNilLit or b.kind notin nkLiterals - nkNilLit:
     result = impUnknown
   else:
     result = if leValue(a, b): impYes else: impNo
diff --git a/compiler/ast/errorhandling.nim b/compiler/ast/errorhandling.nim
index be3cf77e13d..eb34e2e75a2 100644
--- a/compiler/ast/errorhandling.nim
+++ b/compiler/ast/errorhandling.nim
@@ -50,11 +50,11 @@ when defined(nimDebugUnreportedErrors):
 proc errorSubNode*(n: PNode): PNode =
   ## find the first error node, or nil, under `n` using a depth first traversal
   case n.kind
-  of nkEmpty..nkNilLit:
-    result = nil
   of nkError:
     result = n
-  else:
+  of nkWithoutSons - nkError:
+    result = nil
+  of nkWithSons:
     result = nil
     for s in n.items:
       if s.isNil: continue
@@ -165,7 +165,7 @@ proc buildErrorList(config: ConfigRef, n: PNode, errs: var seq[PNode]) =
   ## creates a list (`errs` seq) from most specific to least specific
   ## by traversing the the error tree in a depth-first-search.
   case n.kind
-  of nkEmpty .. nkNilLit, nkCommentStmt:
+  of nkWithoutSons - nkError:
     discard
   of nkError:
     buildErrorList(config, n.diag.wrongNode, errs)
@@ -173,7 +173,7 @@ proc buildErrorList(config: ConfigRef, n: PNode, errs: var seq[PNode]) =
       if n.errorKind == adWrappedError and errs.len == 0:
         echo "Empty WrappedError: ", config $ n.info
     errs.add n
-  else:
+  of nkWithSons:
     for i in 0..<n.len:
       buildErrorList(config, n[i], errs)
 
diff --git a/compiler/ast/filters.nim b/compiler/ast/filters.nim
index 4ed551afd4e..06548cbae15 100644
--- a/compiler/ast/filters.nim
+++ b/compiler/ast/filters.nim
@@ -37,14 +37,16 @@ proc invalidPragma(conf: ConfigRef; n: PNode) =
 
 proc getArg(conf: ConfigRef; n: PNode, name: string, pos: int): PNode =
   result = nil
-  if n.kind in {nkEmpty..nkNilLit}: return
-  for i in 1..<n.len:
-    if n[i].kind == nkExprEqExpr:
-      if n[i][0].kind != nkIdent: invalidPragma(conf, n)
-      if cmpIgnoreStyle(n[i][0].ident.s, name) == 0:
-        return n[i][1]
-    elif i == pos:
-      return n[i]
+  case n.kind
+  of nkWithoutSons: discard # these can't have args
+  of nkWithSons:
+    for i in 1..<n.len:
+      if n[i].kind == nkExprEqExpr:
+        if n[i][0].kind != nkIdent: invalidPragma(conf, n)
+        if cmpIgnoreStyle(n[i][0].ident.s, name) == 0:
+          return n[i][1]
+      elif i == pos:
+        return n[i]
 
 proc charArg*(conf: ConfigRef; n: PNode, name: string, pos: int, default: char): char =
   var x = getArg(conf, n, name, pos)
@@ -55,7 +57,7 @@ proc charArg*(conf: ConfigRef; n: PNode, name: string, pos: int, default: char):
 proc strArg*(conf: ConfigRef; n: PNode, name: string, pos: int, default: string): string =
   var x = getArg(conf, n, name, pos)
   if x == nil: result = default
-  elif x.kind in {nkStrLit..nkTripleStrLit}: result = x.strVal
+  elif x.kind in nkStrLiterals: result = x.strVal
   else: invalidPragma(conf, n)
 
 proc boolArg*(conf: ConfigRef; n: PNode, name: string, pos: int, default: bool): bool =
diff --git a/compiler/ast/trees.nim b/compiler/ast/trees.nim
index 3b604d20d61..9452196c9dd 100644
--- a/compiler/ast/trees.nim
+++ b/compiler/ast/trees.nim
@@ -10,20 +10,27 @@
 ## tree helper routines
 
 import
-  ast, wordrecg, idents
+  compiler/ast/[
+    ast,
+    wordrecg,
+    idents,
+  ],
+  compiler/utils/[
+    idioms,
+  ]
 
 proc cyclicTreeAux(n: PNode, visited: var seq[PNode]): bool =
   if n == nil: return
   for v in visited:
     if v == n: return true
   case n.kind
-  of nkEmpty..nkNilLit, nkCommentStmt:
+  of nkWithoutSons - nkError:
     discard
   of nkError:
     visited.add(n)
     if cyclicTreeAux(n.diag.wrongNode, visited): return true
     discard visited.pop()
-  else:
+  of nkWithSons:
     visited.add(n)
     for nSon in n.sons:
       if cyclicTreeAux(nSon, visited): return true
@@ -49,12 +56,14 @@ proc exprStructuralEquivalent*(a, b: PNode; strictSymEquality=false): bool =
         # don't go nuts here: same symbol as string is enough:
         result = a.sym.name.id == b.sym.name.id
     of nkIdent: result = a.ident.id == b.ident.id
-    of nkCharLit..nkUInt64Lit: result = a.intVal == b.intVal
-    of nkFloatLit..nkFloat64Lit: result = sameFloatIgnoreNan(a.floatVal, b.floatVal)
-    of nkStrLit..nkTripleStrLit: result = a.strVal == b.strVal
+    of nkIntLiterals: result = a.intVal == b.intVal
+    of nkFloatLiterals: result = sameFloatIgnoreNan(a.floatVal, b.floatVal)
+    of nkStrLiterals: result = a.strVal == b.strVal
     of nkCommentStmt: result = a.comment == b.comment
-    of nkEmpty, nkNilLit, nkType: result = true
-    else:
+    of nkNone, nkEmpty, nkNilLit, nkType: result = true
+    of nkError:
+      unreachable()
+    of nkWithSons:
       if a.len == b.len:
         for i in 0..<a.len:
           if not exprStructuralEquivalent(a[i], b[i],
@@ -74,16 +83,18 @@ proc sameTree*(a, b: PNode): bool =
       # don't go nuts here: same symbol as string is enough:
       result = a.sym.name.id == b.sym.name.id
     of nkIdent: result = a.ident.id == b.ident.id
-    of nkCharLit..nkUInt64Lit:
+    of nkIntLiterals:
       result = a.intVal == b.intVal and
                a.intLitBase == b.intLitBase
-    of nkFloatLit..nkFloat64Lit:
+    of nkFloatLiterals:
       result = sameFloatIgnoreNan(a.floatVal, b.floatVal) and
                a.floatLitBase == b.floatLitBase
-    of nkStrLit..nkTripleStrLit: result = a.strVal == b.strVal
+    of nkStrLiterals: result = a.strVal == b.strVal
     of nkCommentStmt: result = a.comment == b.comment
-    of nkEmpty, nkNilLit, nkType: result = true
-    else:
+    of nkNone, nkEmpty, nkNilLit, nkType: result = true
+    of nkError:
+      unreachable()
+    of nkWithSons:
       if a.len == b.len:
         for i in 0..<a.len:
           if not sameTree(a[i], b[i]): return
@@ -99,8 +110,7 @@ proc getMagic*(op: PNode): TMagic =
   else: result = mNone
 
 proc isConstExpr*(n: PNode): bool =
-  const atomKinds = {nkCharLit..nkNilLit} # Char, Int, UInt, Str, Float and Nil literals
-  n.kind in atomKinds or nfAllConst in n.flags
+  n.kind in nkLiterals or nfAllConst in n.flags
 
 proc isCaseObj*(n: PNode): bool =
   if n.kind == nkRecCase: return true
@@ -109,7 +119,7 @@ proc isCaseObj*(n: PNode): bool =
 
 proc isDeepConstExpr*(n: PNode; preventInheritance = false): bool =
   case n.kind
-  of nkCharLit..nkNilLit:
+  of nkLiterals:
     result = true
   of nkExprEqExpr, nkExprColonExpr, nkHiddenStdConv, nkHiddenSubConv:
     result = isDeepConstExpr(n[1], preventInheritance)
diff --git a/compiler/ast/treetab.nim b/compiler/ast/treetab.nim
index 33f6c8988b2..3677cda1010 100644
--- a/compiler/ast/treetab.nim
+++ b/compiler/ast/treetab.nim
@@ -17,21 +17,21 @@ proc hashTree*(n: PNode): Hash =
     return
   result = ord(n.kind)
   case n.kind
-  of nkEmpty, nkNilLit, nkType:
+  of nkNone, nkEmpty, nkNilLit, nkType, nkCommentStmt, nkError:
     discard
   of nkIdent:
     result = result !& n.ident.h
   of nkSym:
     result = result !& n.sym.id
-  of nkCharLit..nkUInt64Lit:
+  of nkIntLiterals:
     if (n.intVal >= low(int)) and (n.intVal <= high(int)):
       result = result !& int(n.intVal)
-  of nkFloatLit..nkFloat64Lit:
+  of nkFloatLiterals:
     if (n.floatVal >= - 1000000.0) and (n.floatVal <= 1000000.0):
       result = result !& toInt(n.floatVal)
-  of nkStrLit..nkTripleStrLit:
+  of nkStrLiterals:
     result = result !& hash(n.strVal)
-  else:
+  of nkWithSons:
     for i in 0..<n.len:
       result = result !& hashTree(n[i])
   result = !$result
@@ -43,13 +43,13 @@ proc treesEquivalent(a, b: PNode): bool =
     result = true
   elif (a != nil) and (b != nil) and (a.kind == b.kind):
     case a.kind
-    of nkEmpty, nkNilLit, nkType: result = true
+    of nkNone, nkEmpty, nkNilLit, nkType, nkCommentStmt, nkError: result = true
     of nkSym: result = a.sym.id == b.sym.id
     of nkIdent: result = a.ident.id == b.ident.id
-    of nkCharLit..nkUInt64Lit: result = a.intVal == b.intVal
-    of nkFloatLit..nkFloat64Lit: result = a.floatVal == b.floatVal
-    of nkStrLit..nkTripleStrLit: result = a.strVal == b.strVal
-    else:
+    of nkIntLiterals: result = a.intVal == b.intVal
+    of nkFloatLiterals: result = a.floatVal == b.floatVal
+    of nkStrLiterals: result = a.strVal == b.strVal
+    of nkWithSons:
       if a.len == b.len:
         for i in 0..<a.len:
           if not treesEquivalent(a[i], b[i]): return
diff --git a/compiler/ast/types.nim b/compiler/ast/types.nim
index 54173b158e6..4479cb96d37 100644
--- a/compiler/ast/types.nim
+++ b/compiler/ast/types.nim
@@ -109,11 +109,11 @@ proc getOrdValue*(n: PNode; onError = high(Int128)): Int128 =
       n.kind
 
   case k
-  of nkCharLit, nkUIntLit..nkUInt64Lit:
+  of nkUIntLiterals:
     # XXX: enable this assert
     #assert n.typ == nil or isUnsigned(n.typ), $n.typ
     toInt128(cast[uint64](n.intVal))
-  of nkIntLit..nkInt64Lit:
+  of nkSIntLiterals:
     # XXX: enable this assert
     #assert n.typ == nil or not isUnsigned(n.typ), $n.typ.kind
     toInt128(n.intVal)
@@ -166,10 +166,10 @@ proc iterOverNode(marker: var IntSet, n: PNode, iter: TTypeIter,
                   closure: RootRef): bool =
   if n != nil:
     case n.kind
-    of nkNone..nkNilLit:
+    of nkWithoutSons:
       # a leaf
       result = iterOverTypeAux(marker, n.typ, iter, closure)
-    else:
+    of nkWithSons:
       for i in 0..<n.len:
         result = iterOverNode(marker, n[i], iter, closure)
         if result: return
@@ -344,9 +344,9 @@ proc canFormAcycleNode(marker: var IntSet, n: PNode, startId: int): bool =
     result = canFormAcycleAux(marker, n.typ, startId)
     if not result:
       case n.kind
-      of nkNone..nkNilLit:
+      of nkWithoutSons:
         discard
-      else:
+      of nkWithSons:
         for i in 0..<n.len:
           result = canFormAcycleNode(marker, n[i], startId)
           if result: return
@@ -395,10 +395,10 @@ proc mutateNode(marker: var IntSet, n: PNode, iter: TTypeMutator,
     result = copyNode(n)
     result.typ = mutateTypeAux(marker, n.typ, iter, closure)
     case n.kind
-    of nkNone..nkNilLit:
+    of nkWithoutSons:
       # a leaf
       discard
-    else:
+    of nkWithSons:
       for i in 0..<n.len:
         result.add mutateNode(marker, n[i], iter, closure)
 
diff --git a/compiler/ast/typesrenderer.nim b/compiler/ast/typesrenderer.nim
index 2a7feaa5ca0..50d8f4922ab 100644
--- a/compiler/ast/typesrenderer.nim
+++ b/compiler/ast/typesrenderer.nim
@@ -144,9 +144,9 @@ proc addTypeHeader*(result: var string, conf: ConfigRef; typ: PType; prefer: TPr
 proc valueToString(a: PNode): string =
   ## Returns `int`, `float`, or `string` literals from the node, otherwise returns `<invalid value>`.
   case a.kind
-  of nkCharLit..nkUInt64Lit: result = $a.intVal
-  of nkFloatLit..nkFloat64Lit: result = $a.floatVal
-  of nkStrLit..nkTripleStrLit: result = a.strVal
+  of nkIntLiterals: result = $a.intVal
+  of nkFloatLiterals: result = $a.floatVal
+  of nkStrLiterals: result = a.strVal
   else: result = "<invalid value>"
 
 proc rangeToStr(n: PNode): string =
diff --git a/compiler/front/sexp_reporter.nim b/compiler/front/sexp_reporter.nim
index 4ed98441522..3848489e154 100644
--- a/compiler/front/sexp_reporter.nim
+++ b/compiler/front/sexp_reporter.nim
@@ -117,9 +117,9 @@ proc sexp*(node: PNode): SexpNode =
   result.add newSSymbol(($node.kind)[2 ..^ 1])
   case node.kind
   of nkNone, nkEmpty, nkType, nkCommentStmt: discard
-  of nkCharLit..nkUInt64Lit:    result.add sexp(node.intVal)
-  of nkFloatLit..nkFloat64Lit:  result.add sexp(node.floatVal)
-  of nkStrLit..nkTripleStrLit:  result.add sexp(node.strVal)
+  of nkIntLiterals:             result.add sexp(node.intVal)
+  of nkFloatLiterals:           result.add sexp(node.floatVal)
+  of nkStrLiterals:             result.add sexp(node.strVal)
   of nkSym:                     result.add newSSymbol(node.sym.name.s)
   of nkIdent:                   result.add newSSymbol(node.ident.s)
   of nkError:                   result.add sexp(node.diag.wrongNode)
diff --git a/compiler/ic/dce.nim b/compiler/ic/dce.nim
index e95b0fe0700..2e7741facae 100644
--- a/compiler/ic/dce.nim
+++ b/compiler/ic/dce.nim
@@ -195,7 +195,7 @@ proc aliveCode(c: var AliveContext; g: PackedModuleGraph; tree: PackedTree; n: N
   ## Marks the symbols we encounter when we traverse the AST at `tree[n]` as alive, unless
   ## it is purely in a declarative context (type section etc.).
   case n.kind
-  of nkNone..pred(nkSym), succ(nkSym)..nkNilLit:
+  of nkWithoutSons - nkSym:
     discard "ignore non-sym atoms"
   of nkSym:
     # This symbol is alive and everything its body references.
@@ -209,9 +209,8 @@ proc aliveCode(c: var AliveContext; g: PackedModuleGraph; tree: PackedTree; n: N
     let otherModule = toFileIndexCached(c.decoder, g, c.thisModule, m).int
     followLater(c, g, otherModule, item)
   of nkMacroDef, nkTemplateDef, nkTypeSection, nkTypeOfExpr,
-     nkCommentStmt, nkIncludeStmt,
-     nkImportStmt, nkImportExceptStmt, nkExportStmt, nkExportExceptStmt,
-     nkFromStmt, nkStaticStmt:
+     nkIncludeStmt, nkImportStmt, nkImportExceptStmt,
+     nkExportStmt, nkExportExceptStmt, nkFromStmt, nkStaticStmt:
     discard
   of nkVarSection, nkLetSection, nkConstSection:
     # XXX ignore the defining local variable name?
diff --git a/compiler/ic/ic.nim b/compiler/ic/ic.nim
index 6fce414d834..af802d82292 100644
--- a/compiler/ic/ic.nim
+++ b/compiler/ic/ic.nim
@@ -102,8 +102,8 @@ proc toString*(tree: PackedTree; n: NodePos; m: PackedModule; nesting: int;
 
   result.add $tree[pos].kind
   case tree.nodes[pos].kind
-  of nkNone, nkEmpty, nkNilLit, nkType: discard
-  of nkIdent, nkStrLit..nkTripleStrLit:
+  of nkNone, nkEmpty, nkNilLit, nkType, nkCommentStmt, nkError: discard
+  of nkIdent, nkStrLiterals:
     result.add " "
     result.add m.strings[LitId tree.nodes[pos].operand]
   of nkSym:
@@ -118,10 +118,10 @@ proc toString*(tree: PackedTree; n: NodePos; m: PackedModule; nesting: int;
   of externUIntLit:
     result.add " "
     result.addInt cast[uint64](m.numbers[LitId tree.nodes[pos].operand])
-  of nkFloatLit..nkFloat64Lit:
+  of nkFloatLiterals:
     result.add " "
     result.addFloat cast[BiggestFloat](m.numbers[LitId tree.nodes[pos].operand])
-  else:
+  of nkWithSons:
     result.add "(\n"
     for i in 1..(nesting+1)*2: result.add ' '
     for child in sonsReadonly(tree, n):
@@ -446,7 +446,7 @@ proc toPackedNode*(n: PNode; ir: var PackedTree; c: var PackedEncoder; m: var Pa
     return
   let info = toPackedInfo(n.info, c, m)
   case n.kind
-  of nkNone, nkEmpty, nkNilLit, nkType, nkCommentStmt:
+  of nkNone, nkEmpty, nkNilLit, nkType, nkCommentStmt, nkError:
     ir.nodes.add PackedNode(kind: n.kind, flags: n.flags, operand: 0,
                             typeId: storeTypeLater(n.typ, c, m), info: info)
   of nkIdent:
@@ -471,15 +471,15 @@ proc toPackedNode*(n: PNode; ir: var PackedTree; c: var PackedEncoder; m: var Pa
     ir.nodes.add PackedNode(kind: n.kind, flags: n.flags,
                             operand: int32 getOrIncl(m.numbers, n.intVal),
                             typeId: storeTypeLater(n.typ, c, m), info: info)
-  of nkStrLit..nkTripleStrLit:
+  of nkStrLiterals:
     ir.nodes.add PackedNode(kind: n.kind, flags: n.flags,
                             operand: int32 getOrIncl(m.strings, n.strVal),
                             typeId: storeTypeLater(n.typ, c, m), info: info)
-  of nkFloatLit..nkFloat64Lit:
+  of nkFloatLiterals:
     ir.nodes.add PackedNode(kind: n.kind, flags: n.flags,
                             operand: int32 getOrIncl(m.numbers, cast[BiggestInt](n.floatVal)),
                             typeId: storeTypeLater(n.typ, c, m), info: info)
-  else:
+  of nkWithSons:
     let patchPos = ir.prepare(n.kind, n.flags,
                               storeTypeLater(n.typ, c, m), info)
     for i in 0..<n.len:
@@ -776,7 +776,7 @@ proc loadNodes*(c: var PackedDecoder; g: var PackedModuleGraph; thisModule: int;
   result.flags = n.flags
 
   case k
-  of nkEmpty, nkNilLit, nkType:
+  of nkNone, nkEmpty, nkNilLit, nkType, nkCommentStmt, nkError:
     discard
   of nkIdent:
     result.ident = getIdent(c.cache, g[thisModule].fromDisk.strings[n.litId])
@@ -786,9 +786,9 @@ proc loadNodes*(c: var PackedDecoder; g: var PackedModuleGraph; thisModule: int;
     result.intVal = tree.nodes[n.int].operand
   of externIntLit:
     result.intVal = g[thisModule].fromDisk.numbers[n.litId]
-  of nkStrLit..nkTripleStrLit:
+  of nkStrLiterals:
     result.strVal = g[thisModule].fromDisk.strings[n.litId]
-  of nkFloatLit..nkFloat64Lit:
+  of nkFloatLiterals:
     result.floatVal = cast[BiggestFloat](g[thisModule].fromDisk.numbers[n.litId])
   of nkModuleRef:
     let (n1, n2) = sons2(tree, n)
@@ -796,7 +796,7 @@ proc loadNodes*(c: var PackedDecoder; g: var PackedModuleGraph; thisModule: int;
     assert n2.kind == nkInt32Lit
     transitionNoneToSym(result)
     result.sym = loadSym(c, g, thisModule, PackedItemId(module: n1.litId, item: tree.nodes[n2.int].operand))
-  else:
+  of nkWithSons - nkModuleRef:
     for n0 in sonsReadonly(tree, n):
       result.addAllowNil loadNodes(c, g, thisModule, tree, n0)
 
diff --git a/compiler/ic/integrity.nim b/compiler/ic/integrity.nim
index 786cd014837..b3509b05723 100644
--- a/compiler/ic/integrity.nim
+++ b/compiler/ic/integrity.nim
@@ -79,9 +79,9 @@ proc checkNode(c: var CheckedContext; tree: PackedTree; n: NodePos) =
     checkLocalSym(c, tree.nodes[n.int].operand)
   of directIntLit:
     discard
-  of externIntLit, nkFloatLit..nkFloat64Lit:
+  of externIntLit, nkFloatLiterals:
     assert c.g.packed[c.thisModule].fromDisk.numbers.hasLitId n.litId
-  of nkStrLit..nkTripleStrLit:
+  of nkStrLiterals:
     assert c.g.packed[c.thisModule].fromDisk.strings.hasLitId n.litId
   of nkModuleRef:
     let (n1, n2) = sons2(tree, n)
diff --git a/compiler/ic/packed_ast.nim b/compiler/ic/packed_ast.nim
index 4946724b098..f5349839fb2 100644
--- a/compiler/ic/packed_ast.nim
+++ b/compiler/ic/packed_ast.nim
@@ -140,8 +140,7 @@ proc addSymDef*(tree: var PackedTree; s: SymId; info: PackedLineInfo) =
   tree.nodes.add PackedNode(kind: nkSym, operand: int32(s), info: info)
 
 proc isAtom*(tree: PackedTree; pos: int): bool {.inline.} =
-  let kind = tree.nodes[pos].kind
-  kind <= nkNilLit or kind == nkCommentStmt
+  tree.nodes[pos].kind in nkWithoutSons
 
 proc copyTree*(dest: var PackedTree; tree: PackedTree; n: NodePos) =
   # and this is why the IR is superior. We can copy subtrees
@@ -179,7 +178,7 @@ proc prepare*(dest: var PackedTree; source: PackedTree; sourcePos: NodePos): Pat
 
 proc patch*(tree: var PackedTree; pos: PatchPos) =
   let pos = pos.int
-  assert not isAtom(tree, pos)
+  assert not isAtom(tree, pos), $tree.nodes[pos].kind
   let distance = int32(tree.nodes.len - pos)
   tree.nodes[pos].operand = distance
 
@@ -197,7 +196,7 @@ proc nextChild(tree: PackedTree; pos: var int) {.inline.} =
 
 iterator sonsReadonly*(tree: PackedTree; n: NodePos): NodePos =
   var pos = n.int
-  assert not isAtom(tree, pos)
+  assert not isAtom(tree, pos), $tree.nodes[pos].kind
   let last = pos + tree.nodes[pos].operand
   inc pos
   while pos < last:
@@ -218,7 +217,7 @@ iterator isons*(dest: var PackedTree; tree: PackedTree;
 
 iterator sonsFrom1*(tree: PackedTree; n: NodePos): NodePos =
   var pos = n.int
-  assert not isAtom(tree, pos)
+  assert not isAtom(tree, pos), $tree.nodes[pos].kind
   let last = pos + tree.nodes[pos].operand
   inc pos
   if pos < last:
@@ -350,19 +349,9 @@ when false:
     result = tree.sh.strings[LitId tree.nodes[n.int].operand]
 
 const
-  externIntLit* = {nkCharLit,
-    nkIntLit,
-    nkInt8Lit,
-    nkInt16Lit,
-    nkInt64Lit,
-    nkUIntLit,
-    nkUInt8Lit,
-    nkUInt16Lit,
-    nkUInt32Lit,
-    nkUInt64Lit} # nkInt32Lit is missing by design!
-
-  externSIntLit* = {nkIntLit, nkInt8Lit, nkInt16Lit, nkInt64Lit}
-  externUIntLit* = {nkUIntLit, nkUInt8Lit, nkUInt16Lit, nkUInt32Lit, nkUInt64Lit}
+  externSIntLit* = nkSIntLiterals - nkInt32Lit # nkInt32Lit is excluded by design!
+  externUIntLit* = nkUIntLiterals
+  externIntLit* = externSIntLit + externUIntLit
   directIntLit* = nkInt32Lit
 
 when false:
diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index 9c573881729..572b334956e 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -2108,7 +2108,7 @@ proc constDataToMir*(env: var MirEnv, n: PNode): MirTree =
         bu.use toValue(env.constants.add(n.sym), n.sym.typ)
       else:
         unreachable()
-    of nkLiterals, nkNilLit, nkRange:
+    of nkLiterals, nkRange:
       bu.use literal(n)
     of nkHiddenStdConv, nkHiddenSubConv:
       # doesn't translate to a MIR node itself, but the type overrides
diff --git a/compiler/mir/proto_mir.nim b/compiler/mir/proto_mir.nim
index 43337a79b23..0f4721ede8c 100644
--- a/compiler/mir/proto_mir.nim
+++ b/compiler/mir/proto_mir.nim
@@ -594,7 +594,7 @@ proc exprToPmir(c: TranslateCtx, result: var seq[ProtoItem], n: PNode, sink: boo
     result.add ProtoItem(orig: n, typ: n.typ, kind: k, field: val)
 
   case n.kind
-  of nkCharLit..nkNilLit, nkRange, nkNimNodeLit:
+  of nkLiterals, nkRange, nkNimNodeLit:
     node pirLiteral
   of nkLambdaKinds:
     node pirProc, sym, n[namePos].sym
diff --git a/compiler/sem/closureiters.nim b/compiler/sem/closureiters.nim
index 9a075be856e..3f9d6d1ba1e 100644
--- a/compiler/sem/closureiters.nim
+++ b/compiler/sem/closureiters.nim
@@ -195,8 +195,8 @@ type
     idgen: IdGenerator
 
 const
-  nkSkip = {nkEmpty..nkNilLit, nkTemplateDef, nkTypeSection, nkStaticStmt,
-            nkCommentStmt, nkMixinStmt, nkBindStmt} + procDefs
+  nkSkip = nkWithoutSons + {nkTemplateDef, nkTypeSection, nkStaticStmt,
+            nkMixinStmt, nkBindStmt} + procDefs
 
 proc boolLit(ctx: Ctx, info: TLineInfo, val: bool): PNode =
   result = newIntTypeNode(ord val, ctx.g.getSysType(info, tyBool))
@@ -1379,4 +1379,4 @@ proc transformClosureIterator*(g: ModuleGraph; idgen: IdGenerator; fn: PSym, n:
     newTreeI(nkElse, n.info):
       newTreeI(nkReturnStmt, n.info, g.emptyNode)
 
-  result = ctx.wrapIntoStateLoop(result)
\ No newline at end of file
+  result = ctx.wrapIntoStateLoop(result)
diff --git a/compiler/sem/dfa.nim b/compiler/sem/dfa.nim
index d9d3f6ff7c4..6e1183fd1dd 100644
--- a/compiler/sem/dfa.nim
+++ b/compiler/sem/dfa.nim
@@ -793,7 +793,7 @@ proc gen(c: var Con; n: PNode) =
         genNoReturn(c, n)
     else:
       genCall(c, n)
-  of nkCharLit..nkNilLit: discard
+  of nkLiterals: discard
   of nkAsgn, nkFastAsgn:
     gen(c, n[1])
 
diff --git a/compiler/sem/evaltempl.nim b/compiler/sem/evaltempl.nim
index fafc99b73e2..471d46327af 100644
--- a/compiler/sem/evaltempl.nim
+++ b/compiler/sem/evaltempl.nim
@@ -104,7 +104,7 @@ proc evalTemplateAux(templ, actual: PNode, c: var TemplCtx, result: PNode) =
       result.add newNodeI(nkEmpty, templ.info)
   of nkError:
     c.config.internalError(templ.info, "unreported error")
-  else:
+  of nkWithSons:
     let parentIsDeclarative = c.isDeclarative
     if templ.kind in routineDefs + {nkTypeSection, nkVarSection, nkLetSection, nkConstSection}:
       c.isDeclarative = true
diff --git a/compiler/sem/guards.nim b/compiler/sem/guards.nim
index 9c7823c24cd..da8e0b426ea 100644
--- a/compiler/sem/guards.nim
+++ b/compiler/sem/guards.nim
@@ -23,6 +23,7 @@ import
   compiler/utils/[
     saturate,
     int128,
+    idioms,
   ],
   compiler/modules/[
     magicsys,
@@ -62,7 +63,7 @@ const
   someMin = {mMinI}
   someBinaryOp = someAdd+someSub+someMul+someMax+someMin
 
-proc isValue(n: PNode): bool = n.kind in {nkCharLit..nkNilLit}
+proc isValue(n: PNode): bool = n.kind in nkLiterals
 proc isLocation(n: PNode): bool = not n.isValue
 
 proc isLet(n: PNode): bool =
@@ -173,34 +174,34 @@ proc buildCall*(op: PSym; a, b: PNode): PNode =
 
 proc `|+|`(a, b: PNode): PNode =
   result = copyNode(a)
-  if a.kind in {nkCharLit..nkUInt64Lit}: result.intVal = a.intVal |+| b.intVal
+  if a.kind in nkIntLiterals: result.intVal = a.intVal |+| b.intVal
   else: result.floatVal = a.floatVal + b.floatVal
 
 proc `|-|`(a, b: PNode): PNode =
   result = copyNode(a)
-  if a.kind in {nkCharLit..nkUInt64Lit}: result.intVal = a.intVal |-| b.intVal
+  if a.kind in nkIntLiterals: result.intVal = a.intVal |-| b.intVal
   else: result.floatVal = a.floatVal - b.floatVal
 
 proc `|*|`(a, b: PNode): PNode =
   result = copyNode(a)
-  if a.kind in {nkCharLit..nkUInt64Lit}: result.intVal = a.intVal |*| b.intVal
+  if a.kind in nkIntLiterals: result.intVal = a.intVal |*| b.intVal
   else: result.floatVal = a.floatVal * b.floatVal
 
 proc `|div|`(a, b: PNode): PNode =
   result = copyNode(a)
-  if a.kind in {nkCharLit..nkUInt64Lit}: result.intVal = a.intVal div b.intVal
+  if a.kind in nkIntLiterals: result.intVal = a.intVal div b.intVal
   else: result.floatVal = a.floatVal / b.floatVal
 
 proc negate(a, b, res: PNode; o: Operators): PNode =
-  if b.kind in {nkCharLit..nkUInt64Lit} and b.intVal != low(BiggestInt):
+  if b.kind in nkIntLiterals and b.intVal != low(BiggestInt):
     var b = copyNode(b)
     b.intVal = -b.intVal
-    if a.kind in {nkCharLit..nkUInt64Lit}:
+    if a.kind in nkIntLiterals:
       b.intVal = b.intVal |+| a.intVal
       result = b
     else:
       result = buildCall(o.opAdd, a, b)
-  elif b.kind in {nkFloatLit..nkFloat64Lit}:
+  elif b.kind in nkFloatLiterals:
     var b = copyNode(b)
     b.floatVal = -b.floatVal
     result = buildCall(o.opAdd, a, b)
@@ -247,7 +248,7 @@ proc reassociation(n: PNode; o: Operators): PNode =
   else: discard
 
 proc pred(n: PNode): PNode =
-  if n.kind in {nkCharLit..nkUInt64Lit} and n.intVal != low(BiggestInt):
+  if n.kind in nkIntLiterals and n.intVal != low(BiggestInt):
     result = copyNode(n)
     dec result.intVal
   else:
@@ -451,12 +452,15 @@ proc sameTree*(a, b: PNode): bool =
       if not result and a.sym.magic != mNone:
         result = a.sym.magic == b.sym.magic or sameOpr(a.sym, b.sym)
     of nkIdent: result = a.ident.id == b.ident.id
-    of nkCharLit..nkUInt64Lit: result = a.intVal == b.intVal
-    of nkFloatLit..nkFloat64Lit: result = a.floatVal == b.floatVal
-    of nkStrLit..nkTripleStrLit: result = a.strVal == b.strVal
+    of nkIntLiterals: result = a.intVal == b.intVal
+    of nkFloatLiterals: result = a.floatVal == b.floatVal
+    of nkStrLiterals: result = a.strVal == b.strVal
     of nkType: result = a.typ == b.typ
-    of nkEmpty, nkNilLit: result = true
-    else:
+    of nkNone, nkEmpty, nkNilLit, nkCommentStmt:
+      result = true # Ignore comments
+    of nkError:
+      unreachable()
+    of nkWithSons:
       if a.len == b.len:
         for i in 0..<a.len:
           if not sameTree(a[i], b[i]): return
@@ -466,11 +470,11 @@ proc hasSubTree(n, x: PNode): bool =
   if n.sameTree(x): result = true
   else:
     case n.kind
-    of nkEmpty..nkNilLit:
+    of nkWithoutSons - nkFormalParams:
       result = n.sameTree(x)
     of nkFormalParams:
       discard
-    else:
+    of nkWithSons - nkFormalParams:
       for i in 0..<n.len:
         if hasSubTree(n[i], x): return true
 
@@ -499,7 +503,7 @@ proc impliesEq(fact, eq: PNode): TImplication =
   else: discard
 
 proc leImpliesIn(x, c, aSet: PNode): TImplication =
-  if c.kind in {nkCharLit..nkUInt64Lit}:
+  if c.kind in nkIntLiterals:
     # fact:  x <= 4;  question x in {56}?
     # --> true if every value <= 4 is in the set {56}
     #
@@ -515,7 +519,7 @@ proc leImpliesIn(x, c, aSet: PNode): TImplication =
       elif neg == i: result = impNo
 
 proc geImpliesIn(x, c, aSet: PNode): TImplication =
-  if c.kind in {nkCharLit..nkUInt64Lit}:
+  if c.kind in nkIntLiterals:
     # fact:  x >= 4;  question x in {56}?
     # --> true iff every value >= 4 is in the set {56}
     #
@@ -563,7 +567,7 @@ proc impliesIn(fact, loc, aSet: PNode): TImplication =
 
 proc valueIsNil(n: PNode): TImplication =
   if n.kind == nkNilLit: impYes
-  elif n.kind in {nkStrLit..nkTripleStrLit, nkBracket, nkObjConstr}: impNo
+  elif n.kind in nkStrLiterals + {nkBracket, nkObjConstr}: impNo
   else: impUnknown
 
 proc impliesIsNil(fact, eq: PNode): TImplication =
@@ -732,7 +736,7 @@ proc simpleSlice*(a, b: PNode): BiggestInt =
   # returns 'c' if a..b matches (i+c)..(i+c), -1 otherwise. (i)..(i) is matched
   # as if it is (i+0)..(i+0).
   if guards.sameTree(a, b):
-    if a.getMagic in someAdd and a[2].kind in {nkCharLit..nkUInt64Lit}:
+    if a.getMagic in someAdd and a[2].kind in nkIntLiterals:
       result = a[2].intVal
     else:
       result = 0
@@ -744,7 +748,7 @@ template isMul(x): untyped = x.getMagic in someMul
 template isDiv(x): untyped = x.getMagic in someDiv
 template isAdd(x): untyped = x.getMagic in someAdd
 template isSub(x): untyped = x.getMagic in someSub
-template isVal(x): untyped = x.kind in {nkCharLit..nkUInt64Lit}
+template isVal(x): untyped = x.kind in nkIntLiterals
 template isIntVal(x, y): untyped = x.intVal == y
 
 import macros
@@ -783,7 +787,7 @@ macro `=~`(x: PNode, pat: untyped): bool =
   result = nestList(ident"and", conds)
 
 proc isMinusOne(n: PNode): bool =
-  n.kind in {nkCharLit..nkUInt64Lit} and n.intVal == -1
+  n.kind in nkIntLiterals and n.intVal == -1
 
 proc pleViaModel(model: TModel; aa, bb: PNode): TImplication
 
diff --git a/compiler/sem/isolation_check.nim b/compiler/sem/isolation_check.nim
index 0b731dfe2c8..e5357c9307e 100644
--- a/compiler/sem/isolation_check.nim
+++ b/compiler/sem/isolation_check.nim
@@ -89,7 +89,7 @@ proc checkIsolate*(n: PNode): bool =
     # XXX Maybe require that 'n.typ' is acyclic. This is not much
     # worse than the already exisiting inheritance and closure restrictions.
     case n.kind
-    of nkCharLit..nkNilLit:
+    of nkLiterals:
       result = true
     of nkCallKinds:
       # XXX: as long as we don't update the analysis while examining arguments
diff --git a/compiler/sem/lookups.nim b/compiler/sem/lookups.nim
index f5e3981b242..cfb1c94e7a7 100644
--- a/compiler/sem/lookups.nim
+++ b/compiler/sem/lookups.nim
@@ -98,7 +98,7 @@ proc considerQuotedIdent*(c: PContext; n: PNode): PIdentResult =
 
   const
     atomicIdentKinds = {nkIdent, nkSym}
-    renderableLiterals = nkLiterals - nkFloatLiterals
+    renderableLiterals = nkLiterals - nkFloatLiterals - nkNilLit
     renderableKinds = atomicIdentKinds + renderableLiterals
     allNodeKinds = {low(TNodeKind)..high(TNodeKind)}
 
@@ -1184,4 +1184,4 @@ proc fieldVisible*(c: PContext, f: PSym): bool {.inline.} =
         for sym in scope.allowPrivateAccess:
           if symObj.id == sym.id or
              (genericOwner != nil and genericOwner.id == sym.id):
-            return true
\ No newline at end of file
+            return true
diff --git a/compiler/sem/nilcheck.nim b/compiler/sem/nilcheck.nim
index 670579f25a3..58c8be11217 100644
--- a/compiler/sem/nilcheck.nim
+++ b/compiler/sem/nilcheck.nim
@@ -1244,10 +1244,10 @@ proc check(n: PNode, ctx: NilCheckerContext, map: NilMap): Check =
     result = checkTry(n, ctx, map)
   of nkWhileStmt:
     result = checkWhile(n, ctx, map)
-  of nkNone..pred(nkSym), succ(nkSym)..nkNilLit, nkTypeSection, nkProcDef, nkConverterDef,
+  of nkWithoutSons - nkSym, nkTypeSection, nkProcDef, nkConverterDef,
       nkMethodDef, nkIteratorDef, nkMacroDef, nkTemplateDef, nkLambda, nkDo,
       nkFuncDef, nkConstSection, nkConstDef, nkIncludeStmt, nkImportStmt,
-      nkExportStmt, nkPragma, nkCommentStmt, nkTypeOfExpr, nkMixinStmt,
+      nkExportStmt, nkPragma, nkTypeOfExpr, nkMixinStmt,
       nkBindStmt:
 
     discard "don't follow this : same as varpartitions"
@@ -1304,12 +1304,12 @@ proc preVisitNode(ctx: NilCheckerContext, node: PNode, conf: ConfigRef) =
             ctx.dependants.setLen(baseIndex + 1.ExprIndex)
           ctx.dependants[baseIndex].incl(index.int)
   case node.kind:
-  of nkSym, nkEmpty, nkNilLit, nkType, nkIdent, nkCharLit .. nkUInt64Lit, nkFloatLit .. nkFloat64Lit, nkStrLit .. nkTripleStrLit:
+  of nkWithoutSons:
     discard
   of nkDotExpr:
     # visit only the base
     ctx.preVisitNode(node[0], conf)
-  else:
+  of nkWithSons - nkDotExpr:
     for element in node:
       ctx.preVisitNode(element, conf)
 
diff --git a/compiler/sem/parampatterns.nim b/compiler/sem/parampatterns.nim
index 0c571e1312c..ec6278dd6bd 100644
--- a/compiler/sem/parampatterns.nim
+++ b/compiler/sem/parampatterns.nim
@@ -188,7 +188,7 @@ proc checkForSideEffects*(n: PNode): TSideEffectAnalysis =
       if ret == seSideEffect: return ret
       elif ret == seUnknown and result == seNoSideEffect:
         result = seUnknown
-  of nkNone..nkNilLit:
+  of nkWithoutSons:
     # an atom cannot produce a side effect:
     result = seNoSideEffect
   else:
@@ -356,7 +356,7 @@ proc matchNodeKinds*(p, n: PNode): bool =
     of ppNot: stack[sp-1] = not stack[sp-1]
     of ppSym: push n.kind == nkSym
     of ppAtom: push isAtom(n)
-    of ppLit: push n.kind in {nkCharLit..nkNilLit}
+    of ppLit: push n.kind in nkLiterals
     of ppIdent: push n.kind == nkIdent
     of ppCall: push n.kind in nkCallKinds
     of ppSymKind:
diff --git a/compiler/sem/patterns.nim b/compiler/sem/patterns.nim
index 09e9173d42d..af41d94f013 100644
--- a/compiler/sem/patterns.nim
+++ b/compiler/sem/patterns.nim
@@ -21,6 +21,9 @@ import
     sigmatch,
     aliases,
     parampatterns
+  ],
+  compiler/utils/[
+    idioms
   ]
 
 type
@@ -50,7 +53,7 @@ proc canonKind(n: PNode): TNodeKind =
   result = n.kind
   case result
   of nkCallKinds: result = nkCall
-  of nkStrLit..nkTripleStrLit: result = nkStrLit
+  of nkStrLiterals: result = nkStrLit
   of nkFastAsgn: result = nkAsgn
   else: discard
 
@@ -62,12 +65,15 @@ proc sameTrees*(a, b: PNode): bool =
     case a.kind
     of nkSym: result = a.sym == b.sym
     of nkIdent: result = a.ident.id == b.ident.id
-    of nkCharLit..nkInt64Lit: result = a.intVal == b.intVal
-    of nkFloatLit..nkFloat64Lit: result = a.floatVal == b.floatVal
-    of nkStrLit..nkTripleStrLit: result = a.strVal == b.strVal
-    of nkEmpty, nkNilLit: result = true
+    of nkIntLiterals: result = a.intVal == b.intVal
+    of nkFloatLiterals: result = a.floatVal == b.floatVal
+    of nkStrLiterals: result = a.strVal == b.strVal
+    of nkNone, nkEmpty, nkNilLit, nkCommentStmt:
+      result = true # Ignore comments
+    of nkError:
+      unreachable()
     of nkType: result = sameTypeOrNil(a.typ, b.typ)
-    else:
+    of nkWithSons:
       if a.len == b.len:
         for i in 0..<a.len:
           if not sameTrees(a[i], b[i]): return
@@ -178,12 +184,14 @@ proc matches(c: PPatternContext, p, n: PNode): bool =
     case p.kind
     of nkSym: result = p.sym == n.sym
     of nkIdent: result = p.ident.id == n.ident.id
-    of nkCharLit..nkInt64Lit: result = p.intVal == n.intVal
-    of nkFloatLit..nkFloat64Lit: result = p.floatVal == n.floatVal
-    of nkStrLit..nkTripleStrLit: result = p.strVal == n.strVal
-    of nkEmpty, nkNilLit, nkType:
-      result = true
-    else:
+    of nkIntLiterals: result = p.intVal == n.intVal
+    of nkFloatLiterals: result = p.floatVal == n.floatVal
+    of nkStrLiterals: result = p.strVal == n.strVal
+    of nkNone, nkEmpty, nkNilLit, nkType, nkCommentStmt:
+      result = true # Ignore comments
+    of nkError:
+      unreachable()
+    of nkWithSons:
       # special rule for p(X) ~ f(...); this also works for stuff like
       # partial case statements, etc! - Not really ... :-/
       let v = lastSon(p)
diff --git a/compiler/sem/pragmas.nim b/compiler/sem/pragmas.nim
index 7e60c3ae5a4..f6b50c29ca2 100644
--- a/compiler/sem/pragmas.nim
+++ b/compiler/sem/pragmas.nim
@@ -283,7 +283,7 @@ proc intLitToIntOrErr(c: PContext, n: PNode): (int, PNode) =
   else:
     n[1] = c.semConstExpr(c, n[1])
     case n[1].kind
-    of nkIntLit..nkInt64Lit:
+    of nkSIntLiterals:
       (int(n[1].intVal), nil)
     else:
       (-1, c.config.newError(n, PAstDiag(kind: adSemIntLiteralExpected)))
@@ -371,7 +371,7 @@ proc getLib(c: PContext, kind: TLibKind, path: PNode): LibId =
 
   var lib = initLib(kind)
   lib.path = path
-  if path.kind in {nkStrLit..nkTripleStrLit}:
+  if path.kind in nkStrLiterals:
     lib.isOverriden = options.isDynlibOverride(c.config, path.strVal)
 
   result = c.addLib(lib)
@@ -960,13 +960,14 @@ proc pragmaLocks(c: PContext, it: PNode): (TLockLevel, PNode) =
         result = (UnknownLockLevel, wrapError(c.config, it))
     else:
       let (x, err) = intLitToIntOrErr(c, it)
-      if err.isNil:
-        if x < 0 or x > MaxLockLevel:
-          it[1] = c.config.newError(it[1], PAstDiag(
-            kind: adSemLocksPragmaBadLevelRange))
-          result = (UnknownLockLevel, wrapError(c.config, it))
-        else:
-          result = (TLockLevel(x), nil)
+      if err != nil:
+        result = (UnknownLockLevel, err)
+      elif x < 0 or x > MaxLockLevel:
+        it[1] = c.config.newError(it[1], PAstDiag(
+          kind: adSemLocksPragmaBadLevelRange))
+        result = (UnknownLockLevel, wrapError(c.config, it))
+      else:
+        result = (TLockLevel(x), nil)
 
 proc typeBorrow(c: PContext; sym: PSym, n: PNode): PNode =
   result = n
diff --git a/compiler/sem/semdata.nim b/compiler/sem/semdata.nim
index 375f4c60934..184edbe0536 100644
--- a/compiler/sem/semdata.nim
+++ b/compiler/sem/semdata.nim
@@ -1152,7 +1152,7 @@ proc warnAboutDeprecated(conf: ConfigRef; info: TLineInfo; s: PSym) =
   if pragmaNode != nil:
     for it in pragmaNode:
       if whichPragma(it) == wDeprecated and it.safeLen == 2 and
-          it[1].kind in {nkStrLit..nkTripleStrLit}:
+          it[1].kind in nkStrLiterals:
         localReport(conf, info, reportSym(
           rsemDeprecated, s, str = it[1].strVal))
         return
@@ -1164,7 +1164,7 @@ proc userError(conf: ConfigRef; info: TLineInfo; s: PSym) =
   if pragmaNode != nil:
     for it in pragmaNode:
       if whichPragma(it) == wError and it.safeLen == 2 and
-          it[1].kind in {nkStrLit..nkTripleStrLit}:
+          it[1].kind in nkStrLiterals:
         localReport(conf, info, reportSym(
           rsemUsageIsError, s, str = it[1].strVal))
         return
diff --git a/compiler/sem/semexprs.nim b/compiler/sem/semexprs.nim
index 39ed98b095a..e19ed1ad859 100644
--- a/compiler/sem/semexprs.nim
+++ b/compiler/sem/semexprs.nim
@@ -167,19 +167,19 @@ proc checkConvertible(c: PContext, targetTyp: PType, src: PNode): TConvStatus =
     if targetTyp.kind == tyBool:
       discard "convOk"
     elif targetTyp.isOrdinalType:
-      if src.kind in nkCharLit..nkUInt64Lit and
+      if src.kind in nkIntLiterals and
           src.getInt notin firstOrd(c.config, targetTyp)..lastOrd(c.config, targetTyp):
         result = convNotInRange
-      elif src.kind in nkFloatLit..nkFloat64Lit:
+      elif src.kind in nkFloatLiterals:
         if not src.floatVal.inInt128Range:
           result = convNotInRange
         elif src.floatVal.toInt128 notin firstOrd(c.config, targetTyp)..lastOrd(c.config, targetTyp):
           result = convNotInRange
     elif targetBaseTyp.kind in tyFloat..tyFloat64:
-      if src.kind in nkFloatLit..nkFloat64Lit and
+      if src.kind in nkFloatLiterals and
           not floatRangeCheck(src.floatVal, targetTyp):
         result = convNotInRange
-      elif src.kind in nkCharLit..nkUInt64Lit and
+      elif src.kind in nkIntLiterals and
           not floatRangeCheck(src.intVal.float, targetTyp):
         result = convNotInRange
     elif targetBaseTyp.enumHasHoles:
@@ -476,7 +476,7 @@ proc isOpImpl(c: PContext, n: PNode, flags: TExprFlags): PNode =
   ## or an expression whose type is compared with `x`'s type.
   c.config.internalAssert:
     n.len == 3 and n[1].typ != nil and
-    n[2].kind in {nkStrLit..nkTripleStrLit, nkType}
+    n[2].kind in nkStrLiterals + nkType
 
   var
     res = false
@@ -486,7 +486,7 @@ proc isOpImpl(c: PContext, n: PNode, flags: TExprFlags): PNode =
   if t1.kind == tyTypeDesc and t2.kind != tyTypeDesc:
     t1 = t1.base
 
-  if n[2].kind in {nkStrLit..nkTripleStrLit}:
+  if n[2].kind in nkStrLiterals:
     case n[2].strVal.normalize
     of "closure":
       let t = skipTypes(t1, abstractRange)
@@ -541,7 +541,7 @@ proc semIs(c: PContext, n: PNode, flags: TExprFlags): PNode =
   n[1] = semExprWithType(c, n[1], flags + {efWantIterator})
 
   case n[2].kind
-  of nkStrLit..nkTripleStrLit:
+  of nkStrLiterals:
     n[2] = semExpr(c, n[2])
   of nkError:
     discard # below we'll wrap the result in an error
@@ -671,7 +671,7 @@ proc changeType(c: PContext, n: PNode, newType: PType, check: bool): PNode =
       result = newError(c.config, n,
                         PAstDiag(kind: adSemNoTupleTypeForConstructor))
       return # hard error
-  of nkCharLit..nkUInt64Lit:
+  of nkIntLiterals:
     if check and n.kind != nkUInt64Lit and not sameType(n.typ, newType):
       let val = n.intVal
       if val < firstOrd(c.config, newType) or val > lastOrd(c.config, newType):
@@ -679,7 +679,7 @@ proc changeType(c: PContext, n: PNode, newType: PType, check: bool): PNode =
                           PAstDiag(kind: adSemCannotBeConvertedTo,
                                    inputVal: n,
                                    targetTyp: newType))
-  of nkFloatLit..nkFloat64Lit:
+  of nkFloatLiterals:
     if check and not floatRangeCheck(n.floatVal, newType):
       result = newError(c.config, n,
                         PAstDiag(kind: adSemCannotBeConvertedTo,
@@ -3601,7 +3601,7 @@ proc semExpr(c: PContext, n: PNode, flags: TExprFlags = {}): PNode =
     # handle `nkFloatLit` here to keep raw information of the float literal;
     # not sure why though, also why not do that for int?
     if result.typ == nil: result.typ = getSysType(c.graph, n.info, tyFloat64)
-  of nkStrLit..nkTripleStrLit:
+  of nkStrLiterals:
     if result.typ == nil: result.typ = getSysType(c.graph, n.info, tyString)
   of nkCharLit:
     if result.typ == nil: result.typ = getSysType(c.graph, n.info, tyChar)
diff --git a/compiler/sem/semfields.nim b/compiler/sem/semfields.nim
index 3ebc3719b20..0145db3bac8 100644
--- a/compiler/sem/semfields.nim
+++ b/compiler/sem/semfields.nim
@@ -23,7 +23,8 @@ proc instFieldLoopBody(c: TFieldInstCtx, n: PNode, forLoop: PNode): PNode =
     result = newNode(nkEmpty)
     return
   case n.kind
-  of nkEmpty..pred(nkIdent), succ(nkSym)..nkNilLit: result = copyNode(n)
+  of nkWithoutSons - {nkIdent, nkSym}:
+    result = copyNode(n)
   of nkIdent, nkSym:
     result = n
     let (ident, err) = considerQuotedIdent(c.c, n)
@@ -50,7 +51,7 @@ proc instFieldLoopBody(c: TFieldInstCtx, n: PNode, forLoop: PNode): PNode =
           result.add(tupl)
           result.add(newSymNode(c.field, n.info))
         break
-  else:
+  of nkWithSons:
     if n.kind == nkContinueStmt:
       localReport(c.c.config, n, reportSem rsemFieldsIteratorCannotContinue)
     result = shallowCopy(n)
diff --git a/compiler/sem/semfold.nim b/compiler/sem/semfold.nim
index 66b5e4468f4..875f6f3fd6e 100644
--- a/compiler/sem/semfold.nim
+++ b/compiler/sem/semfold.nim
@@ -54,7 +54,7 @@ type
 
 const
   ExpressionNodes = nkCallKinds + nkLiterals + nkTypeExprs + {
-    nkSym, nkEmpty, nkNimNodeLit, nkNilLit,
+    nkSym, nkEmpty, nkNimNodeLit,
 
     nkRange, nkBracket, nkCurly, nkObjConstr, nkTupleConstr,
 
@@ -217,7 +217,7 @@ proc evalOp*(m: TMagic, n, a, b, c: PNode; idgen: IdGenerator; g: ModuleGraph):
   of mLengthSeq, mLengthOpenArray, mLengthStr:
     if a.kind == nkNilLit:
       result = newIntNodeT(Zero, n, idgen, g)
-    elif a.kind in {nkStrLit..nkTripleStrLit}:
+    elif a.kind in nkStrLiterals:
       if a.typ.kind == tyString:
         result = newIntNodeT(toInt128(a.strVal.len), n, idgen, g)
       elif a.typ.kind == tyCstring:
@@ -401,15 +401,15 @@ proc getConstIfExpr(c: PSym, n: PNode; idgen: IdGenerator; g: ModuleGraph): PNod
 proc leValueConv*(a, b: PNode): bool =
   result = false
   case a.kind
-  of nkCharLit..nkUInt64Lit:
+  of nkIntLiterals:
     case b.kind
-    of nkCharLit..nkUInt64Lit: result = a.getInt <= b.getInt
-    of nkFloatLit..nkFloat64Lit: result = a.intVal <= round(b.floatVal).int
+    of nkIntLiterals: result = a.getInt <= b.getInt
+    of nkFloatLiterals: result = a.intVal <= round(b.floatVal).int
     else: result = false #internalError(a.info, "leValueConv")
-  of nkFloatLit..nkFloat64Lit:
+  of nkFloatLiterals:
     case b.kind
-    of nkFloatLit..nkFloat64Lit: result = a.floatVal <= b.floatVal
-    of nkCharLit..nkUInt64Lit: result = a.floatVal <= toFloat64(b.getInt)
+    of nkFloatLiterals: result = a.floatVal <= b.floatVal
+    of nkIntLiterals: result = a.floatVal <= toFloat64(b.getInt)
     else: result = false # internalError(a.info, "leValueConv")
   else: result = false # internalError(a.info, "leValueConv")
 
@@ -562,7 +562,7 @@ proc foldArrayAccess(m: PSym, n: PNode; idgen: IdGenerator; g: ModuleGraph): PNo
     else:
       result = outOfBounds(n, x, y, g.config)
 
-  of nkStrLit..nkTripleStrLit:
+  of nkStrLiterals:
     if 0 <= idx and idx < x.strVal.len:
       result = newNodeIT(nkCharLit, x.info, n.typ)
       result.intVal = ord(x.strVal[int(idx)])
@@ -673,7 +673,7 @@ proc getConstExpr(m: PSym, n: PNode; idgen: IdGenerator; g: ModuleGraph): PNode
       else:
         result = newSymNodeTypeDesc(s, idgen, n.info)
     else: discard
-  of nkCharLit..nkNilLit:
+  of nkLiterals:
     result = copyNode(n)
   of nkIfExpr:
     result = getConstIfExpr(m, n, idgen, g)
@@ -838,7 +838,7 @@ proc foldConstExprAux(m: PSym, n: PNode, idgen: IdGenerator, g: ModuleGraph): Fo
 
   # first step: fold the sub-expressions
   case n.kind
-  of nkEmpty, nkLiterals, nkNimNodeLit, nkNilLit:
+  of nkEmpty, nkLiterals, nkNimNodeLit:
     # short-circuit the following ``getConstExpr`` call, so that no
     # unnecessary copy of the node is created
     return
diff --git a/compiler/sem/semgnrc.nim b/compiler/sem/semgnrc.nim
index eaa4596cb53..3e510a55760 100644
--- a/compiler/sem/semgnrc.nim
+++ b/compiler/sem/semgnrc.nim
@@ -235,7 +235,7 @@ proc semGenericStmt(c: PContext, n: PNode,
     let a = n.sym
     let b = getGenSym(c, a)
     if b != a: n.sym = b
-  of nkEmpty, succ(nkSym)..nkNilLit, nkCommentStmt:
+  of nkWithoutSons - {nkIdent, nkSym}:
     # see tests/compile/tgensymgeneric.nim:
     # We need to open the gensym'ed symbol again so that the instantiation
     # creates a fresh copy; but this is wrong the very first reason for gensym
diff --git a/compiler/sem/semmagic.nim b/compiler/sem/semmagic.nim
index 0fbb1d84380..a2e826b97a6 100644
--- a/compiler/sem/semmagic.nim
+++ b/compiler/sem/semmagic.nim
@@ -105,7 +105,7 @@ proc semIsPartOf(c: PContext, n: PNode, flags: TExprFlags): PNode =
 proc expectIntLit(c: PContext, n: PNode): int =
   let x = c.semConstExpr(c, n)
   case x.kind
-  of nkIntLit..nkInt64Lit: result = int(x.intVal)
+  of nkSIntLiterals: result = int(x.intVal)
   else: localReport(c.config, n, reportSem rsemIntLiteralExpected)
 
 proc semInstantiationInfo(c: PContext, n: PNode): PNode =
diff --git a/compiler/sem/semobjconstr.nim b/compiler/sem/semobjconstr.nim
index 9b7f16a13bf..a8c32e1bcf6 100644
--- a/compiler/sem/semobjconstr.nim
+++ b/compiler/sem/semobjconstr.nim
@@ -222,7 +222,7 @@ proc checkConstructFields(c: PContext, n: PNode,
 
       if discriminatorVal != nil and discriminatorVal.kind != nkError:
         discriminatorVal = discriminatorVal.skipHidden
-        if discriminatorVal.kind notin nkLiterals and (
+        if discriminatorVal.kind notin nkLiterals - nkNilLit and (
             not isOrdinalType(discriminatorVal.typ, true) or
             lengthOrd(c.config, discriminatorVal.typ) > MaxSetElements or
             lengthOrd(c.config, n[0].typ) > MaxSetElements):
diff --git a/compiler/sem/sempass2.nim b/compiler/sem/sempass2.nim
index 713154ac4b5..74b6e2e2c89 100644
--- a/compiler/sem/sempass2.nim
+++ b/compiler/sem/sempass2.nim
@@ -163,7 +163,8 @@ proc getLockLevel(t: PType): TLockLevel =
   var t = t
   # tyGenericInst(TLock {tyGenericBody}, tyStatic, tyObject):
   if t.kind == tyGenericInst and t.len == 3: t = t[1]
-  if t.kind == tyStatic and t.n != nil and t.n.kind in {nkCharLit..nkInt64Lit}:
+  if t.kind == tyStatic and t.n != nil and t.n.kind in nkIntLiterals:
+    assert t.n.kind in nkSIntLiterals
     result = t.n.intVal.TLockLevel
 
 proc lockLocations(a: PEffects; pragma: PNode) =
@@ -694,7 +695,7 @@ proc notNilCheck(tracked: PEffects, n: PNode, paramType: PType) =
         # addr(x[]) can't be proven, but addr(x) can:
         if not containsNode(n, {nkDerefExpr, nkHiddenDeref}): return
       elif (n.kind == nkSym and n.sym.kind in routineKinds) or
-          (n.kind in procDefs+{nkObjConstr, nkBracket, nkClosure, nkStrLit..nkTripleStrLit}) or
+          (n.kind in procDefs + {nkObjConstr, nkBracket, nkClosure} + nkStrLiterals) or
           (n.kind in nkCallKinds and n[0].kind == nkSym and n[0].sym.magic == mArrToSeq) or
           n.typ.kind == tyTypeDesc:
         # 'p' is not nil obviously:
@@ -1008,7 +1009,7 @@ proc trackCall(tracked: PEffects; n: PNode) =
       let arg = n[1]
       initVarViaNew(tracked, arg)
       if arg.typ.len != 0 and {tfRequiresInit} * arg.typ.lastSon.flags != {}:
-        if a.sym.magic == mNewSeq and n[2].kind in {nkCharLit..nkUInt64Lit} and
+        if a.sym.magic == mNewSeq and n[2].kind in nkIntLiterals and
             n[2].intVal == 0:
           # var s: seq[notnil];  newSeq(s, 0)  is a special case!
           discard
@@ -1124,14 +1125,14 @@ proc trackInnerProc(tracked: PEffects, n: PNode) =
     let s = n.sym
     if s.kind == skParam and s.owner == tracked.owner:
       tracked.escapingParams.incl s.id
-  of nkNone..pred(nkSym), succ(nkSym)..nkNilLit:
+  of nkWithoutSons - nkSym:
     discard
   of nkProcDef, nkConverterDef, nkMethodDef, nkIteratorDef, nkLambda, nkFuncDef, nkDo:
     if n[0].kind == nkSym and n[0].sym.ast != nil:
       trackInnerProc(tracked, getBody(tracked.graph, n[0].sym))
-  of nkTypeSection, nkMacroDef, nkTemplateDef, nkError,
+  of nkTypeSection, nkMacroDef, nkTemplateDef,
      nkConstSection, nkConstDef, nkIncludeStmt, nkImportStmt,
-     nkExportStmt, nkPragma, nkCommentStmt, nkTypeOfExpr, nkMixinStmt,
+     nkExportStmt, nkPragma, nkTypeOfExpr, nkMixinStmt,
      nkBindStmt:
     discard
   else:
@@ -1139,7 +1140,7 @@ proc trackInnerProc(tracked: PEffects, n: PNode) =
 
 proc allowCStringConv(n: PNode): bool =
   case n.kind
-  of nkStrLit..nkTripleStrLit: result = true
+  of nkStrLiterals: result = true
   of nkSym: result = n.sym.kind in {skConst, skParam}
   of nkAddr: result = isCharArrayPtr(n.typ, true)
   of nkCallKinds:
diff --git a/compiler/sem/semstmts.nim b/compiler/sem/semstmts.nim
index 72a669dfe28..ed49396a823 100644
--- a/compiler/sem/semstmts.nim
+++ b/compiler/sem/semstmts.nim
@@ -339,7 +339,7 @@ proc fitRemoveHiddenConv(c: PContext, typ: PType, n: PNode): PNode =
   case result.kind
   of nkHiddenStdConv, nkHiddenSubConv:
     let r1 = result[1]
-    if r1.kind in {nkCharLit..nkUInt64Lit} and
+    if r1.kind in nkIntLiterals and
        typ.skipTypes(abstractRange).kind in {tyFloat..tyFloat64}:
       result = newFloatNode(nkFloatLit, BiggestFloat r1.intVal)
       result.info = n.info
diff --git a/compiler/sem/semtempl.nim b/compiler/sem/semtempl.nim
index e8f86c3e2a1..554c08ea14a 100644
--- a/compiler/sem/semtempl.nim
+++ b/compiler/sem/semtempl.nim
@@ -648,7 +648,7 @@ proc semTemplBody(c: var TemplCtx, n: PNode): PNode =
   of nkMixinStmt:
     if c.scopeN > 0: result = semTemplBodySons(c, n)
     else: result = semMixinStmt(c.c, n, c.toMixin)
-  of nkEmpty, nkSym..nkNilLit:
+  of nkWithoutSons - nkIdent:
     discard
   of nkIfStmt:
     for i in 0..<n.len:
@@ -954,8 +954,6 @@ proc semTemplBody(c: var TemplCtx, n: PNode): PNode =
 
       if result[i].isError:
         hasError = true
-  of nkError, nkCommentStmt:
-    result = n
   else:
     result = semTemplBodySons(c, n)
   
@@ -1009,7 +1007,7 @@ proc semTemplBodyDirty(c: var TemplCtx, n: PNode): PNode =
     result = semTemplBodyDirty(c, n[0])
   of nkBindStmt:
     result = semBindStmt(c.c, n, c.toBind)
-  of nkEmpty, nkSym..nkNilLit, nkError, nkCommentStmt:
+  of nkWithoutSons - nkIdent:
     discard
   of nkDotExpr, nkAccQuoted:
     # dotExpr is ambiguous: note that we explicitly allow 'x.TemplateParam',
@@ -1220,7 +1218,7 @@ proc semPatternBody(c: var TemplCtx, n: PNode): PNode =
           # more flexibility
   of nkBindStmt:
     result = semBindStmt(c.c, n, c.toBind)
-  of nkEmpty, nkSym..nkNilLit:
+  of nkWithoutSons - nkIdent:
     discard
   of nkCurlyExpr:
     # we support '(pattern){x}' to bind a subpattern to a parameter 'x';
diff --git a/compiler/sem/semtypes.nim b/compiler/sem/semtypes.nim
index 9076eb9d078..6dbd5dc5a31 100644
--- a/compiler/sem/semtypes.nim
+++ b/compiler/sem/semtypes.nim
@@ -412,8 +412,8 @@ proc semRangeAux(c: PContext, n: PNode, prev: PType): PType =
     elif enumHasHoles(rangeT[0]):
       localReport(c.config, n.info, reportTyp(rsemExpectedUnholyEnum, rangeT[0]))
 
-  if (result.n[0].kind in {nkFloatLit..nkFloat64Lit} and result.n[0].floatVal.isNaN) or
-      (result.n[1].kind in {nkFloatLit..nkFloat64Lit} and result.n[1].floatVal.isNaN):
+  if (result.n[0].kind in nkFloatLiterals and result.n[0].floatVal.isNaN) or
+      (result.n[1].kind in nkFloatLiterals and result.n[1].floatVal.isNaN):
     localReport(c.config, n, reportSem rsemRangeDoesNotSupportNan)
 
   if weakLeValue(result.n[0], result.n[1]) == impNo:
@@ -427,14 +427,14 @@ proc semRange(c: PContext, n: PNode, prev: PType): PType =
     if isRange(n[1]):
       result = semRangeAux(c, n[1], prev)
       let n = result.n
-      if n[0].kind in {nkCharLit..nkUInt64Lit} and n[0].intVal > 0:
+      if n[0].kind in nkIntLiterals and n[0].intVal > 0:
         incl(result.flags, tfRequiresInit)
-      elif n[1].kind in {nkCharLit..nkUInt64Lit} and n[1].intVal < 0:
+      elif n[1].kind in nkIntLiterals and n[1].intVal < 0:
         incl(result.flags, tfRequiresInit)
-      elif n[0].kind in {nkFloatLit..nkFloat64Lit} and
+      elif n[0].kind in nkFloatLiterals and
           n[0].floatVal > 0.0:
         incl(result.flags, tfRequiresInit)
-      elif n[1].kind in {nkFloatLit..nkFloat64Lit} and
+      elif n[1].kind in nkFloatLiterals and
           n[1].floatVal < 0.0:
         incl(result.flags, tfRequiresInit)
     else:
@@ -481,7 +481,7 @@ proc semArrayIndex(c: PContext, n: PNode): PType =
 
     # an expression that doesn't reference type variables
     e = semExprWithType(c, e)
-    if e.kind in {nkIntLit..nkUInt64Lit}:
+    if e.kind in nkIntLiterals:
       if e.intVal < 0:
         localReport(c.config, n.info,
           SemReport(
@@ -492,7 +492,7 @@ proc semArrayIndex(c: PContext, n: PNode): PType =
       result = makeRangeType(c, 0, e.intVal-1, n.info, e.typ)
     else:
       let x = semConstExpr(c, e)
-      if x.kind in {nkIntLit..nkUInt64Lit}:
+      if x.kind in nkIntLiterals:
         result = makeRangeType(c, 0, x.intVal-1, n.info,
                              x.typ.skipTypes({tyTypeDesc}))
       else:
diff --git a/compiler/sem/semtypinst.nim b/compiler/sem/semtypinst.nim
index 2954006cb22..7e90a126ff7 100644
--- a/compiler/sem/semtypinst.nim
+++ b/compiler/sem/semtypinst.nim
@@ -306,7 +306,7 @@ proc replaceTypeVarsN(cl: var TReplTypeVars, n: PNode; start=0): PNode =
   if n.typ != nil:
     result.typ = replaceTypeVarsT(cl, n.typ)
   case n.kind
-  of nkNone..pred(nkSym), succ(nkSym)..nkNilLit:
+  of nkWithoutSons - nkSym:
     discard
   of nkOpenSymChoice, nkClosedSymChoice: result = n
   of nkSym:
diff --git a/compiler/sem/sighashes.nim b/compiler/sem/sighashes.nim
index 701606082b1..1c10717784e 100644
--- a/compiler/sem/sighashes.nim
+++ b/compiler/sem/sighashes.nim
@@ -22,7 +22,8 @@ import
     modulegraphs
   ],
   compiler/utils/[
-    ropes
+    ropes,
+    idioms
   ]
 
 proc `&=`(c: var MD5Context, s: string) = md5Update(c, s, s.len)
@@ -82,22 +83,25 @@ proc hashTree(c: var MD5Context, n: PNode; flags: set[ConsiderFlag]) =
   # we really must not hash line information. 'n.typ' is debatable but
   # shouldn't be necessary for now and avoids potential infinite recursions.
   case n.kind
-  of nkEmpty, nkNilLit, nkType: discard
+  of nkNone, nkEmpty, nkNilLit, nkType, nkCommentStmt:
+    discard # ignore comments (could appear in a tyFromExpr)
+  of nkError:
+    unreachable()
   of nkIdent:
     c &= n.ident.s
   of nkSym:
     hashSym(c, n.sym)
     if CoHashTypeInsideNode in flags and n.sym.typ != nil:
       hashType(c, n.sym.typ, flags)
-  of nkCharLit..nkUInt64Lit:
+  of nkIntLiterals:
     let v = n.intVal
     lowlevel v
-  of nkFloatLit..nkFloat64Lit:
+  of nkFloatLiterals:
     let v = n.floatVal
     lowlevel v
-  of nkStrLit..nkTripleStrLit:
+  of nkStrLiterals:
     c &= n.strVal
-  else:
+  of nkWithSons:
     for i in 0..<n.len: hashTree(c, n[i], flags)
 
 proc hashType(c: var MD5Context, t: PType; flags: set[ConsiderFlag]) =
@@ -350,7 +354,10 @@ proc hashBodyTree(graph: ModuleGraph, c: var MD5Context, n: PNode) =
     return
   c &= char(n.kind)
   case n.kind
-  of nkEmpty, nkNilLit, nkType, nkCommentStmt: discard
+  of nkNone, nkEmpty, nkNilLit, nkType, nkCommentStmt:
+    discard # ignore comments
+  of nkError:
+    unreachable()
   of nkIdent:
     c &= n.ident.s
   of nkSym:
@@ -362,13 +369,13 @@ proc hashBodyTree(graph: ModuleGraph, c: var MD5Context, n: PNode) =
       c &= hashNonProc(n.sym)
   of nkProcDef, nkFuncDef, nkTemplateDef, nkMacroDef:
     discard # we track usage of proc symbols not their definition
-  of nkCharLit..nkUInt64Lit:
+  of nkIntLiterals:
     c &= n.intVal
-  of nkFloatLit..nkFloat64Lit:
+  of nkFloatLiterals:
     c &= n.floatVal
-  of nkStrLit..nkTripleStrLit:
+  of nkStrLiterals:
     c &= n.strVal
-  else:
+  of nkWithSons - {nkProcDef, nkFuncDef, nkTemplateDef, nkMacroDef} :
     for i in 0..<n.len:
       hashBodyTree(graph, c, n[i])
 
diff --git a/compiler/sem/transf.nim b/compiler/sem/transf.nim
index 0f69e8eb3c8..829171cb34c 100644
--- a/compiler/sem/transf.nim
+++ b/compiler/sem/transf.nim
@@ -295,9 +295,9 @@ proc transformConstSection(c: PTransf, v: PNode): PNode =
 
 proc hasContinue(n: PNode): bool =
   case n.kind
-  of nkEmpty..nkNilLit, nkCommentStmt, nkForStmt, nkWhileStmt: discard
+  of nkWithoutSons, nkForStmt, nkWhileStmt: discard
   of nkContinueStmt: result = true
-  else:
+  of nkWithSons - {nkForStmt, nkWhileStmt, nkContinueStmt}:
     for i in 0..<n.len:
       if hasContinue(n[i]): return true
 
@@ -420,7 +420,7 @@ proc introduceNewLocalVars(c: PTransf, n: PNode): PNode =
   case n.kind
   of nkSym:
     result = transformSym(c, n)
-  of nkEmpty..pred(nkSym), succ(nkSym)..nkNilLit, nkCommentStmt:
+  of nkWithoutSons - nkSym:
     # nothing to be done for leaves:
     result = n
   of callableDefs:
@@ -721,13 +721,13 @@ proc findWrongOwners(c: PTransf, n: PNode) =
 proc isSimpleIteratorVar(c: PTransf; iter: PSym): bool =
   proc rec(n: PNode; owner: PSym; dangerousYields: var int) =
     case n.kind
-    of nkEmpty..nkNilLit: discard
+    of nkWithoutSons: discard
     of nkYieldStmt:
       if n[0].kind == nkSym and n[0].sym.owner == owner:
         discard "good: yield a single variable that we own"
       else:
         inc dangerousYields
-    else:
+    of nkWithSons - nkYieldStmt:
       for c in n: rec(c, owner, dangerousYields)
 
   var dangerousYields = 0
@@ -1136,7 +1136,7 @@ proc transform(c: PTransf, n: PNode): PNode =
     unreachable("errors can't reach here")
   of nkSym:
     result = transformSym(c, n)
-  of nkEmpty..pred(nkSym), succ(nkSym)..nkNilLit:
+  of nkWithoutSons - {nkSym, nkError}:
     # nothing to be done for leaves:
     result = n
   of nkBracketExpr: result = transformArrayAccess(c, n)
@@ -1212,7 +1212,7 @@ proc transform(c: PTransf, n: PNode): PNode =
         # ensure that e.g. discard "some comment" gets optimized away
         # completely:
         result = newNode(nkCommentStmt)
-  of nkCommentStmt, nkTemplateDef, nkImportStmt, nkStaticStmt,
+  of nkTemplateDef, nkImportStmt, nkStaticStmt,
       nkExportStmt, nkExportExceptStmt:
     return n
   of nkConstSection:
diff --git a/compiler/sem/typeallowed.nim b/compiler/sem/typeallowed.nim
index 6fecd323ee1..2493c710ee6 100644
--- a/compiler/sem/typeallowed.nim
+++ b/compiler/sem/typeallowed.nim
@@ -38,9 +38,9 @@ proc typeAllowedNode(marker: var IntSet, n: PNode, kind: TSymKind,
     result = typeAllowedAux(marker, n.typ, kind, c, flags)
     if result == nil:
       case n.kind
-      of nkNone..nkNilLit:
+      of nkWithoutSons:
         discard
-      else:
+      of nkWithSons:
         #if n.kind == nkRecCase and kind in {skProc, skFunc, skConst}:
         #  return n[0].typ
         for i in 0..<n.len:
diff --git a/compiler/sem/varpartitions.nim b/compiler/sem/varpartitions.nim
index 2aaca7df9c7..cb2662057a3 100644
--- a/compiler/sem/varpartitions.nim
+++ b/compiler/sem/varpartitions.nim
@@ -292,7 +292,7 @@ proc connect(v: var Partitions; a, b: PSym; info: TLineInfo) =
 
 proc borrowFromConstExpr(n: PNode): bool =
   case n.kind
-  of nkCharLit..nkNilLit:
+  of nkLiterals:
     result = true
   of nkExprEqExpr, nkExprColonExpr, nkHiddenStdConv, nkHiddenSubConv,
       nkCast, nkObjUpConv, nkObjDownConv:
@@ -440,7 +440,7 @@ proc destMightOwn(c: var Partitions; dest: var VarIndex; n: PNode) =
   ## Analyse if 'n' is an expression that owns the data, if so mark 'dest'
   ## with 'ownsData'.
   case n.kind
-  of nkEmpty, nkCharLit..nkNilLit:
+  of nkEmpty, nkLiterals:
     # primitive literals including the empty are harmless:
     discard
 
@@ -665,11 +665,11 @@ proc deps(c: var Partitions; dest, src: PNode) =
                 c.s[vid].flags.incl preventCursor
 
 const
-  nodesToIgnoreSet = {nkNone..pred(nkSym), succ(nkSym)..nkNilLit,
+  nodesToIgnoreSet = nkWithoutSons - nkSym + {
     nkTypeSection, nkProcDef, nkConverterDef,
     nkMethodDef, nkIteratorDef, nkMacroDef, nkTemplateDef, nkLambda, nkDo,
     nkFuncDef, nkConstSection, nkConstDef, nkIncludeStmt, nkImportStmt,
-    nkExportStmt, nkPragma, nkCommentStmt, nkTypeOfExpr, nkMixinStmt,
+    nkExportStmt, nkPragma, nkTypeOfExpr, nkMixinStmt,
     nkBindStmt}
 
 proc potentialMutationViaArg(c: var Partitions; n: PNode; callee: PType) =
diff --git a/compiler/tools/docgen.nim b/compiler/tools/docgen.nim
index 1fc2a99921a..1f3729735b8 100644
--- a/compiler/tools/docgen.nim
+++ b/compiler/tools/docgen.nim
@@ -892,7 +892,7 @@ proc genDeprecationMsg(d: PDoc, n: PNode): string =
     result = getConfigVar(d.conf, "doc.deprecationmsg") % [
        "label" , "Deprecated", "message", ""]
   of 2: # Deprecated w/ a message
-    if n[1].kind in {nkStrLit..nkTripleStrLit}:
+    if n[1].kind in nkStrLiterals:
       result = getConfigVar(d.conf, "doc.deprecationmsg") % [
           "label", "Deprecated:", "message", xmltree.escape(n[1].strVal)]
   else:
diff --git a/compiler/utils/astrepr.nim b/compiler/utils/astrepr.nim
index 47a10e3c74b..13b1cbbdb9f 100644
--- a/compiler/utils/astrepr.nim
+++ b/compiler/utils/astrepr.nim
@@ -681,19 +681,19 @@ proc cyclicTreeAux(n: PNode, visited: var seq[PNode], count: var int): bool =
 
   inc count
   case n.kind
-  of {nkEmpty..nkNilLit}:
+  of nkWithoutSons - nkError:
     discard
-  else:
+  of nkWithSons, nkError:
     visited.add(n)
 
-    let sons =
+    let nWithSons =
       case n.kind
       of nkError:
-        @[n.diag.wrongNode]
+        n.diag.wrongNode
       else:
-        @[]
+        n
 
-    for nSon in sons:
+    for nSon in nWithSons.items:
       if cyclicTreeAux(nSon, visited, count):
         return true
 
@@ -854,12 +854,12 @@ proc treeRepr*(
         add "\"" & n.strVal + style.strLit & "\""
         postLiteral()
 
-      of nkCharLit .. nkUInt64Lit:
+      of nkIntLiterals:
         add " "
         add $n.intVal + style.number
         postLiteral()
 
-      of nkFloatLit .. nkFloat64Lit:
+      of nkFloatLiterals:
         add " "
         add $n.floatVal + style.floatLit
         postLiteral()
@@ -909,7 +909,7 @@ proc treeRepr*(
       else:
         discard
 
-    if n.kind notin {nkNone .. nkNilLit, nkCommentStmt}:
+    if n.kind notin nkWithoutSons - nkError:
       addFlags()
       if (n.kind == nkError and trfSkipAuxError notin rconf) or
           (n.kind != nkError and n.len > 0):
diff --git a/compiler/vm/packed_env.nim b/compiler/vm/packed_env.nim
index 35fb26ed657..305befd81e5 100644
--- a/compiler/vm/packed_env.nim
+++ b/compiler/vm/packed_env.nim
@@ -733,12 +733,12 @@ proc loadNode(dec: var TypeInfoDecoder, ps: PackedEnv, id: NodeId): (PNode, int3
   case n.kind
   of nkEmpty, nkType, nkNilLit, nkCommentStmt:
     discard "do nothing"
-  of nkCharLit..nkUInt64Lit:
+  of nkIntLiterals:
     r.intVal = ps.numbers[n.operand.LitId]
-  of nkFloatLit..nkFloat64Lit:
+  of nkFloatLiterals:
     # use a `cast` to preserve the bit representation:
     r.floatVal = cast[BiggestFloat](ps.numbers[n.operand.LitId])
-  of nkStrLit..nkTripleStrLit:
+  of nkStrLiterals:
     r.strVal = ps.strings[n.operand.LitId]
   of nkSym:
     r.sym = dec.loadSym(ps, n.operand.SymId)
diff --git a/compiler/vm/vm.nim b/compiler/vm/vm.nim
index f3646516021..8ec5a6b354b 100644
--- a/compiler/vm/vm.nim
+++ b/compiler/vm/vm.nim
@@ -2386,7 +2386,7 @@ proc rawExecute(c: var TCtx, t: var VmThread, pc: var int): YieldReason =
       let src = regs[rb].nimNode
       # TODO: This if-else block should be reordered so as to match the
       #       expectation of occurence
-      if src.kind in {nkEmpty..nkNilLit, nkError}:
+      if src.kind in nkWithoutSons:
         raiseVmError(VmEvent(kind: vmEvtCannotGetChild, ast: src))
       elif idx >=% src.len:
         raiseVmError(reportVmIdx(idx, src.len - 1))
@@ -2398,7 +2398,7 @@ proc rawExecute(c: var TCtx, t: var VmThread, pc: var int): YieldReason =
       var dest = regs[ra].nimNode
       if nfSem in dest.flags:
         raiseVmError(VmEvent(kind: vmEvtCannotModifyTypechecked))
-      elif dest.kind in {nkEmpty..nkNilLit, nkError}:
+      elif dest.kind in nkWithoutSons:
         raiseVmError(VmEvent(kind: vmEvtCannotSetChild, ast: dest))
       elif idx >=% dest.len:
         raiseVmError(reportVmIdx(idx, dest.len - 1))
@@ -2409,7 +2409,7 @@ proc rawExecute(c: var TCtx, t: var VmThread, pc: var int): YieldReason =
       var u = regs[rb].nimNode
       if nfSem in u.flags:
         raiseVmError(VmEvent(kind: vmEvtCannotModifyTypechecked))
-      elif u.kind in {nkEmpty..nkNilLit, nkError}:
+      elif u.kind in nkWithoutSons:
         raiseVmError(VmEvent(kind: vmEvtCannotAddChild, ast: u))
       else:
         u.add(regs[rc].nimNode)
@@ -2425,7 +2425,7 @@ proc rawExecute(c: var TCtx, t: var VmThread, pc: var int): YieldReason =
       var u = regs[rb].nimNode
       if nfSem in u.flags:
         raiseVmError(VmEvent(kind: vmEvtCannotModifyTypechecked))
-      elif u.kind in {nkEmpty..nkNilLit, nkError}:
+      elif u.kind in nkWithoutSons:
         raiseVmError(VmEvent(kind: vmEvtCannotAddChild, ast: u))
       else:
         let L = arrayLen(x)
@@ -2450,7 +2450,7 @@ proc rawExecute(c: var TCtx, t: var VmThread, pc: var int): YieldReason =
     of opcNIntVal:
       decodeB(rkInt)
       let a = regs[rb].nimNode
-      if a.kind in {nkCharLit..nkUInt64Lit}:
+      if a.kind in nkIntLiterals:
         regs[ra].intVal = a.intVal
       elif a.kind == nkSym and a.sym.kind == skEnumField:
         regs[ra].intVal = a.sym.position
@@ -2460,7 +2460,7 @@ proc rawExecute(c: var TCtx, t: var VmThread, pc: var int): YieldReason =
       decodeB(rkFloat)
       let a = regs[rb].nimNode
       case a.kind
-      of nkFloatLit..nkFloat64Lit: regs[ra].floatVal = a.floatVal
+      of nkFloatLiterals: regs[ra].floatVal = a.floatVal
       else: raiseVmError(VmEvent(kind: vmEvtFieldNotFound, msg: "floatVal"))
     of opcNodeId:
       decodeB(rkInt)
@@ -2538,7 +2538,7 @@ proc rawExecute(c: var TCtx, t: var VmThread, pc: var int): YieldReason =
       decodeB(akString)
       let a = regs[rb].nimNode
       case a.kind
-      of nkStrLit..nkTripleStrLit:
+      of nkStrLiterals:
         regs[ra].strVal = a.strVal
       of nkCommentStmt:
         regs[ra].strVal = a.comment
@@ -2724,7 +2724,7 @@ proc rawExecute(c: var TCtx, t: var VmThread, pc: var int): YieldReason =
     of opcNSetIntVal:
       decodeB(rkNimNode)
       var dest = regs[ra].nimNode
-      if dest.kind in {nkCharLit..nkUInt64Lit}:
+      if dest.kind in nkIntLiterals:
         dest.intVal = regs[rb].intVal
       elif dest.kind == nkSym and dest.sym.kind == skEnumField:
         raiseVmError(VmEvent(
@@ -2735,7 +2735,7 @@ proc rawExecute(c: var TCtx, t: var VmThread, pc: var int): YieldReason =
     of opcNSetFloatVal:
       decodeB(rkNimNode)
       var dest = regs[ra].nimNode
-      if dest.kind in {nkFloatLit..nkFloat64Lit}:
+      if dest.kind in nkFloatLiterals:
         dest.floatVal = regs[rb].floatVal
       else:
         raiseVmError(VmEvent(kind: vmEvtFieldNotFound, msg: "floatVal"))
@@ -2744,7 +2744,7 @@ proc rawExecute(c: var TCtx, t: var VmThread, pc: var int): YieldReason =
       checkHandle(regs[rb])
       var dest = regs[ra].nimNode
       assert regs[rb].handle.typ.kind == akString
-      if dest.kind in {nkStrLit..nkTripleStrLit}:
+      if dest.kind in nkStrLiterals:
         dest.strVal = $regs[rb].strVal
       elif dest.kind == nkCommentStmt:
         dest.comment = $regs[rb].strVal
diff --git a/tests/errmsgs/tnnodeindexkind.nim b/tests/errmsgs/tnnodeindexkind.nim
index 9ea045e6658..b07662e2edc 100644
--- a/tests/errmsgs/tnnodeindexkind.nim
+++ b/tests/errmsgs/tnnodeindexkind.nim
@@ -1,8 +1,17 @@
 discard """
-  errormsg: "cannot set child of node kind: nnkStrLit"
-  line: 7
+  matrix: "--errorMax:2"
+  action: reject
+  nimout: '''
+tnnodeindexkind.nim(11, 4) Error: cannot set child of node kind: nnkStrLit
+tnnodeindexkind.nim(15, 7) Error: cannot set child of node kind: nnkCommentStmt
+'''
 """
 import macros
 macro t(x: untyped): untyped =
   x[0] = newEmptyNode()
 t("abc")
+
+macro t2(x: untyped): untyped =
+  x[0][0] = newEmptyNode()
+t2:
+  ## comment
diff --git a/tests/lang_experimental/trmacros/trmacros_various2.nim b/tests/lang_experimental/trmacros/trmacros_various2.nim
index c1367cb1be2..44941a02dff 100644
--- a/tests/lang_experimental/trmacros/trmacros_various2.nim
+++ b/tests/lang_experimental/trmacros/trmacros_various2.nim
@@ -6,6 +6,8 @@ output: '''
 hel
 lo
 my awesome concat
+1
+TRM
 '''
 """
 
@@ -87,3 +89,13 @@ in_to_out(char, int)
 
 # This works
 proc to_out2(x: char{lit}): int = result = ord(x)
+
+# Unsigned literals
+template times3is1{`*`(u,3'u)}(u: uint): uint = 1
+var u = 3'u
+echo u * 3'u # 1
+
+# Char literals
+template dontAppendE{`&`(s, 'E')}(s: string): string = s
+var s = "T"
+echo s & 'E' & 'R' & 'M'
diff --git a/tests/pragmas/tlocks.nim b/tests/pragmas/tlocks.nim
index ba66a2dca25..ad29e28624f 100644
--- a/tests/pragmas/tlocks.nim
+++ b/tests/pragmas/tlocks.nim
@@ -11,3 +11,13 @@ method testMethod(g: SomeDerived) =
 # ensure int literals still work
 proc plain*() {.locks: 0.} =
   discard
+
+# ensure unknown locklevel works
+proc plain2*() {.locks: "unknown".} =
+  discard
+
+# ensure char literals are rejected
+doAssert not compiles (;
+  proc plain3() {.locks: 'c'.} =
+    discard
+  )

From 23c71c44893600c91faf0844f49ab075536ec02d Mon Sep 17 00:00:00 2001
From: Clyybber <darkmine956@gmail.com>
Date: Mon, 11 Mar 2024 20:42:08 +0100
Subject: [PATCH 027/169] Remove nkNone and replace it with nkError (#1229)

## Summary
* Remove `nkNone` and replace it with `nkError`
* Move some `nkError` branches to the start of their case
statements

## Details
`nkNone` could be replaced by either `nkEmpty` or `nkError`. I chose
`nkError` here, as `nkNone` nodes already signified errors, albeit
compiler bugs.
That means that an uninitialized node that would previously be of kind
`nkNone` is now of kind `nkError` and will cause a crash if its
uninitialized `diag` field is accessed.
This is IMO preferable to silently bubbling up uninitialized nodes
(that signify a compiler bug), but should not actually matter in
practice, as I don't think there are any recent or open known cases
where `nkNone` nodes were actually produced.
---
 compiler/ast/ast.nim                                |  2 +-
 compiler/ast/ast_types.nim                          | 12 +++++-------
 compiler/ast/trees.nim                              |  4 ++--
 compiler/ast/treetab.nim                            |  4 ++--
 compiler/front/condsyms.nim                         |  1 +
 compiler/front/sexp_reporter.nim                    |  2 +-
 compiler/ic/ic.nim                                  |  6 +++---
 compiler/sem/evaltempl.nim                          |  2 +-
 compiler/sem/guards.nim                             |  6 +++---
 compiler/sem/modulelowering.nim                     |  2 --
 compiler/sem/patterns.nim                           | 10 +++++-----
 compiler/sem/sem.nim                                |  2 +-
 compiler/sem/semexprs.nim                           |  2 +-
 compiler/sem/sighashes.nim                          |  8 ++++----
 compiler/vm/packed_env.nim                          |  6 +++---
 doc/astspec.txt                                     |  4 ++--
 lib/core/macros.nim                                 | 13 +++++--------
 tests/lang_callable/macros/tdumpast2.nim            |  2 +-
 tests/lang_callable/macros/tincremental.nim         |  2 +-
 tests/lang_callable/macros/tmacro3.nim              |  2 +-
 tests/lang_callable/macros/trecmacro.nim            |  2 +-
 tests/lang_callable/template/tparams_gensymed.nim   |  2 +-
 .../defer/tdefer_malformed_many_children.nim        |  2 +-
 23 files changed, 46 insertions(+), 52 deletions(-)

diff --git a/compiler/ast/ast.nim b/compiler/ast/ast.nim
index 58f01eaf313..3665b29341d 100644
--- a/compiler/ast/ast.nim
+++ b/compiler/ast/ast.nim
@@ -483,7 +483,7 @@ template copyNodeImpl(dst, src, processSonsStmt) =
   of nkSym: dst.sym = src.sym
   of nkIdent: dst.ident = src.ident
   of nkStrLiterals: dst.strVal = src.strVal
-  of nkEmpty, nkNone, nkNilLit, nkType, nkCommentStmt: discard "no children"
+  of nkEmpty, nkNilLit, nkType, nkCommentStmt: discard "no children"
   of nkError: dst.diag = src.diag # do cheap copies
   of nkWithSons: processSonsStmt
 
diff --git a/compiler/ast/ast_types.nim b/compiler/ast/ast_types.nim
index 86be02e8ffa..c5b048d0bb7 100644
--- a/compiler/ast/ast_types.nim
+++ b/compiler/ast/ast_types.nim
@@ -52,10 +52,9 @@ type
   TNodeKind* = enum
     ## order is important, because ranges are used to check whether a node
     ## belongs to a certain class
-
-    nkNone                ## unknown node kind: indicates an error
-                          ## Expressions:
-                          ## Atoms:
+    ## Expressions:
+    ## Atoms:
+    nkError               ## erroneous AST node see `errorhandling`
     nkEmpty               ## the node is empty
     nkIdent               ## node is an identifier
     nkSym                 ## node is a symbol
@@ -234,7 +233,6 @@ type
                           ## transformation
     nkFuncDef             ## a func
     nkTupleConstr         ## a tuple constructor
-    nkError               ## erroneous AST node see `errorhandling`
     nkNimNodeLit          ## a ``NimNode`` literal. Stores a single sub node
                           ## that represents the ``NimNode`` AST
     nkModuleRef           ## for .rod file support: A (moduleId, itemId) pair
@@ -254,7 +252,7 @@ const
   nkLiterals*      = nkIntLiterals + nkFloatLiterals + nkStrLiterals + nkNilLit
 
   nkWithoutSons* =
-    {nkEmpty, nkNone} +
+    {nkEmpty} +
     {nkIdent, nkSym} +
     {nkType} +
     nkLiterals +
@@ -1592,7 +1590,7 @@ type
       sym*: PSym
     of nkIdent:
       ident*: PIdent
-    of nkEmpty, nkNone, nkType, nkNilLit, nkCommentStmt:
+    of nkEmpty, nkType, nkNilLit, nkCommentStmt:
       discard
     of nkError:
       diag*: PAstDiag
diff --git a/compiler/ast/trees.nim b/compiler/ast/trees.nim
index 9452196c9dd..da324808325 100644
--- a/compiler/ast/trees.nim
+++ b/compiler/ast/trees.nim
@@ -60,7 +60,7 @@ proc exprStructuralEquivalent*(a, b: PNode; strictSymEquality=false): bool =
     of nkFloatLiterals: result = sameFloatIgnoreNan(a.floatVal, b.floatVal)
     of nkStrLiterals: result = a.strVal == b.strVal
     of nkCommentStmt: result = a.comment == b.comment
-    of nkNone, nkEmpty, nkNilLit, nkType: result = true
+    of nkEmpty, nkNilLit, nkType: result = true
     of nkError:
       unreachable()
     of nkWithSons:
@@ -91,7 +91,7 @@ proc sameTree*(a, b: PNode): bool =
                a.floatLitBase == b.floatLitBase
     of nkStrLiterals: result = a.strVal == b.strVal
     of nkCommentStmt: result = a.comment == b.comment
-    of nkNone, nkEmpty, nkNilLit, nkType: result = true
+    of nkEmpty, nkNilLit, nkType: result = true
     of nkError:
       unreachable()
     of nkWithSons:
diff --git a/compiler/ast/treetab.nim b/compiler/ast/treetab.nim
index 3677cda1010..7ec94f6074e 100644
--- a/compiler/ast/treetab.nim
+++ b/compiler/ast/treetab.nim
@@ -17,7 +17,7 @@ proc hashTree*(n: PNode): Hash =
     return
   result = ord(n.kind)
   case n.kind
-  of nkNone, nkEmpty, nkNilLit, nkType, nkCommentStmt, nkError:
+  of nkError, nkEmpty, nkNilLit, nkType, nkCommentStmt:
     discard
   of nkIdent:
     result = result !& n.ident.h
@@ -43,7 +43,7 @@ proc treesEquivalent(a, b: PNode): bool =
     result = true
   elif (a != nil) and (b != nil) and (a.kind == b.kind):
     case a.kind
-    of nkNone, nkEmpty, nkNilLit, nkType, nkCommentStmt, nkError: result = true
+    of nkError, nkEmpty, nkNilLit, nkType, nkCommentStmt: result = true
     of nkSym: result = a.sym.id == b.sym.id
     of nkIdent: result = a.ident.id == b.ident.id
     of nkIntLiterals: result = a.intVal == b.intVal
diff --git a/compiler/front/condsyms.nim b/compiler/front/condsyms.nim
index 1af4b0141cb..9746de20026 100644
--- a/compiler/front/condsyms.nim
+++ b/compiler/front/condsyms.nim
@@ -76,3 +76,4 @@ proc initDefines*(symbols: StringTableRef) =
   defineSymbol("nimskullNoFloat128")
   defineSymbol("nimskullNewExceptionRt")
   defineSymbol("nimskullNoNkStmtListTypeAndNkBlockType")
+  defineSymbol("nimskullNoNkNone")
diff --git a/compiler/front/sexp_reporter.nim b/compiler/front/sexp_reporter.nim
index 3848489e154..e6e5a551692 100644
--- a/compiler/front/sexp_reporter.nim
+++ b/compiler/front/sexp_reporter.nim
@@ -116,7 +116,7 @@ proc sexp*(node: PNode): SexpNode =
   result = newSList()
   result.add newSSymbol(($node.kind)[2 ..^ 1])
   case node.kind
-  of nkNone, nkEmpty, nkType, nkCommentStmt: discard
+  of nkEmpty, nkType, nkCommentStmt: discard
   of nkIntLiterals:             result.add sexp(node.intVal)
   of nkFloatLiterals:           result.add sexp(node.floatVal)
   of nkStrLiterals:             result.add sexp(node.strVal)
diff --git a/compiler/ic/ic.nim b/compiler/ic/ic.nim
index af802d82292..1692da69a9e 100644
--- a/compiler/ic/ic.nim
+++ b/compiler/ic/ic.nim
@@ -102,7 +102,7 @@ proc toString*(tree: PackedTree; n: NodePos; m: PackedModule; nesting: int;
 
   result.add $tree[pos].kind
   case tree.nodes[pos].kind
-  of nkNone, nkEmpty, nkNilLit, nkType, nkCommentStmt, nkError: discard
+  of nkError, nkEmpty, nkNilLit, nkType, nkCommentStmt: discard
   of nkIdent, nkStrLiterals:
     result.add " "
     result.add m.strings[LitId tree.nodes[pos].operand]
@@ -446,7 +446,7 @@ proc toPackedNode*(n: PNode; ir: var PackedTree; c: var PackedEncoder; m: var Pa
     return
   let info = toPackedInfo(n.info, c, m)
   case n.kind
-  of nkNone, nkEmpty, nkNilLit, nkType, nkCommentStmt, nkError:
+  of nkError, nkEmpty, nkNilLit, nkType, nkCommentStmt:
     ir.nodes.add PackedNode(kind: n.kind, flags: n.flags, operand: 0,
                             typeId: storeTypeLater(n.typ, c, m), info: info)
   of nkIdent:
@@ -776,7 +776,7 @@ proc loadNodes*(c: var PackedDecoder; g: var PackedModuleGraph; thisModule: int;
   result.flags = n.flags
 
   case k
-  of nkNone, nkEmpty, nkNilLit, nkType, nkCommentStmt, nkError:
+  of nkError, nkEmpty, nkNilLit, nkType, nkCommentStmt:
     discard
   of nkIdent:
     result.ident = getIdent(c.cache, g[thisModule].fromDisk.strings[n.litId])
diff --git a/compiler/sem/evaltempl.nim b/compiler/sem/evaltempl.nim
index 471d46327af..0411400f3a8 100644
--- a/compiler/sem/evaltempl.nim
+++ b/compiler/sem/evaltempl.nim
@@ -92,7 +92,7 @@ proc evalTemplateAux(templ, actual: PNode, c: var TemplCtx, result: PNode) =
           result.add newSymNode(x, if c.instLines: actual.info else: templ.info)
     else:
       result.add copyNode(c, templ, actual)
-  of nkNone..nkIdent, nkType..nkNilLit: # atom
+  of nkEmpty..nkIdent, nkType..nkNilLit: # atom
     result.add copyNode(c, templ, actual)
   of nkCommentStmt:
     # for the documentation generator we don't keep documentation comments
diff --git a/compiler/sem/guards.nim b/compiler/sem/guards.nim
index da8e0b426ea..74c1c838609 100644
--- a/compiler/sem/guards.nim
+++ b/compiler/sem/guards.nim
@@ -447,6 +447,8 @@ proc sameTree*(a, b: PNode): bool =
     result = true
   elif a != nil and b != nil and a.kind == b.kind:
     case a.kind
+    of nkError:
+      unreachable()
     of nkSym:
       result = a.sym == b.sym
       if not result and a.sym.magic != mNone:
@@ -456,10 +458,8 @@ proc sameTree*(a, b: PNode): bool =
     of nkFloatLiterals: result = a.floatVal == b.floatVal
     of nkStrLiterals: result = a.strVal == b.strVal
     of nkType: result = a.typ == b.typ
-    of nkNone, nkEmpty, nkNilLit, nkCommentStmt:
+    of nkEmpty, nkNilLit, nkCommentStmt:
       result = true # Ignore comments
-    of nkError:
-      unreachable()
     of nkWithSons:
       if a.len == b.len:
         for i in 0..<a.len:
diff --git a/compiler/sem/modulelowering.nim b/compiler/sem/modulelowering.nim
index cce620e81f9..8ee0ccded31 100644
--- a/compiler/sem/modulelowering.nim
+++ b/compiler/sem/modulelowering.nim
@@ -151,8 +151,6 @@ proc group(n: PNode, decl, imperative: var seq[PNode]) =
   of nkEmpty, nkError:
     # errors were already reported earlier
     discard "drop errors and empty nodes"
-  of nkNone:
-    unreachable()
   of nkStmtList:
     # flatten statement lists
     for it in n.items:
diff --git a/compiler/sem/patterns.nim b/compiler/sem/patterns.nim
index af41d94f013..391f19b2f9e 100644
--- a/compiler/sem/patterns.nim
+++ b/compiler/sem/patterns.nim
@@ -68,10 +68,10 @@ proc sameTrees*(a, b: PNode): bool =
     of nkIntLiterals: result = a.intVal == b.intVal
     of nkFloatLiterals: result = a.floatVal == b.floatVal
     of nkStrLiterals: result = a.strVal == b.strVal
-    of nkNone, nkEmpty, nkNilLit, nkCommentStmt:
-      result = true # Ignore comments
     of nkError:
       unreachable()
+    of nkEmpty, nkNilLit, nkCommentStmt:
+      result = true # Ignore comments
     of nkType: result = sameTypeOrNil(a.typ, b.typ)
     of nkWithSons:
       if a.len == b.len:
@@ -182,15 +182,15 @@ proc matches(c: PPatternContext, p, n: PNode): bool =
         result = bindOrCheck(c, p[1].sym, n)
   elif sameKinds(p, n):
     case p.kind
+    of nkError:
+      unreachable()
     of nkSym: result = p.sym == n.sym
     of nkIdent: result = p.ident.id == n.ident.id
     of nkIntLiterals: result = p.intVal == n.intVal
     of nkFloatLiterals: result = p.floatVal == n.floatVal
     of nkStrLiterals: result = p.strVal == n.strVal
-    of nkNone, nkEmpty, nkNilLit, nkType, nkCommentStmt:
+    of nkEmpty, nkNilLit, nkType, nkCommentStmt:
       result = true # Ignore comments
-    of nkError:
-      unreachable()
     of nkWithSons:
       # special rule for p(X) ~ f(...); this also works for stuff like
       # partial case statements, etc! - Not really ... :-/
diff --git a/compiler/sem/sem.nim b/compiler/sem/sem.nim
index 3d98df006e9..84ba9bfc3bd 100644
--- a/compiler/sem/sem.nim
+++ b/compiler/sem/sem.nim
@@ -603,7 +603,7 @@ proc tryConstExpr(c: PContext, n: PNode): PNode =
 
   result = evalConstExpr(c.module, c.idgen, c.graph, result)
   case result.kind
-  of nkEmpty, nkError:
+  of nkError, nkEmpty:
     result = nil
   else:
     discard
diff --git a/compiler/sem/semexprs.nim b/compiler/sem/semexprs.nim
index e19ed1ad859..0c51fe54b89 100644
--- a/compiler/sem/semexprs.nim
+++ b/compiler/sem/semexprs.nim
@@ -3571,7 +3571,7 @@ proc semExpr(c: PContext, n: PNode, flags: TExprFlags = {}): PNode =
     # because of the changed symbol binding, this does not mean that we
     # don't have to check the symbol for semantics here again!
     result = semSym(c, n, n.sym, flags)
-  of nkEmpty, nkNone, nkCommentStmt, nkType:
+  of nkEmpty, nkCommentStmt, nkType:
     discard
   of nkNilLit:
     if result.typ == nil: result.typ = getNilType(c)
diff --git a/compiler/sem/sighashes.nim b/compiler/sem/sighashes.nim
index 1c10717784e..1e417616928 100644
--- a/compiler/sem/sighashes.nim
+++ b/compiler/sem/sighashes.nim
@@ -83,10 +83,10 @@ proc hashTree(c: var MD5Context, n: PNode; flags: set[ConsiderFlag]) =
   # we really must not hash line information. 'n.typ' is debatable but
   # shouldn't be necessary for now and avoids potential infinite recursions.
   case n.kind
-  of nkNone, nkEmpty, nkNilLit, nkType, nkCommentStmt:
-    discard # ignore comments (could appear in a tyFromExpr)
   of nkError:
     unreachable()
+  of nkEmpty, nkNilLit, nkType, nkCommentStmt:
+    discard # ignore comments (could appear in a tyFromExpr)
   of nkIdent:
     c &= n.ident.s
   of nkSym:
@@ -354,10 +354,10 @@ proc hashBodyTree(graph: ModuleGraph, c: var MD5Context, n: PNode) =
     return
   c &= char(n.kind)
   case n.kind
-  of nkNone, nkEmpty, nkNilLit, nkType, nkCommentStmt:
-    discard # ignore comments
   of nkError:
     unreachable()
+  of nkEmpty, nkNilLit, nkType, nkCommentStmt:
+    discard # ignore comments
   of nkIdent:
     c &= n.ident.s
   of nkSym:
diff --git a/compiler/vm/packed_env.nim b/compiler/vm/packed_env.nim
index 305befd81e5..a4776b0eb9b 100644
--- a/compiler/vm/packed_env.nim
+++ b/compiler/vm/packed_env.nim
@@ -667,8 +667,8 @@ func storeNode(enc: var TypeInfoEncoder, ps: var PackedEnv, n: PNode): NodeId =
     of nkWithSons:
       hasSons = true
       n.sons.len.int32
-    of nkError, nkNone:
-      unreachable("errors and invalid nodes must not reach here")
+    of nkError:
+      unreachable("errors must not reach here")
 
   result = ps.nimNodes.len.NodeId
   ps.nimNodes.add(PackedNodeLite(kind: n.kind, flags: n.flags,
@@ -753,7 +753,7 @@ proc loadNode(dec: var TypeInfoDecoder, ps: PackedEnv, id: NodeId): (PNode, int3
       nextId += skip
 
     return (r, nextId - id.int32)
-  of nkNone, nkError:
+  of nkError:
     # should have not been stored in the first place
     unreachable()
 
diff --git a/doc/astspec.txt b/doc/astspec.txt
index 6d3fa1f8c20..3ff99540b5f 100644
--- a/doc/astspec.txt
+++ b/doc/astspec.txt
@@ -10,7 +10,7 @@ contains:
 
   type
     NimNodeKind = enum     ## kind of a node; only explanatory
-      nnkNone,             ## invalid node kind
+      nnkError,            ## erroneous AST node
       nnkEmpty,            ## empty node
       nnkIdent,            ## node contains an identifier
       nnkIntLit,           ## node contains an int literal (example: 10)
@@ -22,7 +22,7 @@ contains:
     NimNode = ref NimNodeObj
     NimNodeObj = object
       case kind: NimNodeKind           ## the node's kind
-      of nnkNone, nnkEmpty, nnkNilLit:
+      of nnkError, nnkEmpty, nnkNilLit:
         discard                        ## node contains no additional fields
       of nnkCharLit..nnkUInt64Lit:
         intVal: BiggestInt             ## the int literal
diff --git a/lib/core/macros.nim b/lib/core/macros.nim
index f5a731cb857..40d9efba1ff 100644
--- a/lib/core/macros.nim
+++ b/lib/core/macros.nim
@@ -47,7 +47,8 @@ template skipEnumValue(define: untyped, predecessor: untyped; gap = 1): untyped
 
 type
   NimNodeKind* = enum
-    nnkNone, nnkEmpty, nnkIdent, nnkSym,
+    nnkError,  ## erroneous AST node
+    nnkEmpty, nnkIdent, nnkSym,
     nnkType, nnkCharLit, nnkIntLit, nnkInt8Lit,
     nnkInt16Lit, nnkInt32Lit, nnkInt64Lit, nnkUIntLit, nnkUInt8Lit,
     nnkUInt16Lit, nnkUInt32Lit, nnkUInt64Lit, nnkFloatLit,
@@ -111,8 +112,7 @@ type
     nnkGotoState,
     nnkFuncDef = skipEnumValue(nimHasNkBreakStateNodeRemoved, nnkGotoState, 2),
     nnkTupleConstr,
-    nnkError,  ## erroneous AST node
-    nnkNimNodeLit
+    nnkNimNodeLit = skipEnumValue(nimskullNoNkNone, nnkTupleConstr)
 
   NimNodeKinds* = set[NimNodeKind]
   NimTypeKind* = enum  # some types are no longer used, see ast.nim
@@ -843,8 +843,6 @@ proc treeTraverse(n: NimNode; res: var string; level = 0; isLisp = false, indent
     res.add(" " & $n.floatVal)
   of nnkStrLit .. nnkTripleStrLit, nnkCommentStmt, nnkIdent, nnkSym:
     res.add(" " & $n.strVal.newLit.repr)
-  of nnkNone:
-    assert false
   elif n.kind in {nnkOpenSymChoice, nnkClosedSymChoice} and collapseSymChoice:
     res.add(" " & $n.len)
     if n.len > 0:
@@ -885,7 +883,7 @@ proc astGenRepr*(n: NimNode): string {.benign.} =
   ## See also `repr`, `treeRepr`, and `lispRepr`.
 
   const
-    NodeKinds = {nnkEmpty, nnkIdent, nnkSym, nnkNone, nnkCommentStmt}
+    NodeKinds = {nnkEmpty, nnkIdent, nnkSym, nnkCommentStmt}
     LitKinds = {nnkCharLit..nnkInt64Lit, nnkFloatLit..nnkFloat64Lit, nnkStrLit..nnkTripleStrLit}
 
   proc traverse(res: var string, level: int, n: NimNode) {.benign.} =
@@ -906,7 +904,6 @@ proc astGenRepr*(n: NimNode): string {.benign.} =
     of nnkFloatLit..nnkFloat64Lit: res.add($n.floatVal)
     of nnkStrLit..nnkTripleStrLit, nnkCommentStmt, nnkIdent, nnkSym:
       res.add(n.strVal.newLit.repr)
-    of nnkNone: assert false
     elif n.kind in {nnkOpenSymChoice, nnkClosedSymChoice} and collapseSymChoice:
       res.add(", # unrepresentable symbols: " & $n.len)
       if n.len > 0:
@@ -1098,7 +1095,7 @@ proc last*(node: NimNode): NimNode = node[node.len-1]
 const
   RoutineNodes* = {nnkProcDef, nnkFuncDef, nnkMethodDef, nnkDo, nnkLambda,
                    nnkIteratorDef, nnkTemplateDef, nnkConverterDef, nnkMacroDef}
-  AtomicNodes* = {nnkNone..nnkNilLit}
+  AtomicNodes* = {nnkEmpty..nnkNilLit}
   CallNodes* = {nnkCall, nnkInfix, nnkPrefix, nnkPostfix, nnkCommand,
     nnkCallStrLit, nnkHiddenCallConv}
 
diff --git a/tests/lang_callable/macros/tdumpast2.nim b/tests/lang_callable/macros/tdumpast2.nim
index 005d268020c..09408f528d8 100644
--- a/tests/lang_callable/macros/tdumpast2.nim
+++ b/tests/lang_callable/macros/tdumpast2.nim
@@ -13,7 +13,7 @@ proc dumpit(n: NimNode): string {.compileTime.} =
   of nnkFloatLit..nnkFloat64Lit: add(result, $n.floatVal)
   of nnkStrLit..nnkTripleStrLit: add(result, n.strVal)
   of nnkIdent:                   add(result, n.strVal)
-  of nnkSym, nnkNone:            assert false
+  of nnkSym:                     assert false
   else:
     add(result, dumpit(n[0]))
     for j in 1..n.len-1:
diff --git a/tests/lang_callable/macros/tincremental.nim b/tests/lang_callable/macros/tincremental.nim
index 401d6f3f844..3a21a6761f7 100644
--- a/tests/lang_callable/macros/tincremental.nim
+++ b/tests/lang_callable/macros/tincremental.nim
@@ -41,7 +41,7 @@ macro graph_discovery(n: typed{nkSym}): untyped =
   var visited: seq[NimNode]
   proc discover(n: NimNode) = 
     case n.kind:
-      of nnkNone..pred(nnkSym), succ(nnkSym)..nnkNilLit: discard
+      of nnkEmpty..pred(nnkSym), succ(nnkSym)..nnkNilLit: discard
       of nnkSym:
         if n.symKind in {nskFunc, nskProc}:
           if n notin visited:
diff --git a/tests/lang_callable/macros/tmacro3.nim b/tests/lang_callable/macros/tmacro3.nim
index 38e8349e7e8..da348cc22fe 100644
--- a/tests/lang_callable/macros/tmacro3.nim
+++ b/tests/lang_callable/macros/tmacro3.nim
@@ -21,7 +21,7 @@ macro test2*(a: untyped): untyped =
     echo "That's weird"
     var o : NimNode = nil
     echo "  no its not!"
-    o = newNimNode(nnkNone)
+    o = newNimNode(nnkEmpty)
     if recurse > 0:
       testproc(recurse - 1)
   testproc(5)
diff --git a/tests/lang_callable/macros/trecmacro.nim b/tests/lang_callable/macros/trecmacro.nim
index d804178bc17..34c5d6b896b 100644
--- a/tests/lang_callable/macros/trecmacro.nim
+++ b/tests/lang_callable/macros/trecmacro.nim
@@ -6,7 +6,7 @@ discard """
 
 macro dump(n: untyped): untyped =
   dump(n)
-  if kind(n) == nnkNone:
+  if kind(n) == nnkEmpty:
     nil
   else:
     hint($kind(n))
diff --git a/tests/lang_callable/template/tparams_gensymed.nim b/tests/lang_callable/template/tparams_gensymed.nim
index c50b7961c73..79f98a825c7 100644
--- a/tests/lang_callable/template/tparams_gensymed.nim
+++ b/tests/lang_callable/template/tparams_gensymed.nim
@@ -30,7 +30,7 @@ template genNodeKind(kind, name: untyped) =
     for c in children:
       result.add(c)
 
-genNodeKind(nnkNone, None)
+genNodeKind(nnkEmpty, None)
 
 
 # Test that generics in templates still work (regression to fix #1915)
diff --git a/tests/lang_stmts/defer/tdefer_malformed_many_children.nim b/tests/lang_stmts/defer/tdefer_malformed_many_children.nim
index 20ed5fb30d0..9e9c9d8ebf3 100644
--- a/tests/lang_stmts/defer/tdefer_malformed_many_children.nim
+++ b/tests/lang_stmts/defer/tdefer_malformed_many_children.nim
@@ -13,4 +13,4 @@ macro bar(): untyped =
 proc foo() =
   bar()
 
-foo()
\ No newline at end of file
+foo()

From e223adb3cb0dfcb55bd5907c8dfe30bdbc007d7a Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Mon, 11 Mar 2024 23:57:15 +0000
Subject: [PATCH 028/169] build(deps): Bump softprops/action-gh-release from
 0.1.15 to 2.0.3 (#1232)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bumps

[softprops/action-gh-release](https://github.com/softprops/action-gh-release)
from 0.1.15 to 2.0.3.
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a

href="https://github.com/softprops/action-gh-release/releases">softprops/action-gh-release's
releases</a>.</em></p>
<blockquote>
<h2>v2.0.2</h2>
<ul>
<li>Revisit approach to <a

href="https://redirect.github.com/softprops/action-gh-release/pull/384">#384</a>
making unresolved pattern failures opt-in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/417">#417</a></li>
</ul>
<h2>v2.0.1</h2>
<ul>
<li>Add support for make_latest property <a

href="https://redirect.github.com/softprops/action-gh-release/pull/304">softprops/action-gh-release#304</a>
via <a

href="https://github.com/samueljseay"><code>@​samueljseay</code></a></li>
<li>Fail run if files setting contains invalid patterns <a

href="https://redirect.github.com/softprops/action-gh-release/pull/384">softprops/action-gh-release#384</a>
via <a
href="https://github.com/rpdelaney"><code>@​rpdelaney</code></a></li>
<li>Add support for proxy env variables (don't use node-fetch) <a

href="https://redirect.github.com/softprops/action-gh-release/pull/386/">softprops/action-gh-release#386</a>
via <a

href="https://github.com/timor-raiman"><code>@​timor-raiman</code></a></li>
<li>Suppress confusing warning when input_files is empty <a

href="https://redirect.github.com/softprops/action-gh-release/pull/389">softprops/action-gh-release#389</a>
via <a href="https://github.com/Drowze"><code>@​Drowze</code></a></li>
</ul>
<h2>v2.0.0</h2>
<ul>
<li>update actions.yml declaration to node20 to address warnings</li>
</ul>
</blockquote>
</details>
<details>
<summary>Changelog</summary>
<p><em>Sourced from <a

href="https://github.com/softprops/action-gh-release/blob/master/CHANGELOG.md">softprops/action-gh-release's
changelog</a>.</em></p>
<blockquote>
<h2>2.0.3</h2>
<ul>
<li>Declare <code>make_latest</code> as an input field in
<code>action.yml</code> <a

href="https://redirect.github.com/softprops/action-gh-release/pull/419">#419</a></li>
</ul>
<h2>2.0.2</h2>
<ul>
<li>Revisit approach to <a

href="https://redirect.github.com/softprops/action-gh-release/pull/384">#384</a>
making unresolved pattern failures opt-in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/417">#417</a></li>
</ul>
<h2>2.0.1</h2>
<ul>
<li>Add support for make_latest property <a

href="https://redirect.github.com/softprops/action-gh-release/pull/304">#304</a>
via <a

href="https://github.com/samueljseay"><code>@​samueljseay</code></a></li>
<li>Fail run if files setting contains invalid patterns <a

href="https://redirect.github.com/softprops/action-gh-release/pull/384">#384</a>
via <a
href="https://github.com/rpdelaney"><code>@​rpdelaney</code></a></li>
<li>Add support for proxy env variables (don't use node-fetch) <a

href="https://redirect.github.com/softprops/action-gh-release/pull/386/">#386</a>
via <a

href="https://github.com/timor-raiman"><code>@​timor-raiman</code></a></li>
<li>Suppress confusing warning when input_files is empty <a

href="https://redirect.github.com/softprops/action-gh-release/pull/389">#389</a>
via <a href="https://github.com/Drowze"><code>@​Drowze</code></a></li>
</ul>
<h2>2.0.0</h2>
<ul>
<li><code>2.0.0</code>!? this release corrects a disjunction between git
tag versions used in the marketplace and versions list this file.
Previous versions should have really been 1.*. Going forward this should
be better aligned.</li>
<li>Upgrade action.yml declaration to node20 to address
deprecations</li>
</ul>
</blockquote>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a

href="https://github.com/softprops/action-gh-release/commit/3198ee18f814cdf787321b4a32a26ddbf37acc52"><code>3198ee1</code></a>
prep release</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/7ee8e0638151a48bb421b567d7d53a07cb158121"><code>7ee8e06</code></a>
declare an update docs for make_latest input (<a

href="https://redirect.github.com/softprops/action-gh-release/issues/419">#419</a>)</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/d99959edae48b5ffffd7b00da66dcdb0a33a52ee"><code>d99959e</code></a>
prep release</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/0e39c679e8bac647fe5ad41070fe2295b0393d58"><code>0e39c67</code></a>
make pattern error opt in (<a

href="https://redirect.github.com/softprops/action-gh-release/issues/417">#417</a>)</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/20e085ccc73308c2c8e43ab8da4f8d7ecbb94d4e"><code>20e085c</code></a>
kick off 2.0.1 release</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/9f5c4d39bc56b5ed07f92f260dd05d33000058a6"><code>9f5c4d3</code></a>
update changelog</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/0bea76b22707a1871a52b97e07c80657071adb76"><code>0bea76b</code></a>
Add support for make_latest property (<a

href="https://redirect.github.com/softprops/action-gh-release/issues/304">#304</a>)</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/762fe13dfbc8921c36ebb81da5626a394a6a5b95"><code>762fe13</code></a>
typo in changelog</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/c0f2569fb90b35a0e2b043535a5778f437ec86ea"><code>c0f2569</code></a>
remove unused script</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/5743e060246b253faba6cb8e051511b63e7639c9"><code>5743e06</code></a>
update changelog</li>
<li>Additional commits viewable in <a

href="https://github.com/softprops/action-gh-release/compare/v0.1.15...v2.0.3">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility

score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=softprops/action-gh-release&package-manager=github_actions&previous-version=0.1.15&new-version=2.0.3)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase` .

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 .github/workflows/publisher.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/publisher.yml b/.github/workflows/publisher.yml
index 28b483edd74..e87c1367b16 100644
--- a/.github/workflows/publisher.yml
+++ b/.github/workflows/publisher.yml
@@ -101,7 +101,7 @@ jobs:
 
       - id: release
         name: Create pre-release
-        uses: softprops/action-gh-release@v0.1.15
+        uses: softprops/action-gh-release@v2.0.3
         with:
           prerelease: true
           files: ${{ steps.release-files.outputs.result }}

From df33ca4b3946016565fc0aee872a4ed61fa72be0 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Tue, 12 Mar 2024 18:45:26 +0100
Subject: [PATCH 029/169] jsgen: use the new-style CGIR (#1230)

## Summary

* use the goto-using CGIR for JavaScript code generation
* as a side-effect, multiple bugs with tracking of the current
  exception are fixed
* exceptions thrown from `asm` or `.emit` code cannot be expected to be
  caught anymore (this was already undefined behaviour)

## Details

The CGIR for a body is first passed to the new `jsflow` module, where
the shape of the necessary JavaScript is computed, with the focus on
the control-flow constructs (`if`, `switch`, `try`, etc.). Constructs
are translated as follows:
* `cnkGotoStmt` and `cnkJoinStmt` are translated to `break` and labeled
  blocks (JavaScript doesn't support goto directly)
* `cnkCaseStmt` dispatchers are translated to `switch`/`case`
  statements
* `cnkFinally` and `cnkExcept` are translated to `try`/`finally` and
  `try`/`catch`, respectively

It's first computed which statements `try`s and labeled blocks *must*
enclose. Afterwards, their starts are reordered such that valid
JavaScript is formed.

Since `finally` and `catch` clauses can then intercept `break`s or
`throw`s that they shouldn't, `finally` and `catch` clauses are guarded
by a boolean flag. Immediately before an explicit (`break` and `throw`)
or implicit (procedure call) jump that would enter a clause it
shouldn't, the boolean locals for the problematic clauses are set to
false. Upon exit of a disabled clause, the local is set back to true.

#### Case Statements

Direct translation of `cnkCaseStmt`s into `switch`/`case` statements
where each branch is a `break` would result in very deep block nesting
for `case` statements with many branches. The resulting JavaScript code
can cause the V8 JavaScript engine to fail/crash when compiling the
code!

Therefore, the jump targets need to be inlined whenever possible.
`jsflow` computes the code regions eligible for inlining, and `jsgen`
handles the actual inlining.

#### Current Exception Tracking

When control-flow leaves an `except` handler, the `prevJSError` global
(whose content is returned by `getCurrentException`) needs to be reset
to the exception caught by the enclosing handler, something that was
previously missing for the most part.

The exception is restored:
* at the end of a block when the block is broken out of from within a
  `catch`
* at the start of a `finally` clause intercepting a `break` from within
  a `catch`
* at the start of a `finally` clause when it's entered due to an
  exception

If there's no enclosing `catch` within a procedure when the current
exception has to be restored, the value of `lastJSError` is captured at
procedure entry. Tracking of the current exception still doesn't
include in-flight exceptions, so `tfinally6.nim` still fails.

#### Unhandled Exception Reporting

Instead of incrementing, at run-time, a global counter (`excHandler`)
before entering a `try` and decrementing it again on exit, and then
reporting unhandled exceptions when throwing, the module-init
procedures (i.e., top-level code) are wrapped in a `try`/`catch` that
reports the escaping exceptions.

This is simpler to implement and should also have less run-time
overhead.

#### Throwing with `asm`

`asm` and `emit` statements are considered not to raise, and thus they
don't prevent `except` and `finally` sections from being eliminated by
unreachable code elimination.

The `tnativeexc` test is updated to not rely on undefined behaviour.

### Unreachable Code Elimination

Labels that mark the exit of case statements are now eliminated too, if
structured control-flow doesn't leave the case statement (i.e., each
branch ends in a noreturn-like statement).

---------

Co-authored-by: Clay Sweetser <Varriount@users.noreply.github.com>
---
 compiler/backend/cgirgen.nim                  |   4 +-
 compiler/backend/compat.nim                   |   5 +
 compiler/backend/jsbackend.nim                |   6 +-
 compiler/backend/jsflow.nim                   | 362 +++++++++++
 compiler/backend/jsgen.nim                    | 584 ++++++++++++------
 lib/system/jssys.nim                          |   7 -
 tests/exception/tleave_except.nim             |   1 -
 tests/exception/tleave_except2.nim            |   1 -
 .../exception/traise_and_handle_in_except.nim |   1 -
 tests/exception/treraise2.nim                 |   1 -
 tests/js/tnativeexc.nim                       |  12 +-
 11 files changed, 788 insertions(+), 196 deletions(-)
 create mode 100644 compiler/backend/jsflow.nim

diff --git a/compiler/backend/cgirgen.nim b/compiler/backend/cgirgen.nim
index 753574c224e..4c6af0a160d 100644
--- a/compiler/backend/cgirgen.nim
+++ b/compiler/backend/cgirgen.nim
@@ -1000,9 +1000,9 @@ proc caseToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl, n: MirNode,
 
     leave(tree, cr)
 
-  # we used manual gotos, so emission of a join statement has to be forced
-  join result.info, exit, required=true
   if doesExit:
+    # we used manual gotos, so emission of a join statement has to be forced
+    join result.info, exit, required=true
     cl.isActive = true
   else:
     cl.disable()
diff --git a/compiler/backend/compat.nim b/compiler/backend/compat.nim
index 22f5f5def2e..b46e62634e4 100644
--- a/compiler/backend/compat.nim
+++ b/compiler/backend/compat.nim
@@ -210,3 +210,8 @@ func numArgs*(n: CgNode): int {.inline.} =
   ## Returns the number of arguments for a call-like node. The callee
   ## is excluded.
   n.len - 1 - ord(n.kind == cnkCheckedCall)
+
+func callLen*(n: CgNode): int {.inline.} =
+  ## The number of sub-nodes in a call-like node, excluding the trailing jump
+  ## target description.
+  n.len - ord(n.kind == cnkCheckedCall)
diff --git a/compiler/backend/jsbackend.nim b/compiler/backend/jsbackend.nim
index 55069b22b5a..da2d9f132db 100644
--- a/compiler/backend/jsbackend.nim
+++ b/compiler/backend/jsbackend.nim
@@ -74,11 +74,11 @@ proc processEvent(g: PGlobals, graph: ModuleGraph, modules: BModuleList,
       p = startProc(g, bmod, evt.id, Body())
       partial[evt.sym.id] = p
 
-    let body = generateIRLegacy(graph, bmod.idgen, g.env, evt.sym, evt.body)
+    let body = generateIR(graph, bmod.idgen, g.env, evt.sym, evt.body)
     genPartial(p, merge(p.fullBody, body))
   of bekProcedure:
     let
-      body = generateIRLegacy(graph, bmod.idgen, g.env, evt.sym, evt.body)
+      body = generateIR(graph, bmod.idgen, g.env, evt.sym, evt.body)
       r = genProc(g, bmod, evt.id, body)
 
     if sfCompilerProc in evt.sym.flags:
@@ -116,7 +116,7 @@ proc generateCodeForMain(globals: PGlobals, graph: ModuleGraph, m: BModule,
   let owner = m.module
   genTopLevelStmt(globals, m):
     canonicalize(graph, m.idgen, globals.env, owner, body, TranslationConfig(),
-                 legacy=true)
+                 legacy=false)
 
 proc generateCode*(graph: ModuleGraph, mlist: sink ModuleList) =
   ## Entry point into the JS backend. Generates the code for all modules and
diff --git a/compiler/backend/jsflow.nim b/compiler/backend/jsflow.nim
new file mode 100644
index 00000000000..4e2ec3d1d60
--- /dev/null
+++ b/compiler/backend/jsflow.nim
@@ -0,0 +1,362 @@
+## Implements the translation of CGIR control-flow constructs to JavaScript
+## constructs.
+##
+## While JavaScript doesn't directly support the kind of control flow that
+## the MIR supports, it does support 'finally' and 'catch', both of which are
+## leveraged for the translation. The idea: figure out which statements
+## JavaScript blocks, 'finally's, and 'catch's need to enclose and then place
+## them in a way such that the behaviour is translated correctly.
+
+import
+  std/[
+    packedsets,
+    tables
+  ],
+  compiler/backend/[
+    cgir
+  ],
+  compiler/utils/[
+    idioms
+  ]
+
+type
+  StructKind* = enum
+    stkTry   ## start of a 'try' statement
+    stkBlock ## start of a labeled block
+
+    stkStructStart ## start of an 'if' or 'while'
+    stkCatch   ## a 'catch' clause of a 'try' statement
+    stkFinally ## a 'finally' clause of a 'try' statement
+
+    stkEnd     ## end of a catch, finally, block, or `stkStructStart`
+               ## (if and while)
+
+    stkTerminator ## a goto or raise statement. Only relevant during analysis
+    stkReturn     ## JavaScript return
+
+  Structure* = object
+    ## A list of ``Structure`` items describes how the JavaScript control-flow
+    ## statements are laid out.
+    stmt*: int
+      ## the associated CGIR statement
+    case kind*: StructKind
+    of stkStructStart, stkTry, stkBlock, stkCatch, stkFinally, stkEnd:
+      label*: BlockId
+        ## the associated CGIR label
+    of stkTerminator, stkReturn:
+      discard
+
+  StructDesc* = tuple
+    ## Describes how a CGIR statement-list translates to JavaScript code. The
+    ## focus is on the control-flow constructs, hence the name.
+    structs: seq[Structure]
+    finallys: PackedSet[BlockId]
+      ## labels that denote finally sections
+    inline: Table[BlockId, int]
+      ## maps all blocks that can be inlined into switch-case statements to
+      ## the blocks' 'end' item
+
+const
+  Terminators = {stkReturn, stkTerminator}
+
+func finalTarget*(n: CgNode): CgNode =
+  ## Given a label or target list, retrieves the target.
+  case n.kind
+  of cnkLabel:      n
+  of cnkTargetList: n[^1]
+  else:
+    unreachable()
+
+proc spawnOpens(items: var seq[Structure], pos: int, n: CgNode, isError: bool,
+                finallys: PackedSet[BlockId], marker: var PackedSet[BlockId]) =
+  ## Using the jump action description `n`, spawns the 'try' or labeled block
+  ## openings needed for the jump targets. The set of targets for which
+  ## openings were already spawned are tracked by `marker`.
+  ##
+  ## `pos` is the index of the statement. `isError` indicates whether `n`
+  ## describes exceptional control-flow, and is required to interpret what the
+  ## final jump target represents (exception handler or ordinary join point).
+  let target: range[stkTry..stkBlock] = if isError: stkTry else: stkBlock
+
+  case n.kind
+  of cnkLabel:
+    # direct jump to something that cannot be a finally section
+    if not containsOrIncl(marker, n.label):
+      items.add Structure(kind: target, stmt: pos, label: n.label)
+
+  of cnkTargetList:
+    for i in 0..<n.len-1:
+      case n[i].kind
+      of cnkLabel:
+        # an intermediate target must be a finally section (so spawn a try)
+        let label = n[i].label
+        if not containsOrIncl(marker, label):
+          items.add Structure(kind: stkTry, stmt: pos, label: label)
+      of cnkLeave:
+        discard "not handled here"
+      else:
+        unreachable()
+
+    # special handling for the final target
+    case n[^1].kind
+    of cnkLabel:
+      let label = n[^1].label
+      if not containsOrIncl(marker, label):
+        # the final target might be a finally section, in which case a
+        # 'try' needs to be spawned, always
+        if label in finallys:
+          items.add Structure(kind: stkTry, stmt: pos, label: label)
+        else:
+          items.add Structure(kind: target, stmt: pos, label: label)
+    of cnkResume:
+      discard "no special handling for the 'resume' target"
+    else:
+      unreachable()
+
+  else:
+    unreachable(n.kind)
+
+func endsInTerminator(structs: seq[Structure], start: int): bool =
+  ## Computes and returns whether the region starting at `start` ends in a
+  ## terminator.
+  var
+    i = start
+    depth = 0
+  while depth >= 0 and i < structs.len:
+    case structs[i].kind
+    of stkBlock, stkTry, stkStructStart:
+      inc depth
+    of stkEnd:
+      dec depth
+    of stkCatch, stkFinally:
+      if depth == 0:
+        # end of scope
+        break
+      # depth stays the same
+    of Terminators:
+      if depth == 0:
+        # a terminator is reached and it's at the same level as was started
+        # at
+        return true
+
+    inc i
+
+  result = false # doesn't end in a terminator
+
+proc toStructureList*(stmts: openArray[CgNode]): StructDesc =
+  ## Creates and returns the JavaScript control-flow-construct-focused
+  ## representation for `stmts`.
+  var
+    structs = newSeq[Structure]()
+    finallys = initPackedSet[BlockId]()
+    marker = initPackedSet[BlockId]()
+
+  # before doing anything else, we need to know which labels belong to finallys
+  for it in stmts.items:
+    if it.kind == cnkFinally:
+      finallys.incl it[0].label
+
+  # the first step is computing the first statement that opening 'try's and
+  # labeled blocks *must* enclose:
+  #   def x = 0
+  #   def y = f() -> [L0, L1]
+  #   goto [L0, L2]
+  #   L0: # finalizer
+  #     ...
+  #     Continue
+  #   L1: # exception handler
+  #     ...
+  #   L2: ...
+  #
+  # Here, two JavaScript 'try' statements need to start right before the
+  # `def y`, the first one for the finalizer, the second one for the exception
+  # handler. A labeled JS block must enclose the `goto`.
+  for i, it in stmts.pairs:
+    template exit(n: CgNode, isError: bool) =
+      spawnOpens(structs, i, n, isError, finallys, marker)
+
+    template terminator() =
+      structs.add Structure(kind: stkTerminator, stmt: i)
+
+    template struct(k: StructKind, lbl: BlockId) =
+      structs.add Structure(kind: k, stmt: i, label: lbl)
+
+    case it.kind
+    of cnkDef, cnkAsgn, cnkFastAsgn:
+      if it[1].kind == cnkCheckedCall:
+        exit(it[1][^1], isError=true)
+    of cnkCheckedCall:
+      exit(it[^1], isError=true)
+    of cnkGotoStmt:
+      exit(it[0], isError=false)
+      let target = finalTarget(it[0])
+      # if the goto jumps to a finally, there's no label for the break.
+      # Since this can only happen when structured control-flow never
+      # leaves the finally, a JavaScript 'return' can be used
+      if target.label in finallys:
+        structs.add Structure(kind: stkReturn, stmt: i)
+      else:
+        terminator()
+    of cnkRaiseStmt:
+      exit(it[^1], isError=true)
+      terminator()
+    of cnkCaseStmt:
+      for j in 1..<it.len:
+        exit(it[j][^1], isError=false)
+      terminator()
+    of cnkLoopJoinStmt:
+      # start of a 'while'
+      struct(stkStructStart, it[0].label)
+    of cnkIfStmt:
+      struct(stkStructStart, it[1].label)
+    of cnkEnd, cnkContinueStmt, cnkLoopStmt:
+      struct(stkEnd, it[0].label)
+    of cnkJoinStmt:
+      assert it[0].label in marker
+      struct(stkEnd, it[0].label)
+    of cnkFinally:
+      assert it[0].label in marker
+      struct(stkFinally, it[0].label)
+    of cnkExcept:
+      assert it[0].label in marker
+      struct(stkCatch, it[0].label)
+      if it.len > 1:
+        # not a catch-all handler; raising might continue
+        exit(it[^1], isError=true)
+    else:
+      discard "not relevant"
+
+  # the list of openings and closings produced by the first pass will in most
+  # cases not be valid JavaScript code. We have to "solve" the representation
+  # by reordering the openings until they're matched with their corresponding
+  # end. ``stkCatch``, ``stkFinally``, ``stkStructStart``, and ``stkEnd`` must
+  # keep their relative order and stay attached to the same statements, only
+  # ``stkTry`` and ``stkBlock`` can be moved, but only backwards
+  var i = structs.high
+  while i > 0:
+    if structs[i].kind in {stkTry, stkBlock}:
+      # compute the difference in nesting between the try/block and its
+      # corresponding end:
+      var
+        depth = 1
+        j = i
+      while true:
+        inc j
+        case structs[j].kind
+        of stkTry, stkBlock, stkStructStart:
+          inc depth
+        of stkFinally, stkCatch:
+          if structs[j].label == structs[i].label:
+            dec depth
+            break
+        of stkEnd:
+          dec depth
+          if structs[j].label == structs[i].label:
+            break
+        of Terminators:
+          discard "not relevant"
+
+      # depth < 0 means that the try/block start is more nested than its end.
+      # In other words, the try or block start is currently too nested. Move
+      # it backwards (i.e., associate it with an earlier statement) until it's
+      # at the same level as its end
+      let moved = depth < 0
+      var x = i
+      while depth < 0:
+        # change the associated statement...
+        structs[x].stmt = structs[x - 1].stmt
+        # ... then swap
+        swap(structs[x], structs[x - 1])
+
+        case structs[x].kind
+        of stkEnd:
+          dec depth
+        of stkBlock, stkTry, stkStructStart:
+          inc depth
+        of Terminators, stkCatch, stkFinally:
+          # catch and finally don't change the nesting (the try's body is at
+          # the same level as catch/finally's body)
+          discard
+
+        dec x
+
+      if moved:
+        # a different item than before is in the slot now; it needs to be
+        # processed too
+        continue # skip the following decrement
+
+    dec i
+
+  # note: changing what statements a 'try' encloses can alter semantics! That's
+  # none of our concern here, however: the code generator is responsible for
+  # addressing/fixing it.
+
+  # if a case dispatcher is the only break targeting a block, and the block is
+  # not exited through structured control-flow, the code following the block
+  # can be inlined directly at the break within the switch-case statement:
+  #   L2: {
+  #     L1: {
+  #       switch (x) {
+  #       case 0:
+  #         break L1;
+  #       default:
+  #         break L2;
+  #       }
+  #     }
+  #     // A
+  #     break L2
+  #   }
+  #
+  # Here, the A section plus the ``break L2`` can be inlined directly at
+  # the ``break L1``.
+  # We perform two passes over the structure list:
+  #   1. the first one counts for each block how many breaks target it
+  #   2. the second pass removes all ineligible blocks from the table and
+  #      replaces the counter with an item index of the blocks' 'end'
+  # For efficiency, and thanks to the forward-only control-flow, both
+  # steps are performed with a single pass.
+  var inline: Table[BlockId, int]
+  for i, it in structs.pairs:
+    case it.kind
+    of stkTerminator:
+      let n = stmts[it.stmt]
+      case n.kind
+      of cnkCaseStmt:
+        for j in 1..<n.len:
+          inline.mgetOrPut(n[j][^1].label, 0) += 1
+      of cnkGotoStmt:
+        # we don't inline the target at bare gotos. Mark the block the goto
+        # targets as ineligible by incrementing the counter by two
+        inline.mgetOrPut(finalTarget(n[0]).label, 0) += 2
+      else:
+        discard "only gotos are interesting"
+    of stkEnd:
+      case inline.getOrDefault(it.label, 0)
+      of 0:
+        discard "must be the end of a finally or catch; ignore"
+      of 1:
+        # possible candidate. Is the region preceded by a terminator (meaning
+        # that structured control-flow doesn't enter it) and ends in one?
+        if structs[i - 1].kind in Terminators and
+           endsInTerminator(structs, i + 1):
+          # can be inlined. Replace the counter value with the index
+          inline[it.label] = i
+        else:
+          # not eligible, remove it from the set of candidates
+          inline.del(it.label)
+      else:
+        # blocks broken out of more than once cannot be inlined. Remove
+        # them from the table
+        inline.del(it.label)
+    of stkTry, stkBlock, stkCatch, stkFinally, stkStructStart, stkReturn:
+      discard "not relevant"
+
+  # the `inline` table now contains only the blocks inline-able into switch-case
+  # statements
+
+  # possible improvements:
+  # * breaks and the associated block could be eliminated where JavaScript's
+  #   structured control-flow would take the same route
+  # * a chain of exception handlers could be merged into one JavaScript catch
+
+  result = (structs, finallys, inline)
diff --git a/compiler/backend/jsgen.nim b/compiler/backend/jsgen.nim
index 20a020ff7cc..1b95ed3c651 100644
--- a/compiler/backend/jsgen.nim
+++ b/compiler/backend/jsgen.nim
@@ -60,7 +60,8 @@ import
   ],
   compiler/backend/[
     cgir,
-    compat
+    compat,
+    jsflow
   ]
 
 # xxx: reports are a code smell meaning data types are misplaced
@@ -140,6 +141,22 @@ type
     typ: PType
     storage: StorageFlags
 
+  BlockKind = enum
+    bkBlock
+    bkTryFinally ## try with attached 'finally'
+    bkTryCatch   ## try with attached 'catch'
+    bkFinally
+    bkCatch
+
+  BlockFlag = enum
+    needsRecover
+    needsEnableFlag
+
+  BlockInfo = object
+    label: BlockId
+    kind: BlockKind
+    flags: set[BlockFlag]
+
   PProc* = ref TProc
   TProc* = object
     prc: PSym
@@ -149,11 +166,17 @@ type
     options: TOptions
     module: BModule
     g: PGlobals
-    beforeRetNeeded: bool
+    lastErrorBackupNeeded: bool
+      ## signals whether the value of ``lastJSError`` needs to be captured
+      ## on procedure entry
     unique: int    # for temp identifier generation
-    blocks: seq[int]
-      ## the stack of enclosing blocks, indexed by ``BlockId``. Each entry
-      ## stores the number to use for the label name
+    blocks: seq[BlockInfo]
+      ## enclosing exception handlers, finallys, and labeled blocks. Used
+      ## for correcting wrong control-flow paths and tracking where the
+      ## current exception needs to be restored
+    numHandlers: int
+      ## number of enclosing 'catch' clauses. The name of the
+      ## exception local is derived from this counter
     extraIndent: int
 
     locals: OrdinalSeq[LocalId, Loc]
@@ -170,6 +193,9 @@ const
     ## magics that are treated like normal procedures by the code
     ## generator
 
+template `$`(x: BlockId): string =
+  $ord(x)
+
 template isFilled(x: string): bool =
   x.len != 0
 
@@ -215,9 +241,9 @@ template config*(p: PProc): ConfigRef = p.module.config
 template env*(p: PProc): untyped = p.g.env
 
 proc indentLine(p: PProc, r: Rope): Rope =
-  result = r
-  for i in 0..<p.blocks.len + p.extraIndent:
-    prepend(result, rope"  ")
+  for i in 0..<p.extraIndent:
+    result.add "  "
+  result.add r
 
 template line(p: PProc, added: string) =
   p.body.add(indentLine(p, rope(added)))
@@ -233,6 +259,14 @@ template nested(p, body) =
   body
   dec p.extraIndent
 
+template startBlock(p: PProc, frmt: FormatStr, args: varargs[Rope]) =
+  lineF(p, frmt, args)
+  inc p.extraIndent
+
+template endBlock(p: PProc, frmt: FormatStr = "}$n", args: varargs[Rope]) =
+  dec p.extraIndent
+  lineF(p, frmt, args)
+
 proc newGlobals*(): PGlobals =
   new(result)
   result.typeInfoGenerated = initIntSet()
@@ -246,7 +280,6 @@ proc rdLoc(a: TCompRes): Rope {.inline.} =
 proc newProc(globals: PGlobals, module: BModule, prc: PSym,
              options: TOptions): PProc =
   result = PProc(
-    blocks: @[],
     options: options,
     module: module,
     prc: prc,
@@ -538,7 +571,7 @@ proc arithAux(p: PProc, n: CgNode, r: var TCompRes, op: TMagic) =
     xLoc,yLoc: Rope
 
   useMagic(p, jsMagics[op])
-  if n.len > 2:
+  if numArgs(n) == 2:
     gen(p, n[1], x)
     gen(p, n[2], y)
     xLoc = x.rdLoc
@@ -666,110 +699,131 @@ proc genLineDir(p: PProc, n: CgNode) =
   if hasFrameInfo(p):
     lineF(p, "F.line = $1;$n", [rope(line)])
 
-proc genRepeatStmt(p: PProc, n: CgNode) =
-  internalAssert p.config, isEmptyType(n.typ)
-  genLineDir(p, n)
-  lineF(p, "while (true) {$n")
-  p.nested: genStmt(p, n[0])
-  lineF(p, "}$n")
-
-proc genTry(p: PProc, n: CgNode) =
-  # code to generate:
-  #
-  #  ++excHandler;
-  #  var tmpFramePtr = framePtr;
-  #  try {
-  #    stmts;
-  #    --excHandler;
-  #  } catch (EXCEPTION) {
-  #    var prevJSError = lastJSError; lastJSError = EXCEPTION;
-  #    framePtr = tmpFramePtr;
-  #    --excHandler;
-  #    if (e.typ && e.typ == NTI433 || e.typ == NTI2321) {
-  #      stmts;
-  #    } else if (e.typ && e.typ == NTI32342) {
-  #      stmts;
-  #    } else {
-  #      stmts;
-  #    }
-  #    lastJSError = prevJSError;
-  #  } finally {
-  #    framePtr = tmpFramePtr;
-  #    stmts;
-  #  }
-  genLineDir(p, n)
-  inc(p.unique)
-  var i = 1
-  var catchBranchesExist = n.len > 1 and n[i].kind == cnkExcept
-  if catchBranchesExist:
-    p.body.add("++excHandler;\L")
-  var tmpFramePtr = rope"F"
-  if optStackTrace notin p.options:
-    tmpFramePtr = p.getTemp(true)
-    line(p, tmpFramePtr & " = framePtr;\L")
-  lineF(p, "try {$n", [])
-  genStmt(p, n[0])
-  var generalCatchBranchExists = false
-  if catchBranchesExist:
-    p.body.addf("--excHandler;$n} catch (EXCEPTION) {$n var prevJSError = lastJSError;$n" &
-        " lastJSError = EXCEPTION;$n --excHandler;$n", [])
-    line(p, "framePtr = $1;$n" % [tmpFramePtr])
-  while i < n.len and n[i].kind == cnkExcept:
-    if n[i].len == 1:
-      # general except section:
-      generalCatchBranchExists = true
-      if i > 1: lineF(p, "else {$n", [])
-      genStmt(p, n[i][0])
-      if i > 1: lineF(p, "}$n", [])
-    else:
-      var orExpr = ""
-      var excAlias: CgNode = nil
+proc handleJump(p: PProc, n: CgNode, fromError: bool): seq[BlockId] =
+  ## Makes sure the control-flow described by jump action description `n`
+  ## matches the actual JavaScript control-flow. If catch or finally
+  ## sections would be entered that shouldn't be, they're flagged as
+  ## requiring an "is enabled" guard and a boolean local is spawned.
+  ##
+  ## Returns the list of sections that need to be disabled.
+
+  iterator mreverse[T](s: var seq[T]): (int, var T) =
+    for i in countdown(s.high, 0):
+      yield (i, s[i])
+
+  template onMiss(idx: int, b: var BlockInfo) =
+    if b.kind == bkTryFinally or (b.kind == bkTryCatch and fromError):
+      # JavaScript control-flow enters a 'finally' or 'catch' it shouldn't.
+      # The section needs to be disabled; a boolean flag is used for this.
+      # Thanks to `var`, the local can be spawned without regard to
+      # scoping.
+      # XXX: this is not ideal. It would be better if the local is defined
+      #      at the start of the scope, but that's a bit tricky to do at
+      #      the moment
+      if needsEnableFlag notin b.flags:
+        lineF(p, "var Enabled$1_ = true;\L", [$b.label])
+        b.flags.incl needsEnableFlag
+
+      result.add b.label
+
+  case n.kind
+  of cnkLabel:
+    for i, b in mreverse(p.blocks):
+      if n.label == b.label:
+        break # found the target
+      else:
+        onMiss(i, b)
+
+  of cnkTargetList:
+    # marking blocks as having to restore the current exception is also done
+    # here
+    var
+      t = 0
+      wasLeave = fromError
+    # ^^ exceptional control-flow could come from within a procedure call, where
+    # an exception handler boundary was crossed
+    for i, b in mreverse(p.blocks):
+      wasLeave = wasLeave or n[t].kind == cnkLeave
+      # skip leave actions:
+      while n[t].kind == cnkLeave:
+        inc t
+
+      if n[t].kind == cnkLabel and n[t].label == b.label:
+        inc t
+        if wasLeave:
+          b.flags.incl needsRecover
+          # the next jump target doesn't need to recover the exception,
+          # unless there's another leave action in-between
+          wasLeave = false
+        # stop searching when we reach the end
+        if t >= n.len:
+          break
+      else:
+        onMiss(i, b)
 
+  of cnkCheckedCall:
+    # to reduce conditionals at the callsite
+    result = handleJump(p, n[^1], fromError)
+  else:
+    unreachable()
+
+proc setEnabled(p: PProc, sections: seq[BlockId], val: Rope) =
+  ## Emits code for assigning `val` to the enabled flag of all given
+  ## `sections`.
+  for it in sections.items:
+    # the block/section index is used for the name:
+    lineF(p, "Enabled$1_ = $2;$n", [$it, val])
+
+proc genExcept(p: PProc, n: CgNode) =
+  ## Generates and emits code for a ``cnkExcept`` join point.
+  let id = p.numHandlers # name suffix of the exception variable
+
+  if n.len > 1:
+    # handler with filter
+    var orExpr = ""
+    for i in 1..<n.len - 1:
       useMagic(p, "isObj")
-      for j in 0..<n[i].len - 1:
-        let it = n[i][j]
-        let throwObj = it
-
-        if it.kind == cnkLocal:
-          excAlias = it
-          # If this is a ``except exc as sym`` branch there must be no following
-          # nodes
-          doAssert orExpr == ""
-
-        if orExpr != "": orExpr.add("||")
-        # Generate the correct type checking code depending on whether this is a
-        # |NimSkull|-native or a JS-native exception
-        if isImportedException(throwObj.typ, p.config):
-          orExpr.addf("lastJSError instanceof $1",
-            [throwObj.typ.sym.extname])
-        else:
-          orExpr.addf("isObj(lastJSError.m_type, $1)",
-               [genTypeInfo(p, throwObj.typ)])
-
-      if i > 1: line(p, "else ")
-      lineF(p, "if (lastJSError && ($1)) {$n", [orExpr])
-      # If some branch requires a local alias introduce it here. This is needed
-      # since JS cannot do ``catch x as y``.
-      if excAlias != nil:
-        setupLocalLoc(p, excAlias.local, skVar)
-        lineF(p, "var $1 = lastJSError;$n", p.locals[excAlias.local].name)
-      genStmt(p, n[i][^1])
-      lineF(p, "}$n", [])
-    inc(i)
-  if catchBranchesExist:
-    if not generalCatchBranchExists:
-      useMagic(p, "reraiseException")
-      line(p, "else {\L")
-      line(p, "\treraiseException();\L")
-      line(p, "}\L")
-    lineF(p, "lastJSError = prevJSError;$n")
-  line(p, "} finally {\L")
-  line(p, "framePtr = $1;$n" % [tmpFramePtr])
-  if i < n.len and n[i].kind == cnkFinally:
-    genStmt(p, n[i][0])
-  line(p, "}\L")
+      let throwObj = n[i]
+
+      if orExpr != "": orExpr.add("||")
+      # Generate the correct type checking code depending on whether this is a
+      # |NimSkull|-native or a JS-native exception
+      if isImportedException(throwObj.typ, p.config):
+        orExpr.addf("Exception$1_ instanceof $2",
+          [$id, throwObj.typ.sym.extname])
+      else:
+        orExpr.addf("isObj(Exception$1_.m_type, $2)",
+          [$id, genTypeInfo(p, throwObj.typ)])
+
+    # re-throw the exception when it doesn't match the filter
+    lineF(p, "if (!(Exception$1_ && ($2))) {\L",
+          [$id, orExpr])
+    p.nested:
+      # disable the necessary sections before throwing
+      setEnabled(p, handleJump(p, n[^1], fromError=true), "false")
+      lineF(p, "throw Exception$1_;\L", [$id])
+    lineF(p, "}\L")
+
+    if n[1].kind == cnkLocal:
+      # it's a handler for an imported exception. Setup the local
+      let local = n[1].local
+      setupLocalLoc(p, local, skVar)
+      lineF(p, "var $1 = Exception$2_;$n", [p.locals[local].name, $id])
+
+  else:
+    # catch-all handler
+    discard
+
+  # set the current exception:
+  lineF(p, "lastJSError = Exception$1_;$n", [$id])
+
+  # restore the framePtr (it's incorrect when coming from unwinding)
+  if hasFrameInfo(p):
+    lineF(p, "framePtr = F;$n", [])
 
 proc genRaiseStmt(p: PProc, n: CgNode) =
+  # disable the necessary sections before throwing:
+  setEnabled(p, handleJump(p, n[^1], fromError=true), "false")
   if n[0].kind != cnkEmpty:
     var a: TCompRes
     gen(p, n[0], a)
@@ -788,7 +842,12 @@ func intLiteral(v: Int128, typ: PType): string =
     else:         "true"
   else:           $v
 
-proc genCaseJS(p: PProc, n: CgNode) =
+proc gen(p: PProc, desc: StructDesc, stmts: openArray[CgNode], start: int)
+
+proc genCaseJS(p: PProc, desc: StructDesc, stmts: openArray[CgNode], n: CgNode) =
+  ## Generates and emits the JavaScript code for dispatcher `n`. The branch
+  ## targets may be inlined directly (if safe) -- `desc` and `stmts` are
+  ## required for the inlining. The inlining is a source of call recursion.
   var
     cond: TCompRes
     totalRange = Zero
@@ -825,28 +884,22 @@ proc genCaseJS(p: PProc, n: CgNode) =
           else:
             gen(p, e, cond)
             lineF(p, "case $1:$n", [cond.rdLoc])
-      p.nested:
-        genStmt(p, lastSon(it))
-        lineF(p, "break;$n", [])
     else:
       lineF(p, "default: $n", [])
-      p.nested:
-        genStmt(p, it[0])
-        lineF(p, "break;$n", [])
-  lineF(p, "}$n", [])
 
-proc genBlock(p: PProc, n: CgNode) =
-  inc(p.unique)
-  let labl = p.unique
-  lineF(p, "Label$1: {$n", [labl.rope])
-  p.blocks.add labl # push a new block
-  genStmt(p, n[1])
-  p.blocks.setLen(p.blocks.len - 1) # pop the block from the stack
-  lineF(p, "}$n", [labl.rope])
-
-proc genBreakStmt(p: PProc, n: CgNode) =
-  genLineDir(p, n)
-  lineF(p, "break Label$1;$n", [$p.blocks[n[0].label.int]])
+    let target = it[^1].label
+    p.nested:
+      if target in desc.inline:
+        # inline the code from the jump destination. The block nesting that
+        # would otherwise ensue can be too much for JavaScript engines to
+        # handle (V8 would fail to compile the code, for example)
+        gen(p, desc, stmts, desc.inline[target])
+      else:
+        # cannot inline; a jump is needed
+        setEnabled(p, handleJump(p, it[^1], fromError=false), "false")
+        lineF(p, "break Label$1;$n", [$target])
+
+  lineF(p, "}$n", [])
 
 proc genAsmOrEmitStmt(p: PProc, n: CgNode) =
   genLineDir(p, n)
@@ -882,15 +935,6 @@ proc genAsmOrEmitStmt(p: PProc, n: CgNode) =
       p.body.add(r.rdLoc)
   p.body.add "\L"
 
-proc genIf(p: PProc, n: CgNode) =
-  let it = n
-
-  var cond: TCompRes
-  p.nested: gen(p, it[0], cond)
-  lineF(p, "if ($1) {$n", [cond.rdLoc])
-  genStmt(p, it[1])
-  lineF(p, "}$n", [])
-
 proc generateHeader(params: openArray[Loc]): string =
   ## Generates the JavaScript function parameter list for `params`.
   result = ""
@@ -1154,6 +1198,7 @@ proc genAddr(p: PProc, n: CgNode, r: var TCompRes) =
     internalError(p.config, n.info, "genAddr: " & $n.kind)
 
 proc accessLoc(s: Loc, r: var TCompRes) =
+    assert s.typ != nil, repr(s)
     let k = mapType(s.typ)
     if k == etyBaseIndex:
       r.typ = etyBaseIndex
@@ -1227,7 +1272,7 @@ proc genArgs(p: PProc, n: CgNode, r: var TCompRes; start=1) =
   assert(typ.len == typ.n.len)
   var emitted = start-1
 
-  for i in start..<n.len:
+  for i in start..<callLen(n):
     let it = n[i]
     var paramType: PNode = nil
     if i < typ.len:
@@ -1247,11 +1292,11 @@ proc genArgs(p: PProc, n: CgNode, r: var TCompRes; start=1) =
 
 proc genOtherArg(p: PProc; n: CgNode; i: int; typ: PType;
                  generated: var int; r: var TCompRes) =
-  if i >= n.len:
+  if i >= callLen(n):
     globalReport(p.config, n.info, semReportCountMismatch(
       rsemExpectedParameterForJsPattern,
       expected = i,
-      got = n.len - 1))
+      got = numArgs(n)))
 
   let it = n[i]
   var paramType: PNode = nil
@@ -1274,7 +1319,7 @@ proc genPatternCall(p: PProc; n: CgNode; pat: string; typ: PType;
     case pat[i]
     of '@':
       var generated = 0
-      for k in j..<n.len:
+      for k in j..<callLen(n):
         if generated > 0: r.res.add(", ")
         genOtherArg(p, n, k, typ, generated, r)
       inc i
@@ -1311,7 +1356,7 @@ proc genInfixCall(p: PProc, n: CgNode, r: var TCompRes) =
       assert(typ.kind == tyProc)
       genPatternCall(p, n, pat, typ, r)
       return
-  if n.len != 1:
+  if numArgs(n) != 0:
     gen(p, n[1], r)
     if r.typ == etyBaseIndex:
       p.config.internalAssert(r.address != "", n.info, "cannot invoke with infix syntax")
@@ -1341,7 +1386,7 @@ proc genEcho(p: PProc, n: CgNode, r: var TCompRes) =
   useMagic(p, "rawEcho")
   r.res.add("rawEcho(")
   # the first argument is a literal type that we don't need
-  for i in 2..<n.len:
+  for i in 2..<callLen(n):
     let it = n[i]
     if it.typ.isCompileTimeOnly: continue
     if i > 2: r.res.add(", ")
@@ -2058,12 +2103,6 @@ proc genRangeChck(p: PProc, n: CgNode, r: var TCompRes) =
     r.res = "chckRange($1, $2, $3)" % [r.res, a.res, b.res]
     r.kind = resExpr
 
-proc genReturnStmt(p: PProc, n: CgNode) =
-  p.config.internalAssert(p.prc != nil, n.info, "genReturnStmt")
-  p.beforeRetNeeded = true
-  genLineDir(p, n)
-  lineF(p, "break BeforeRet;$n", [])
-
 proc frameCreate(p: PProc; procname, filename: Rope): Rope =
   const frameFmt =
     "var F = {procname: $1, prev: framePtr, filename: $2, line: 0};$n"
@@ -2087,15 +2126,23 @@ proc genProcBody(p: PProc, prc: PSym): Rope =
               makeJSString(toFilenameOption(p.config, prc.info.fileIndex, foStacktrace)))
   else:
     result = ""
-  if p.beforeRetNeeded:
-    result.add p.indentLine(~"BeforeRet: {$n")
-    result.add p.body
-    result.add p.indentLine(~"}$n")
-  else:
-    result.add(p.body)
+
+  if p.lastErrorBackupNeeded:
+    result.add(p.indentLine("var Exception0_ = lastJSError;$n" % []))
+
+  result.add(p.body)
   if prc.typ.callConv == ccSysCall:
     result = ("try {$n$1} catch (e) {$n" &
       " alert(\"Unhandled exception:\\n\" + e.message + \"\\n\"$n}") % [result]
+  elif sfModuleInit in prc.flags:
+    # report an unhandled exception when a |NimSkull| exception escapes
+    # module-level code
+    # XXX: this is common logic across all backends; it needs to be handled at
+    #      the MIR level
+    useMagic(p, "unhandledException")
+    result = ("try {$n$1} catch (e) {$n" &
+              "  if (e.m_type !== undefined) { unhandledException(e); }$n" &
+              "  else { throw e; }$n}$n") % [result]
   if hasFrameInfo(p):
     result.add(frameDestroy(p))
 
@@ -2201,10 +2248,171 @@ proc finishProc*(p: PProc): string =
   #if gVerbosity >= 3:
   #  echo "END   generated code for: " & prc.name.s
 
+proc handleRecover(p: PProc, b: BlockInfo) =
+  if needsRecover in b.flags:
+    let nesting = p.numHandlers
+    lineF(p, "lastJSError = Exception$1_;$n", [$nesting])
+    if nesting == 0:
+      # there's no enclosing 'catch'; the value of ``lastJSError`` needs to
+      # be captured on procedure entry
+      p.lastErrorBackupNeeded = true
+
+proc handleSectionStart(p: PProc) =
+  # wrap the section in an 'if' if it can be disabled at run-time (only the
+  # opening is handled here)
+  if needsEnableFlag in p.blocks[^1].flags:
+    # the local is only defined when it's first set to false, so it being
+    # undefined is treated as meaning "enabled"
+    startBlock(p, "if (Enabled$1_ === undefined || Enabled$1_) {$n",
+               $p.blocks[^1].label)
+
+proc popBlock(p: PProc) =
+  let blk = p.blocks.pop()
+  case blk.kind
+  of bkBlock:
+    endBlock(p)
+    # restore
+    handleRecover(p, blk)
+  of bkFinally:
+    if needsEnableFlag in blk.flags:
+      # close the wrapper 'if' and re-enable the section
+      endBlock(p, "} else { Enabled$1_ = true; }$n", $blk.label)
+    endBlock(p)
+  of bkCatch:
+    # the counterpart to the opening logic
+    if needsEnableFlag in blk.flags:
+      # close the wrapper 'if', re-enable the section, and re-throw
+      endBlock(p, "} else { Enabled$1_ = true; throw Exception$2_; }$n",
+               [$blk.label, $p.numHandlers])
+    endBlock(p)
+    # release the name:
+    dec p.numHandlers
+  of bkTryCatch, bkTryFinally:
+    discard "nothing to do when exiting these"
+
+proc gen(p: PProc, desc: StructDesc, stmts: openArray[CgNode], start: int) =
+  ## Generates code for `desc` and `stmts` starting at (but not including)
+  ## structure item `start`. Code generation continues until encountering
+  ## the first terminator that's at the same nesting level as the item at
+  ## `start`.
+  var
+    depth = 0
+    i     = start + 1
+
+  template structs: untyped = desc.structs
+
+  template gen(a, b: int) =
+    for i in a..<b:
+      genStmt(p, stmts[i])
+
+  block:
+    # generate code for the statements leading up to the first structure item
+    let
+      first =
+        if start == -1: 0
+        else:           structs[start].stmt
+      next =
+        if structs.len == 0: stmts.len
+        else:                structs[i].stmt
+
+    gen(first, next)
+
+  # code generation is driven by the control-flow constructs. Indentation is
+  # also (mostly) managed here
+  while i < structs.len:
+    let it = desc.structs[i]
+    case it.kind
+    of stkTry:
+      p.blocks.add BlockInfo(label: it.label)
+      p.blocks[^1].kind =
+        if it.label in desc.finallys: bkTryFinally
+        else:                         bkTryCatch
+      startBlock(p, "try {$n", [])
+      gen(it.stmt, structs[i+1].stmt)
+      inc depth
+    of stkBlock:
+      if it.label notin desc.inline:
+        p.blocks.add BlockInfo(kind: bkBlock, label: it.label)
+        startBlock(p, "Label$1: {$n", [$it.label.int])
+        gen(it.stmt, structs[i+1].stmt)
+      # still increment the depth; it makes handling of the 'end' item easier
+      inc depth
+    of stkStructStart:
+      # indentation is managed by ``genStmt`` here
+      gen(it.stmt, structs[i+1].stmt)
+      inc depth
+    of stkCatch:
+      endBlock(p)
+      p.blocks[^1].kind = bkCatch # replace the try block
+      inc p.numHandlers
+      startBlock(p, "catch(Exception$1_) {$n", [$p.numHandlers])
+      handleSectionStart(p)
+      gen(it.stmt, structs[i+1].stmt)
+    of stkFinally:
+      endBlock(p)
+      startBlock(p, "finally {$n", [])
+      p.blocks[^1].kind = bkFinally # replace the try block
+      handleSectionStart(p)
+      handleRecover(p, p.blocks[^1])
+      gen(it.stmt, structs[i+1].stmt)
+    of stkTerminator:
+      let n = stmts[it.stmt]
+      if n.kind == cnkCaseStmt:
+        genCaseJS(p, desc, stmts, n)
+      else:
+        genStmt(p, n)
+      # the statements immediately following the terminator are dead code,
+      # ignore them
+      if depth == 0:
+        break
+    of stkReturn:
+      lineF(p, "return;$n", [])
+      if depth == 0:
+        break
+    of stkEnd:
+      if it.label in desc.inline:
+        # skip the code following the block's end; this code is emitted from
+        # elsewhere
+        let orig = depth
+        while depth >= orig:
+          inc i
+          case structs[i].kind
+          of stkBlock, stkTry, stkStructStart:
+            inc depth
+          of stkEnd:
+            dec depth
+          of stkCatch, stkFinally:
+            discard "decrements and then increments the depth; a no-op"
+          of stkTerminator, stkReturn:
+            # the first terminator at the same level as the 'end' delimits
+            # the inlined section
+            if depth == orig:
+              break
+
+      else:
+        if p.blocks.len > 0 and p.blocks[^1].label == it.label:
+          popBlock(p)
+        else:
+          endBlock(p) # no special handling needed
+        # an 'end' can be the last item in the list
+        gen(it.stmt):
+          if i < structs.high: structs[i+1].stmt
+          else:                stmts.len
+
+      dec depth
+
+    inc i
+
+proc genStmts(p: PProc, stmts: openArray[CgNode]) =
+  let desc = toStructureList(stmts)
+  # we want to generate the statements leading up to the first structure
+  # too, hence -1 as the start
+  gen(p, desc, stmts, -1)
+
 proc genProc*(g: PGlobals, module: BModule, id: ProcedureId,
               body: sink Body): Rope =
   var p = startProc(g, module, id, body)
-  p.nested: genStmt(p, p.fullBody.code)
+  p.nested: genStmts(p, p.fullBody.code.kids)
   result = finishProc(p)
 
 proc genPartial*(p: PProc, n: CgNode) =
@@ -2213,7 +2421,7 @@ proc genPartial*(p: PProc, n: CgNode) =
   ## `startProc`.
   synchronize(p.locals, p.fullBody.locals)
   analyseIfAddressTaken(p.fullBody.code, p.addrTaken)
-  genStmt(p, n)
+  genStmts(p, n.kids)
 
 proc rdData(p: PProc, data: DataId, typ: PType): TCompRes =
   ## Returns the loc for the `data` of type `typ`. Emits the definition for
@@ -2229,8 +2437,20 @@ proc rdData(p: PProc, data: DataId, typ: PType): TCompRes =
 
 proc genStmt(p: PProc, n: CgNode) =
   var r: TCompRes
-  gen(p, n, r)
-  if r.res != "": lineF(p, "$#;$n", [r.res])
+  if n.kind == cnkCheckedCall or (n.kind in {cnkAsgn, cnkFastAsgn, cnkDef} and
+     n[1].kind == cnkCheckedCall):
+    # XXX: somewhat hacky way to handle checked calls
+    let sections = handleJump(p, n[^1], fromError=true)
+    setEnabled(p, sections, "false")
+    gen(p, n, r)
+    if r.res != "": lineF(p, "$#;$n", [r.res])
+    # re-enable the section again. Since disabling sections is uncommon,
+    # this should have less overhead than having to enable the section
+    # prior to *every* relevant jump
+    setEnabled(p, sections, "true")
+  else:
+    gen(p, n, r)
+    if r.res != "": lineF(p, "$#;$n", [r.res])
 
 proc genCast(p: PProc, n: CgNode, r: var TCompRes) =
   var dest = skipTypes(n.typ, abstractVarRange)
@@ -2353,8 +2573,7 @@ proc gen(p: PProc, n: CgNode, r: var TCompRes) =
       genLineDir(p, n)
     if getCalleeMagic(p.g.env, n[0]) != mNone:
       genMagic(p, n, r)
-    elif n[0].kind == cnkProc and sfInfixCall in p.env[n[0].prc].flags and
-        n.len >= 1:
+    elif n[0].kind == cnkProc and sfInfixCall in p.env[n[0].prc].flags:
       genInfixCall(p, n, r)
     else:
       genCall(p, n, r)
@@ -2420,16 +2639,26 @@ proc gen(p: PProc, n: CgNode, r: var TCompRes) =
   of cnkCast: genCast(p, n, r)
   of cnkEmpty: discard
   of cnkType: r.res = genTypeInfo(p, n.typ)
-  of cnkStmtList:
-    for it in n.items:
-      genStmt(p, it)
-  of cnkBlockStmt: genBlock(p, n)
-  of cnkIfStmt: genIf(p, n)
-  of cnkRepeatStmt: genRepeatStmt(p, n)
   of cnkDef: genDef(p, n)
-  of cnkCaseStmt: genCaseJS(p, n)
-  of cnkReturnStmt: genReturnStmt(p, n)
-  of cnkBreakStmt: genBreakStmt(p, n)
+  of cnkGotoStmt:
+    setEnabled(p, handleJump(p, n[0], fromError=false), "false")
+    # jump directly to the final target. Placement of 'try' blocks made
+    # sure that finally sections are visited correctly
+    lineF(p, "break Label$1;$n", [$finalTarget(n[0]).label])
+  of cnkLoopJoinStmt:
+    startBlock(p, "while (true) {$n")
+  of cnkExcept:
+    # emit an exception handler
+    genExcept(p, n)
+  of cnkIfStmt:
+    genLineDir(p, n)
+    var a: TCompRes
+    gen(p, n[0], a)
+    startBlock(p, "if ($1) {$n", [rdLoc(a)])
+  of cnkFinally:
+    # make sure the frame pointer is correct after unwinding
+    if hasFrameInfo(p):
+      lineF(p, "framePtr = F;$n", [])
   of cnkAsgn: genAsgn(p, n)
   of cnkFastAsgn: genFastAsgn(p, n)
   of cnkVoidStmt:
@@ -2444,10 +2673,12 @@ proc gen(p: PProc, n: CgNode, r: var TCompRes) =
     else:
       lineF(p, "($1);$n", [a.res])
   of cnkAsmStmt, cnkEmitStmt: genAsmOrEmitStmt(p, n)
-  of cnkTryStmt: genTry(p, n)
   of cnkRaiseStmt: genRaiseStmt(p, n)
-  of cnkInvalid, cnkMagic, cnkRange, cnkBinding, cnkExcept, cnkFinally,
-     cnkBranch, cnkAstLit, cnkLabel, cnkStmtListExpr, cnkField, cnkNewCfNodes:
+  of cnkJoinStmt, cnkEnd, cnkLoopStmt, cnkContinueStmt:
+    discard "terminators or endings for which no special handling is needed"
+  of cnkInvalid, cnkMagic, cnkRange, cnkBinding, cnkLeave, cnkTargetList,
+     cnkResume, cnkBranch, cnkAstLit, cnkLabel, cnkStmtListExpr, cnkStmtList,
+     cnkField, cnkLegacyNodes, cnkCaseStmt:
     internalError(p.config, n.info, "gen: unknown node type: " & $n.kind)
 
 proc newModule*(g: ModuleGraph; module: PSym): BModule =
@@ -2459,7 +2690,6 @@ proc newModule*(g: ModuleGraph; module: PSym): BModule =
 proc genHeader*(): Rope =
   result = rope("""/* Generated by the Nim Compiler v$1 */
     var framePtr = null;
-    var excHandler = 0;
     var lastJSError = null;
   """.unindent.format(VersionAsString))
 
@@ -2469,7 +2699,7 @@ proc genTopLevelStmt*(globals: PGlobals, m: BModule, body: sink Body) =
   p.fullBody = body
   p.unique = globals.unique
   analyseIfAddressTaken(p.fullBody.code, p.addrTaken)
-  genStmt(p, p.fullBody.code)
+  genStmts(p, p.fullBody.code.kids)
   p.g.code.add(p.defs)
   p.g.code.add(p.body)
 
diff --git a/lib/system/jssys.nim b/lib/system/jssys.nim
index 07b85026618..86b749c47ad 100644
--- a/lib/system/jssys.nim
+++ b/lib/system/jssys.nim
@@ -31,7 +31,6 @@ type
 
 var
   framePtr {.importc, nodecl, volatile.}: PCallFrame
-  excHandler {.importc, nodecl, volatile.}: int = 0
   lastJSError {.importc, nodecl, volatile.}: PJSError = nil
 
 {.push stacktrace: off, profiler:off.}
@@ -148,18 +147,12 @@ proc prepareException(e: ref Exception, ename: cstring) {.
     e.trace = rawWriteStackTrace()
 
 proc raiseException(e: ref Exception) {.compilerproc, asmNoStackFrame.} =
-  if excHandler == 0:
-    unhandledException(e)
   asm "throw `e`;"
 
 proc reraiseException() {.compilerproc, asmNoStackFrame.} =
   if lastJSError == nil:
     raise newException(ReraiseDefect, "no exception to reraise")
   else:
-    if excHandler == 0:
-      if isNimException():
-        unhandledException(cast[ref Exception](lastJSError))
-
     asm "throw lastJSError;"
 
 proc raiseOverflow {.exportc: "raiseOverflow", noreturn, compilerproc.} =
diff --git a/tests/exception/tleave_except.nim b/tests/exception/tleave_except.nim
index f85a9f383dd..f72191c65f1 100644
--- a/tests/exception/tleave_except.nim
+++ b/tests/exception/tleave_except.nim
@@ -4,7 +4,6 @@ discard """
     (``break``) works and properly clears the current exception.
   '''
   output: "done"
-  knownIssue.js: "The current exception is not properly cleared"
 """
 
 var steps: seq[int]
diff --git a/tests/exception/tleave_except2.nim b/tests/exception/tleave_except2.nim
index 66262b80fd9..ec591e27d9a 100644
--- a/tests/exception/tleave_except2.nim
+++ b/tests/exception/tleave_except2.nim
@@ -3,7 +3,6 @@ discard """
     Ensure that leaving an `except` section by raising an exception properly
     updates the current exception.
   '''
-  knownIssue.js: "The current exception is not reset properly"
 """
 
 var steps: seq[string]
diff --git a/tests/exception/traise_and_handle_in_except.nim b/tests/exception/traise_and_handle_in_except.nim
index f970a91594d..af940162800 100644
--- a/tests/exception/traise_and_handle_in_except.nim
+++ b/tests/exception/traise_and_handle_in_except.nim
@@ -4,7 +4,6 @@ discard """
     branch works.
   '''
   output: "done"
-  knownIssue.js: "The current exception is not properly cleared"
 """
 
 var steps: seq[int]
diff --git a/tests/exception/treraise2.nim b/tests/exception/treraise2.nim
index 9fd0a841095..d1646f242d1 100644
--- a/tests/exception/treraise2.nim
+++ b/tests/exception/treraise2.nim
@@ -3,7 +3,6 @@ discard """
     Ensure that raising a caught exception from within an exception handler
     works
   '''
-  knownIssue.js: "The current exception is not properly updated"
 """
 
 proc manualReraise() =
diff --git a/tests/js/tnativeexc.nim b/tests/js/tnativeexc.nim
index ea371c1cdb8..a7f19f6e49a 100644
--- a/tests/js/tnativeexc.nim
+++ b/tests/js/tnativeexc.nim
@@ -4,17 +4,21 @@ discard """
 
 import jsffi
 
+proc throwError() {.importjs: "throw new Error('a new error')".}
+
 # Can catch JS exceptions
 try:
-  asm """throw new Error('a new error');"""
+  throwError()
 except JsError as e:
   doAssert e.message == "a new error"
 except:
   doAssert false
 
+proc parse() {.importjs: "JSON.parse(';;')".}
+
 # Can distinguish different exceptions
 try:
-  asm """JSON.parse(';;');"""
+  parse()
 except JsEvalError:
   doAssert false
 except JsSyntaxError as se:
@@ -22,9 +26,11 @@ except JsSyntaxError as se:
 except JsError as e:
   doAssert false
 
+proc throwSyntaxError() {.importjs: "throw new SyntaxError()".}
+
 # Can catch parent exception
 try:
-  asm """throw new SyntaxError();"""
+  throwSyntaxError()
 except JsError as e:
   discard
 except:

From f3f83e71d6bd5a57e7eec04d3de6579370d132fd Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Wed, 13 Mar 2024 00:46:04 +0100
Subject: [PATCH 030/169] macros: disallow creating special nodes manually
 (#1235)

## Summary

Attempting to manually create a node (via `newNimNode`) of kind
`nnkError`, `nnkIdent`, `nnkSym`, or `nnkType` now results in a
compiler error. Creating them was previously allowed, but the
compiler could crash when such incomplete nodes appear in macro
output.

## Details

* all node kinds where the initial state is not valid (`nkError`,
  `nkIdent`, `nkSym`, and `nkType`) are forbidden
* the `opcNNewNimNode` implementation guards against these node kinds
* a VM event, diagnostic, and report are added for the error
* to not introduce a new variant, the `msg` variant is re-used for the
  new VM event
* the untyped `nnkType` test case is removed from `tempty_type_nodes`;
  macros cannot create untyped `nnkType` nodes anymore
---
 compiler/ast/ast_types.nim                    |  4 ++-
 compiler/ast/report_enums.nim                 |  1 +
 compiler/front/cli_reporter.nim               |  6 ++++-
 compiler/front/msgs.nim                       |  1 +
 compiler/vm/vm.nim                            | 19 ++++++++++----
 compiler/vm/vmdef.nim                         |  4 ++-
 compiler/vm/vmrunner.nim                      |  1 +
 .../macros/tdisallow_create_special_nodes.nim | 26 +++++++++++++++++++
 .../macros/tempty_type_nodes.nim              | 10 +------
 9 files changed, 55 insertions(+), 17 deletions(-)
 create mode 100644 tests/lang_callable/macros/tdisallow_create_special_nodes.nim

diff --git a/compiler/ast/ast_types.nim b/compiler/ast/ast_types.nim
index c5b048d0bb7..e4fc830088c 100644
--- a/compiler/ast/ast_types.nim
+++ b/compiler/ast/ast_types.nim
@@ -987,6 +987,7 @@ type
     adVmFieldNotFound
     adVmNotAField
     adVmFieldUnavailable
+    adVmCannotCreateNode
     adVmCannotSetChild
     adVmCannotAddChild
     adVmCannotGetChild
@@ -1009,7 +1010,8 @@ type
         indexSpec*: tuple[usedIdx, minIdx, maxIdx: Int128]
       of adVmErrInternal, adVmNilAccess, adVmIllegalConv,
           adVmFieldUnavailable, adVmFieldNotFound,
-          adVmCacheKeyAlreadyExists, adVmMissingCacheKey:
+          adVmCacheKeyAlreadyExists, adVmMissingCacheKey,
+          adVmCannotCreateNode:
         msg*: string
       of adVmCannotSetChild, adVmCannotAddChild, adVmCannotGetChild,
           adVmUnhandledException, adVmNoType, adVmNodeNotASymbol:
diff --git a/compiler/ast/report_enums.nim b/compiler/ast/report_enums.nim
index 78a92bcdfd0..d4da99e7f74 100644
--- a/compiler/ast/report_enums.nim
+++ b/compiler/ast/report_enums.nim
@@ -247,6 +247,7 @@ type
     rvmCacheKeyAlreadyExists
     rvmFieldNotFound
     rvmFieldInavailable
+    rvmCannotCreateNode
     rvmCannotSetChild
     rvmCannotAddChild
     rvmCannotGetChild
diff --git a/compiler/front/cli_reporter.nim b/compiler/front/cli_reporter.nim
index cf89556fe88..cee55b31a27 100644
--- a/compiler/front/cli_reporter.nim
+++ b/compiler/front/cli_reporter.nim
@@ -2949,6 +2949,9 @@ proc reportBody*(conf: ConfigRef, r: VMReport): string =
   of rvmFieldNotFound:
     result = "node lacks field: " & r.str
 
+  of rvmCannotCreateNode:
+    result = "cannot manually create a node of kind: n" & r.str
+
   of rvmCannotSetChild:
     result = "cannot set child of node kind: n" & $r.ast.kind
 
@@ -3867,7 +3870,8 @@ func astDiagToLegacyReport(conf: ConfigRef, diag: PAstDiag): Report {.inline.} =
         location: some location,
         reportInst: diag.instLoc.toReportLineInfo)
     of rvmErrInternal, rvmNilAccess, rvmIllegalConv, rvmFieldInavailable,
-        rvmFieldNotFound, rvmCacheKeyAlreadyExists, rvmMissingCacheKey:
+        rvmFieldNotFound, rvmCacheKeyAlreadyExists, rvmMissingCacheKey,
+        rvmCannotCreateNode:
       vmRep = VMReport(
         kind: kind,
         str: diag.vmErr.msg,
diff --git a/compiler/front/msgs.nim b/compiler/front/msgs.nim
index 664906ce4ad..37dd2a33572 100644
--- a/compiler/front/msgs.nim
+++ b/compiler/front/msgs.nim
@@ -391,6 +391,7 @@ func astDiagVmToLegacyReportKind*(
   of adVmFieldNotFound: rvmFieldNotFound
   of adVmNotAField: rvmNotAField
   of adVmFieldUnavailable: rvmFieldInavailable
+  of adVmCannotCreateNode: rvmCannotCreateNode
   of adVmCannotSetChild: rvmCannotSetChild
   of adVmCannotAddChild: rvmCannotAddChild
   of adVmCannotGetChild: rvmCannotGetChild
diff --git a/compiler/vm/vm.nim b/compiler/vm/vm.nim
index 8ec5a6b354b..f36289117fa 100644
--- a/compiler/vm/vm.nim
+++ b/compiler/vm/vm.nim
@@ -2752,13 +2752,21 @@ proc rawExecute(c: var TCtx, t: var VmThread, pc: var int): YieldReason =
         raiseVmError(VmEvent(kind: vmEvtFieldNotFound, msg: "strVal"))
     of opcNNewNimNode:
       decodeBC(rkNimNode)
-      var k = regs[rb].intVal
+      let k = regs[rb].intVal
       guestValidate(k in 0..ord(high(TNodeKind)),
         "request to create a NimNode of invalid kind")
 
+      let kind = TNodeKind(int(k))
+      case kind
+      of nkError, nkIdent, nkSym, nkType:
+        # nodes that cannot be created manually
+        raiseVmError(VmEvent(kind: vmEvtCannotCreateNode, msg: $kind))
+      of nkWithSons, nkLiterals, nkCommentStmt, nkEmpty:
+        discard "the uninitialized state is valid"
+
       let cc = regs[rc].nimNode
 
-      let x = newNodeI(TNodeKind(int(k)),
+      let x = newNodeI(kind,
         if cc.kind != nkNilLit:
           cc.info
         elif c.comesFromHeuristic.line != 0'u16:
@@ -2767,8 +2775,7 @@ proc rawExecute(c: var TCtx, t: var VmThread, pc: var int): YieldReason =
           c.callsite[1].info
         else:
           c.debug[pc])
-      # prevent crashes in the compiler resulting from wrong macros:
-      if x.kind == nkIdent: x.ident = c.cache.emptyIdent
+
       regs[ra].nimNode = x
     of opcNCopyNimNode:
       decodeB(rkNimNode)
@@ -3017,6 +3024,7 @@ func vmEventToAstDiagVmError*(evt: VmEvent): AstDiagVmError {.inline.} =
     of vmEvtFieldNotFound: adVmFieldNotFound
     of vmEvtNotAField: adVmNotAField
     of vmEvtFieldUnavailable: adVmFieldUnavailable
+    of vmEvtCannotCreateNode: adVmCannotCreateNode
     of vmEvtCannotSetChild: adVmCannotSetChild
     of vmEvtCannotAddChild: adVmCannotAddChild
     of vmEvtCannotGetChild: adVmCannotGetChild
@@ -3048,7 +3056,8 @@ func vmEventToAstDiagVmError*(evt: VmEvent): AstDiagVmError {.inline.} =
           indexSpec: evt.indexSpec)
       of adVmErrInternal, adVmNilAccess, adVmIllegalConv,
           adVmFieldUnavailable, adVmFieldNotFound,
-          adVmCacheKeyAlreadyExists, adVmMissingCacheKey:
+          adVmCacheKeyAlreadyExists, adVmMissingCacheKey,
+          adVmCannotCreateNode:
         AstDiagVmError(
           kind: kind,
           msg: evt.msg)
diff --git a/compiler/vm/vmdef.nim b/compiler/vm/vmdef.nim
index c0b5653ebdc..7eb9b9935c9 100644
--- a/compiler/vm/vmdef.nim
+++ b/compiler/vm/vmdef.nim
@@ -598,6 +598,7 @@ type
     vmEvtFieldNotFound
     vmEvtNotAField
     vmEvtFieldUnavailable
+    vmEvtCannotCreateNode
     vmEvtCannotSetChild
     vmEvtCannotAddChild
     vmEvtCannotGetChild
@@ -623,7 +624,8 @@ type
         indexSpec*: tuple[usedIdx, minIdx, maxIdx: Int128]
       of vmEvtErrInternal, vmEvtNilAccess, vmEvtIllegalConv,
           vmEvtFieldUnavailable, vmEvtFieldNotFound,
-          vmEvtCacheKeyAlreadyExists, vmEvtMissingCacheKey:
+          vmEvtCacheKeyAlreadyExists, vmEvtMissingCacheKey,
+          vmEvtCannotCreateNode:
         msg*: string
       of vmEvtCannotSetChild, vmEvtCannotAddChild, vmEvtCannotGetChild,
          vmEvtNoType, vmEvtNodeNotASymbol:
diff --git a/compiler/vm/vmrunner.nim b/compiler/vm/vmrunner.nim
index a2f0e2e6678..2d097ec5f4c 100644
--- a/compiler/vm/vmrunner.nim
+++ b/compiler/vm/vmrunner.nim
@@ -273,6 +273,7 @@ func vmEventToLegacyReportKind(evt: VmEventKind): ReportKind {.inline.} =
   of vmEvtFieldNotFound: rvmFieldNotFound
   of vmEvtNotAField: rvmNotAField
   of vmEvtFieldUnavailable: rvmFieldInavailable
+  of vmEvtCannotCreateNode: rvmCannotCreateNode
   of vmEvtCannotSetChild: rvmCannotSetChild
   of vmEvtCannotAddChild: rvmCannotAddChild
   of vmEvtCannotGetChild: rvmCannotGetChild
diff --git a/tests/lang_callable/macros/tdisallow_create_special_nodes.nim b/tests/lang_callable/macros/tdisallow_create_special_nodes.nim
new file mode 100644
index 00000000000..4f138f39dfb
--- /dev/null
+++ b/tests/lang_callable/macros/tdisallow_create_special_nodes.nim
@@ -0,0 +1,26 @@
+discard """
+  description: '''
+    Ensure that an error is reported when attempting to create special
+    atom nodes with `newNimNode`
+  '''
+  matrix: "--errorMax:4"
+  action: reject
+"""
+
+import std/macros
+
+static:
+  discard newNimNode(nnkError) #[tt.Error
+                    ^ cannot manually create a node of kind: nnkError]#
+
+static:
+  discard newNimNode(nnkIdent) #[tt.Error
+                    ^ cannot manually create a node of kind: nnkIdent]#
+
+static:
+  discard newNimNode(nnkSym) #[tt.Error
+                    ^ cannot manually create a node of kind: nnkSym]#
+
+static:
+  discard newNimNode(nnkType) #[tt.Error
+                    ^ cannot manually create a node of kind: nnkType]#
diff --git a/tests/lang_callable/macros/tempty_type_nodes.nim b/tests/lang_callable/macros/tempty_type_nodes.nim
index 6ab3d3fc827..1dff4eec242 100644
--- a/tests/lang_callable/macros/tempty_type_nodes.nim
+++ b/tests/lang_callable/macros/tempty_type_nodes.nim
@@ -1,6 +1,6 @@
 discard """
   description: '''
-    Ensure that untyped `nnkEmpty` and `nnkType` nodes used in type positions
+    Ensure that untyped `nnkEmpty` nodes used in type positions
     result in a proper error
   '''
   target: native
@@ -17,11 +17,3 @@ macro test1(): untyped =
     newNimNode(nnkEmpty)
 
 test1()
-
-macro test2(): untyped =
-  # test case #2: untyped ``nnkType`` node in type position
-  nnkConv.newTree(newNimNode(nnkType)): #[tt.Error
-                            ^ type expected, but expression has no type]#
-    newNimNode(nnkEmpty)
-
-test2()

From 0d035765bf39a1ded566fc28566907a9bd803656 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Wed, 13 Mar 2024 01:44:27 +0100
Subject: [PATCH 031/169] cgir: remove the legacy CGIR variant (#1234)

## Summary

All code generators use the new goto-using variant of the CGIR now,
rendering the legacy variant obsolete. This is an internal-only
refactoring.

## Details

* remove the `cgirgen_legacy` module
* remove the node kinds belonging to the legacy variant
* remove the sets introduced for the transition
* remove some leftover usages of `cnkStmtListExpr` (they were dead code
  already)
---
 compiler/backend/backends.nim       |  10 +-
 compiler/backend/ccgexprs.nim       |   4 +-
 compiler/backend/cgir.nim           |  22 +-
 compiler/backend/cgirgen_legacy.nim | 920 ----------------------------
 compiler/backend/cgirutils.nim      |   2 +-
 compiler/backend/jsbackend.nim      |   3 +-
 compiler/backend/jsgen.nim          |  19 +-
 compiler/mir/mirbridge.nim          |   9 +-
 compiler/vm/vmgen.nim               |   4 +-
 9 files changed, 17 insertions(+), 976 deletions(-)
 delete mode 100644 compiler/backend/cgirgen_legacy.nim

diff --git a/compiler/backend/backends.nim b/compiler/backend/backends.nim
index 80b9999af09..b2cbf3fdf9a 100644
--- a/compiler/backend/backends.nim
+++ b/compiler/backend/backends.nim
@@ -15,8 +15,7 @@ import
   compiler/backend/[
     cgmeth,
     cgir,
-    cgirgen,
-    cgirgen_legacy
+    cgirgen
   ],
   compiler/front/[
     msgs,
@@ -371,13 +370,6 @@ proc generateIR*(graph: ModuleGraph, idgen: IdGenerator, env: MirEnv,
   result = cgirgen.generateIR(graph, idgen, env, owner, body)
   echoOutput(graph.config, owner, result)
 
-proc generateIRLegacy*(graph: ModuleGraph, idgen: IdGenerator, env: MirEnv,
-                 owner: PSym, body: sink MirBody): Body =
-  ## Translates the MIR code provided by `code` into legacy ``CgNode`` IR and,
-  ## if enabled, echoes the result.
-  result = cgirgen_legacy.generateIR(graph, idgen, env, owner, body)
-  echoOutput(graph.config, owner, result)
-
 # ------- handling of lifted globals ---------
 
 proc produceFragmentsForGlobals(
diff --git a/compiler/backend/ccgexprs.nim b/compiler/backend/ccgexprs.nim
index 1a1aa504c38..5a70078b869 100644
--- a/compiler/backend/ccgexprs.nim
+++ b/compiler/backend/ccgexprs.nim
@@ -2130,8 +2130,8 @@ proc expr(p: BProc, n: CgNode, d: var TLoc) =
   of cnkJoinStmt, cnkGotoStmt:
     unreachable("handled separately")
   of cnkInvalid, cnkType, cnkAstLit, cnkMagic, cnkRange, cnkBinding, cnkBranch,
-     cnkLabel, cnkTargetList, cnkStmtListExpr, cnkField, cnkStmtList,
-     cnkLeave, cnkResume, cnkLegacyNodes:
+     cnkLabel, cnkTargetList, cnkField, cnkStmtList,
+     cnkLeave, cnkResume:
     internalError(p.config, n.info, "expr(" & $n.kind & "); unknown node kind")
 
 proc getDefaultValue(p: BProc; typ: PType; info: TLineInfo): Rope =
diff --git a/compiler/backend/cgir.nim b/compiler/backend/cgir.nim
index 2b489202d4f..a19ac5e1704 100644
--- a/compiler/backend/cgir.nim
+++ b/compiler/backend/cgir.nim
@@ -105,9 +105,8 @@ type
                      ## different type
 
     cnkStmtList
-    cnkStmtListExpr
-    # XXX: both stmtlist and stmtlistexpr are obsolete. They're only kept for
-    #      grouping the top-level statements under a single node
+    # XXX: stmtlist is obsolete, and only kept temporarily to group statements
+    #      together under a single node
 
     cnkVoidStmt   ## discard the operand value (i.e., do nothing with it)
     cnkEmitStmt   ## an ``emit`` statement
@@ -115,20 +114,14 @@ type
 
     cnkIfStmt     ## only execute the body when the condition expression
                   ## evaluates to 'true'
-    cnkRepeatStmt ## execute the body indefinitely
     cnkCaseStmt   ## a ``case`` statement
     cnkBranch     ## the branch of a ``case`` statement
-    cnkBlockStmt  ## an (optionally) labeled block
-    cnkTryStmt
 
     cnkGotoStmt
     cnkLoopStmt   ## jump back to a loop join point
-    cnkBreakStmt  ## break out of labeled block, or, if no label is provided,
-                  ## the closest ``repeat`` loop
     cnkRaiseStmt  ## raise(x) -- set the `x` as the current exception and start
                   ## exceptional control-flow. `x` can be ``cnkEmpty`` in which
                   ## case "set current exception" part is skipped
-    cnkReturnStmt
     cnkContinueStmt## jump to the next target in the active jump list
 
     cnkJoinStmt   ## join point for gotos
@@ -155,19 +148,12 @@ const
   cnkWithOperand*  = {cnkConv, cnkHiddenConv, cnkDeref, cnkAddr, cnkHiddenAddr,
                       cnkDerefView, cnkObjDownConv, cnkObjUpConv, cnkCast,
                       cnkLvalueConv}
-  cnkAtoms*        = {cnkInvalid..cnkResume, cnkReturnStmt}
+  cnkAtoms*        = {cnkInvalid..cnkResume}
     ## node kinds that denote leafs
   cnkWithItems*    = AllKinds - cnkWithOperand - cnkAtoms
     ## node kinds for which the ``items`` iterator is available
 
   cnkLiterals* = {cnkIntLit, cnkUIntLit, cnkFloatLit, cnkStrLit}
-  cnkLegacyNodes* = {cnkBlockStmt, cnkTryStmt, cnkReturnStmt, cnkBreakStmt,
-                     cnkRepeatStmt}
-    ## node kinds that belong to the legacy control-flow representation
-  cnkNewCfNodes* = {cnkGotoStmt, cnkJoinStmt, cnkLeave, cnkResume,
-                    cnkContinueStmt, cnkLoopStmt, cnkLoopJoinStmt,
-                    cnkEnd, cnkTargetList}
-    ## node kinds that belong to the new-style control-flow representation
 
 type
   Local* = object
@@ -199,7 +185,7 @@ type
     info*: TLineInfo
     typ*: PType
     case kind*: CgNodeKind
-    of cnkInvalid, cnkEmpty, cnkType, cnkNilLit, cnkReturnStmt, cnkResume:
+    of cnkInvalid, cnkEmpty, cnkType, cnkNilLit, cnkResume:
       discard
     of cnkIntLit, cnkUIntLit:
       # future direction: use a ``BiggestUint`` for uint values
diff --git a/compiler/backend/cgirgen_legacy.nim b/compiler/backend/cgirgen_legacy.nim
deleted file mode 100644
index cb60ba0eae0..00000000000
--- a/compiler/backend/cgirgen_legacy.nim
+++ /dev/null
@@ -1,920 +0,0 @@
-## Implements the translation from the MIR to the ``CgNode`` IR. All code
-## reaching the code generation phase passes through here.
-##
-## .. note::
-##   The `tb` prefix that's still used in some places is an abbreviation of
-##   "translate back"
-##
-## .. note::
-##   The ``CgNode`` IR is slated for removal, with the MIR intended to take
-##   its place as the code-generator input.
-
-import
-  std/[
-    tables
-  ],
-  compiler/ast/[
-    ast_types,
-    ast_idgen,
-    ast_query,
-    lineinfos,
-    types
-  ],
-  compiler/backend/[
-    cgir
-  ],
-  compiler/front/[
-    options
-  ],
-  compiler/mir/[
-    mirbodies,
-    mirenv,
-    mirtrees,
-    sourcemaps
-  ],
-  compiler/modules/[
-    modulegraphs
-  ],
-  compiler/utils/[
-    containers,
-    idioms,
-    int128
-  ]
-
-from compiler/ast/ast import newSym, newType, rawAddSon
-from compiler/sem/semdata import makeVarType
-
-type
-  TranslateCl = object
-    graph: ModuleGraph
-    idgen: IdGenerator
-
-    owner: PSym
-
-    tempMap: SeqMap[TempId, LocalId]
-      ## maps a ``TempId`` to the ID of the local created for it
-    localsMap: Table[int, LocalId]
-      ## maps a sybmol ID to the corresponding local. Needed because normal
-      ## local variables reach here as ``PSym``s
-    blocks: seq[LabelId]
-      ## the stack of enclosing blocks for the currently processed node
-
-    locals: Store[LocalId, Local]
-      ## the in-progress list of all locals in the translated body
-
-    # a 'def' in the MIR means that the the local starts to exists and that it
-    # is accessible in all connected basic blocks part of the enclosing
-    # ``mnkScope``. The ``CgNode`` IR doesn't use same notion of scope,
-    # so for now, all 'def's (without the initial values) within nested
-    # control-flow-related trees are moved to the start of the enclosing
-    # ``mnkScope``.
-    inUnscoped: bool
-      ## whether the currently proceesed statement/expression is part of an
-      ## unscoped control-flow context
-    defs: seq[CgNode]
-      ## the stack of locals/globals for which the ``cnkDef``/assignemnt needs
-      ## to be inserted later
-
-  TreeCursor = object
-    ## A cursor into a ``MirBody``.
-    pos: uint32 ## the index of the currently pointed to node
-    origin {.cursor.}: PNode ## the source node
-
-func newMagicNode(magic: TMagic, info: TLineInfo): CgNode =
-  CgNode(kind: cnkMagic, info: info, magic: magic)
-
-func get(t: MirBody, cr: var TreeCursor): lent MirNode {.inline.} =
-  cr.origin = t.sourceFor(cr.pos.NodePosition)
-  result = t.code[cr.pos]
-
-  inc cr.pos
-
-func enter(t: MirBody, cr: var TreeCursor): lent MirNode {.inline.} =
-  assert t.code[cr.pos].kind in SubTreeNodes, "not a sub-tree"
-  result = get(t, cr)
-
-func leave(t: MirBody, cr: var TreeCursor) =
-  assert t.code[cr.pos].kind == mnkEnd, "not at the end of sub-tree"
-  inc cr.pos
-
-template info(cr: TreeCursor): TLineInfo =
-  cr.origin.info
-
-template `[]`(t: MirBody, cr: TreeCursor): untyped =
-  t.code[cr.pos]
-
-template hasNext(cr: TreeCursor, t: MirBody): bool =
-  cr.pos.int < t.code.len
-
-template `[]=`(x: CgNode, i: Natural, n: CgNode) =
-  x.kids[i] = n
-
-template `[]=`(x: CgNode, i: BackwardsIndex, n: CgNode) =
-  x.kids[i] = n
-
-template add(x: CgNode, y: CgNode) =
-  x.kids.add y
-
-proc copyTree(n: CgNode): CgNode =
-  case n.kind
-  of cnkAtoms:
-    new(result)
-    result[] = n[]
-  of cnkWithOperand:
-    result = CgNode(kind: n.kind, info: n.info, typ: n.typ)
-    result.operand = copyTree(n.operand)
-  of cnkWithItems:
-    result = CgNode(kind: n.kind, info: n.info, typ: n.typ)
-    result.kids.setLen(n.kids.len)
-    for i, it in n.pairs:
-      result[i] = copyTree(it)
-
-proc newEmpty(info = unknownLineInfo): CgNode =
-  CgNode(kind: cnkEmpty, info: info)
-
-proc newTree(kind: CgNodeKind, info: TLineInfo, kids: varargs[CgNode]): CgNode =
-  ## For node kinds that don't represent standalone statements.
-  result = CgNode(kind: kind, info: info)
-  result.kids = @kids
-
-func newTypeNode(info: TLineInfo, typ: PType): CgNode =
-  CgNode(kind: cnkType, info: info, typ: typ)
-
-func newFieldNode(s: PSym; info = unknownLineInfo): CgNode =
-  CgNode(kind: cnkField, info: info, typ: s.typ, field: s)
-
-func newLabelNode(blk: BlockId; info = unknownLineInfo): CgNode =
-  CgNode(kind: cnkLabel, info: info, label: blk)
-
-proc newExpr(kind: CgNodeKind, info: TLineInfo, typ: PType,
-             kids: sink seq[CgNode]): CgNode =
-  ## Variant of ``newExpr`` optimized for passing a pre-existing child
-  ## node sequence.
-  result = CgNode(kind: kind, info: info, typ: typ)
-  result.kids = kids
-
-proc translateLit*(val: PNode): CgNode =
-  ## Translates an ``mnkLiteral`` node to a ``CgNode``.
-  ## Note that the MIR not only uses ``mnkLiteral`` for "real" literals, but
-  ## also for pushing other raw ``PNode``s through the MIR phase.
-  template node(k: CgNodeKind, field, value: untyped): CgNode =
-    CgNode(kind: k, info: val.info, typ: val.typ, field: value)
-
-  case val.kind
-  of nkIntLiterals:
-    # use the type for deciding what whether it's a signed or unsigned value
-    case val.typ.skipTypes(abstractRange + {tyEnum}).kind
-    of tyInt..tyInt64, tyBool:
-      node(cnkIntLit, intVal, val.intVal)
-    of tyUInt..tyUInt64, tyChar:
-      node(cnkUIntLit, intVal, val.intVal)
-    of tyPtr, tyPointer, tyProc:
-      # XXX: consider adding a dedicated node for pointer-like-literals
-      #      to both ``PNode`` and ``CgNode``
-      node(cnkUIntLit, intVal, val.intVal)
-    else:
-      unreachable(val.typ.skipTypes(abstractRange).kind)
-  of nkFloatLiterals:
-    case val.typ.skipTypes(abstractRange).kind
-    of tyFloat, tyFloat64:
-      node(cnkFloatLit, floatVal, val.floatVal)
-    of tyFloat32:
-      # all code-generators need to do this at one point, so we help them out
-      # by narrowing the value to a float32 value
-      node(cnkFloatLit, floatVal, val.floatVal.float32.float64)
-    else:
-      unreachable()
-  of nkStrKinds:
-    node(cnkStrLit, strVal, val.strVal)
-  of nkNilLit:
-    newNode(cnkNilLit, val.info, val.typ)
-  of nkNimNodeLit:
-    node(cnkAstLit, astLit, val[0])
-  of nkRange:
-    node(cnkRange, kids, @[translateLit(val[0]), translateLit(val[1])])
-  of nkSym:
-    # special case for raw symbols used with emit and asm statements
-    assert val.sym.kind == skField
-    node(cnkField, field, val.sym)
-  else:
-    unreachable("implement: " & $val.kind)
-
-func addIfNotEmpty(stmts: var seq[CgNode], n: sink CgNode) =
-  ## Only adds the node to the list if it's not an empty node. Used to prevent
-  ## the creation of statement-list expression that only consist of empty
-  ## nodes + the result-expression (a statement-list expression is unnecessary
-  ## in that case)
-  if n.kind != cnkEmpty:
-    stmts.add n
-
-func toSingleNode(stmts: sink seq[CgNode]): CgNode =
-  ## Creates a single ``CgNode`` from a list of *statements*
-  case stmts.len
-  of 0:
-    result = newEmpty()
-  of 1:
-    result = move stmts[0]
-  else:
-    result = newNode(cnkStmtList)
-    result.kids = stmts
-
-proc newDefaultCall(info: TLineInfo, typ: PType): CgNode =
-  ## Produces the tree for a ``default`` magic call.
-  newExpr(cnkCall, info, typ, [newMagicNode(mDefault, info)])
-
-proc initLocal(s: PSym): Local =
-  ## Inits a ``Local`` with the data from `s`.
-  result = Local(typ: s.typ, flags: s.flags, isImmutable: (s.kind == skLet),
-                 name: s.name)
-  if s.kind in {skVar, skLet, skForVar}:
-    result.alignment = s.alignment.uint32
-
-proc wrapInHiddenAddr(cl: TranslateCl, n: CgNode): CgNode =
-  ## Restores the ``cnkHiddenAddr`` around lvalue expressions passed to ``var``
-  ## parameters. The code-generators operating on ``CgNode``-IR depend on the
-  ## hidden addr to be present
-  if n.typ.skipTypes(abstractInst).kind != tyVar:
-    newOp(cnkHiddenAddr, n.info, makeVarType(cl.owner, n.typ, cl.idgen), n)
-  else:
-    # XXX: is this case ever reached? It should not be. Raw ``var`` values
-    #      must never be passed directly to ``var`` parameters at the MIR
-    #      level
-    n
-
-proc genObjConv(n: CgNode, a, b, t: PType): CgNode =
-  ## Depending on the relationship between `a` and `b`, wraps `n` in either an
-  ## up- or down-conversion. `t` is the type to use for the resulting
-  ## expression
-  let diff = inheritanceDiff(b, a)
-  #echo "a: ", a.sym.name.s, "; b: ", b.sym.name.s
-  #assert diff != 0 and diff != high(int), "redundant or illegal conversion"
-  if diff == 0:
-    return nil
-  result = newOp(
-    if diff < 0: cnkObjUpConv else: cnkObjDownConv,
-    n.info, t): n
-
-# forward declarations:
-proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
-              cr: var TreeCursor): CgNode
-proc scopeToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
-               cr: var TreeCursor, allowExpr=false): seq[CgNode]
-
-proc handleSpecialConv(c: ConfigRef, n: CgNode, info: TLineInfo,
-                       dest: PType): CgNode =
-  ## Checks if a special conversion operator is required for a conversion
-  ## between the source type (i.e. that of `n`) and the destination type.
-  ## If it is, generates the conversion operation IR and returns it -- nil
-  ## otherwise
-  let
-    orig = dest
-    source = n.typ.skipTypes(abstractVarRange)
-    dest = dest.skipTypes(abstractVarRange)
-
-  case dest.kind
-  of tyObject:
-    assert source.kind == tyObject
-    genObjConv(n, source, dest, orig)
-  of tyRef, tyPtr, tyVar, tyLent:
-    assert source.kind == dest.kind
-    if source.base.kind == tyObject:
-      genObjConv(n, source.base, dest.base, orig)
-    else:
-      nil
-  else:
-    nil
-
-proc convToIr(cl: TranslateCl, n: CgNode, info: TLineInfo, dest: PType): CgNode =
-  ## Generates the ``CgNode`` IR for an ``mnkPathConv`` operation (handle
-  ## conversion).
-  result = handleSpecialConv(cl.graph.config, n, info, dest)
-  if result == nil:
-    # no special conversion is used
-    result = newOp(cnkLvalueConv, info, dest, n)
-
-proc atomToIr(n: MirNode, cl: TranslateCl, info: TLineInfo): CgNode =
-  case n.kind
-  of mnkProc:
-    CgNode(kind: cnkProc, info: info, typ: n.typ, prc: n.prc)
-  of mnkGlobal:
-    CgNode(kind: cnkGlobal, info: info, typ: n.typ, global: n.global)
-  of mnkConst:
-    CgNode(kind: cnkConst, info: info, typ: n.typ, cnst: n.cnst)
-  of mnkLocal, mnkParam:
-    # paramaters are treated like locals in the code generators
-    assert n.sym.id in cl.localsMap
-    newLocalRef(cl.localsMap[n.sym.id], info, n.sym.typ)
-  of mnkTemp:
-    newLocalRef(cl.tempMap[n.temp], info, n.typ)
-  of mnkAlias:
-    # the type of the node doesn't match the real one
-    let
-      id = cl.tempMap[n.temp]
-      typ = cl.locals[id].typ
-    # the view is auto-dereferenced here for convenience
-    newOp(cnkDerefView, info, typ.base, newLocalRef(id, info, typ))
-  of mnkLiteral:
-    translateLit(n.lit)
-  of mnkType:
-    newTypeNode(info, n.typ)
-  of mnkNone:
-    # type arguments do use `mnkNone` in some situtations, so keep
-    # the type
-    CgNode(kind: cnkEmpty, info: info, typ: n.typ)
-  else:
-    unreachable("not an atom: " & $n.kind)
-
-proc atomToIr(tree: MirBody, cl: var TranslateCl,
-              cr: var TreeCursor): CgNode {.inline.} =
-  atomToIr(get(tree, cr), cl, cr.info)
-
-proc tbExceptItem(tree: MirBody, cl: var TranslateCl, cr: var TreeCursor
-                 ): CgNode =
-  let n {.cursor.} = get(tree, cr)
-  case n.kind
-  of mnkLocal:
-    # the 'except' branch acts as a definition for the local
-    let id = cl.locals.add initLocal(n.sym)
-    cl.localsMap[n.sym.id] = id
-    newLocalRef(id, cr.info, n.typ)
-  of mnkType:  newTypeNode(cr.info, n.typ)
-  else:        unreachable()
-
-
-proc lvalueToIr(tree: MirBody, cl: var TranslateCl, n: MirNode,
-                cr: var TreeCursor; preferField = true): CgNode =
-  ## Translates a MIR lvalue expression to the corresponding CG IR.
-  ## Due to tagged unions (currently) not being addressable at the type-
-  ## representation level, the exact meaning of ``mnkPathVariant`` is
-  ## context-dependent -- `preferField` disambiguates whether it should be
-  ## turned into a field access rather than a (pseudo) access of the tagged
-  ## union.
-  let info = cr.info
-
-  template recurse(): CgNode =
-    lvalueToIr(tree, cl, tree.get(cr), cr, false)
-
-  case n.kind
-  of mnkLocal, mnkGlobal, mnkParam, mnkTemp, mnkAlias, mnkConst, mnkProc:
-    return atomToIr(n, cl, info)
-  of mnkPathNamed:
-    result = newExpr(cnkFieldAccess, info, n.typ,
-                     [recurse(), newFieldNode(n.field)])
-  of mnkPathVariant:
-    if preferField:
-      result = newExpr(cnkFieldAccess, cr.info, n.field.typ,
-                      [recurse(), newFieldNode(n.field)])
-    else:
-      # variant access itself has no ``CgNode`` counterpart at the moment
-      result = recurse()
-  of mnkPathPos:
-    result = newExpr(cnkTupleAccess, info, n.typ,
-                     [recurse(),
-                      CgNode(kind: cnkIntLit, intVal: n.position.BiggestInt)])
-  of mnkPathArray:
-    # special case in order to support string literal access
-    # XXX: this needs to be removed once there is a dedicated run-time-
-    #      sequence access operator
-    let arg =
-      if tree[cr].kind == mnkLiteral:
-        atomToIr(tree, cl, cr)
-      else:
-        recurse()
-
-    result = newExpr(cnkArrayAccess, info, n.typ, [arg, atomToIr(tree, cl, cr)])
-  of mnkPathConv:
-    result = convToIr(cl, recurse(), info, n.typ)
-  # dereferences are allowed at the end of a path tree
-  of mnkDeref:
-    result = newOp(cnkDeref, info, n.typ, atomToIr(tree, cl, cr))
-  of mnkDerefView:
-    result = newOp(cnkDerefView, info, n.typ, atomToIr(tree, cl, cr))
-  of AllNodeKinds - LvalueExprKinds - {mnkProc}:
-    unreachable(n.kind)
-
-  leave(tree, cr)
-
-proc lvalueToIr(tree: MirBody, cl: var TranslateCl,
-                cr: var TreeCursor; preferField=true): CgNode {.inline.} =
-  lvalueToIr(tree, cl, tree.get(cr), cr, preferField)
-
-proc valueToIr(tree: MirBody, cl: var TranslateCl,
-               cr: var TreeCursor): CgNode =
-  case tree[cr].kind
-  of mnkProc, mnkConst, mnkGlobal, mnkParam, mnkLocal, mnkTemp, mnkAlias,
-     mnkLiteral, mnkType:
-    atomToIr(tree, cl, cr)
-  of mnkPathPos, mnkPathNamed, mnkPathArray, mnkPathConv, mnkPathVariant,
-     mnkDeref, mnkDerefView:
-    lvalueToIr(tree, cl, cr)
-  else:
-    unreachable("not a value: " & $tree[cr].kind)
-
-proc argToIr(tree: MirBody, cl: var TranslateCl,
-             cr: var TreeCursor): (bool, CgNode) =
-  ## Translates a MIR argument tree to the corresponding CG IR tree.
-  ## Returns both the tree and whether the argumnet was wrapped in a tag
-  ## operator (which indicates that the parameter is a ``var`` parameter).
-  var n {.cursor.} = tree.get(cr)
-  assert n.kind in ArgumentNodes, "argument node expected: " & $n.kind
-  # the inner node may be a tag node
-  n = tree.get(cr)
-  case n.kind
-  of mnkTag:
-    # it is one, the expression must be an lvalue
-    result = (true, lvalueToIr(tree, cl, cr))
-    leave(tree, cr)
-  of mnkLiteral, mnkType, mnkProc, mnkNone:
-    # not a tag but an atom
-    result = (false, atomToIr(n, cl, cr.info))
-  of LvalueExprKinds:
-    result = (false, lvalueToIr(tree, cl, n, cr))
-  else:
-    unreachable("not a valid argument expression")
-
-  leave(tree, cr)
-
-proc callToIr(tree: MirBody, cl: var TranslateCl, n: MirNode,
-              cr: var TreeCursor): CgNode =
-  ## Translate a valid call-like tree to the CG IR.
-  let info = cr.info
-  result = newExpr((if n.kind == mnkCall: cnkCall else: cnkCheckedCall),
-                   info, n.typ)
-  result.add: # the callee
-    case tree[cr].kind
-    of mnkMagic: newMagicNode(tree.get(cr).magic, info)
-    else:        valueToIr(tree, cl, cr)
-
-  # the code generators currently require some magics to not have any
-  # arguments wrapped in ``cnkHiddenAddr`` nodes
-  let noAddr = result[0].kind == cnkMagic and
-               result[0].magic in FakeVarParams
-
-  # translate the arguments:
-  while tree[cr].kind != mnkEnd:
-    var (mutable, arg) = argToIr(tree, cl, cr)
-    if noAddr:
-      if arg.typ.kind == tyVar:
-        # auto-dereference the view
-        # XXX: prevent this case from happening
-        arg = newOp(cnkDerefView, arg.info, arg.typ.base, arg)
-    elif mutable:
-      arg = wrapInHiddenAddr(cl, arg)
-
-    result.add arg
-
-  leave(tree, cr)
-
-proc exprToIr(tree: MirBody, cl: var TranslateCl, cr: var TreeCursor): CgNode
-
-proc sourceExprToIr(tree: MirBody, cl: var TranslateCl,
-                    cr: var TreeCursor): tuple[n: CgNode, useFast: bool] =
-  ## Translates the MIR expression appearing in an assignment's source
-  ## slot. Assignment modifiers are dropped, and whether a fast assignment or
-  ## normal assignment should be used is computed and returned.
-  case tree[cr].kind
-  of mnkCopy, mnkSink:
-    # requires a full assignment
-    discard enter(tree, cr)
-    result = (valueToIr(tree, cl, cr), false)
-    leave(tree, cr)
-  of mnkMove:
-    # an ``x = move y`` assignment can be turned into a fast assignment
-    discard enter(tree, cr)
-    result = (valueToIr(tree, cl, cr), true)
-    leave(tree, cr)
-  of LvalueExprKinds:
-    # a fast assignment is correct for all raw lvalues
-    result = (lvalueToIr(tree, cl, cr), true)
-  else:
-    # rvalue expressions require a full assignment
-    result = (exprToIr(tree, cl, cr), false)
-
-proc defToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
-           n: MirNode, cr: var TreeCursor): CgNode =
-  ## Translates a 'def'-like construct
-  assert n.kind in DefNodes
-  let
-    entity {.cursor.} = get(tree, cr) # the name of the defined entity
-    info = cr.info
-
-  var def: CgNode
-
-  case entity.kind
-  of mnkLocal:
-    # translate the ``PSym`` to a ``Local`` and establish a mapping
-    let
-      sym = entity.sym
-      id = cl.locals.add initLocal(sym)
-
-    assert sym.id notin cl.localsMap, "re-definition of local"
-    cl.localsMap[sym.id] = id
-
-    def = newLocalRef(id, info, entity.typ)
-  of mnkParam:
-    # ignore 'def's for parameters
-    def = newEmpty()
-  of mnkGlobal:
-    def = CgNode(kind: cnkGlobal, info: info, typ: entity.typ,
-                 global: entity.global)
-  of mnkTemp:
-    # MIR temporaries are like normal locals, with the difference that they
-    # are created ad-hoc and don't have any extra information attached
-    assert entity.typ != nil
-    let tmp = cl.locals.add Local(typ: entity.typ)
-
-    assert entity.temp notin cl.tempMap, "re-definition of temporary"
-    cl.tempMap[entity.temp] = tmp
-
-    def = newLocalRef(tmp, info, entity.typ)
-  of mnkAlias:
-    # MIR aliases are translated to var/lent views
-    assert n.kind in {mnkBind, mnkBindMut}, "alias can only be defined by binds"
-    assert entity.typ != nil
-    let
-      typ = makeVarType(cl.owner, entity.typ, cl.idgen,
-                        if n.kind == mnkBind: tyLent else: tyVar)
-      tmp = cl.locals.add Local(typ: typ)
-
-    assert entity.temp notin cl.tempMap, "re-definition of temporary"
-    cl.tempMap[entity.temp] = tmp
-
-    def = newLocalRef(tmp, info, typ)
-  else:
-    unreachable()
-
-  var arg =
-    if n.kind in {mnkBind, mnkBindMut} and tree[cr].kind in LvalueExprKinds:
-      # don't use the field interperation for variant access
-      lvalueToIr(tree, cl, cr, preferField=false)
-    else:
-      sourceExprToIr(tree, cl, cr)[0]
-  leave(tree, cr)
-  if n.kind in {mnkBind, mnkBindMut} and arg.typ.kind notin {tyVar, tyLent}:
-    # wrap the operand in an address-of operation
-    arg = newOp(cnkHiddenAddr, info, def.typ, arg)
-
-  let isLet = (entity.kind == mnkTemp and n.kind == mnkDefCursor) or
-              (entity.kind == mnkTemp and not hasDestructor(def.typ)) or
-              (entity.kind == mnkAlias)
-  # to reduce the pressure on the code generator, locals that never cross
-  # structured control-flow boundaries are not lifted. As a temporary
-  # measure, cursor temporaries and aliases are treated as such, but
-  # do note that this is not guaranteed and relies on how `mirgen`
-  # produces MIR code
-
-  case def.kind
-  of cnkLocal:
-    if cl.inUnscoped and not isLet:
-      # add the local to the list of moved definitions and only emit
-      # an assignment
-      cl.defs.add copyTree(def)
-      result =
-        case arg.kind
-        of cnkEmpty: arg
-        else:        newStmt(cnkAsgn, info, [def, arg])
-    else:
-      result = newStmt(cnkDef, info, [def, arg])
-  of cnkGlobal:
-    # there are no defs for globals in the ``CgNode`` IR, so we
-    # emit an assignment that has the equivalent behaviour (in
-    # terms of initialization)
-    case arg.kind
-    of cnkEmpty:
-      if sfImportc in env.globals[def.global].flags:
-        # for imported globals, the 'def' only means that the symbol becomes
-        # known to us, not that it starts its lifetime here -> don't
-        # initialize or move it
-        result = arg
-      elif cl.inUnscoped:
-        # move the default initialization to the start of the scope
-        cl.defs.add def
-        result = arg
-      else:
-        result = newStmt(cnkAsgn, info, [def, newDefaultCall(info, def.typ)])
-    else:
-      if sfImportc notin env.globals[def.global].flags and cl.inUnscoped:
-        # default intialization is required at the start of the scope
-        cl.defs.add def
-      result = newStmt(cnkAsgn, info, [def, arg])
-  of cnkEmpty:
-    result = def
-  else:
-    unreachable()
-
-proc bodyToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
-              cr: var TreeCursor): CgNode =
-  ## Generates the ``CgNode`` tree for the body of a construct that implies
-  ## some form of control-flow.
-  let prev = cl.inUnscoped
-  # assume the body is unscoped until stated otherwise
-  cl.inUnscoped = true
-  result = stmtToIr(tree, env, cl, cr)
-  cl.inUnscoped = prev
-
-proc caseToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl, n: MirNode,
-              cr: var TreeCursor): CgNode
-
-proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
-              cr: var TreeCursor): CgNode =
-  let n {.cursor.} = tree.get(cr)
-  let info = cr.info ## the source information of `n`
-
-  template body(): CgNode =
-    bodyToIr(tree, env, cl, cr)
-
-  template to(kind: CgNodeKind, args: varargs[untyped]): CgNode =
-    let r = newStmt(kind, info, args)
-    leave(tree, cr)
-    r
-
-  template toList(k: CgNodeKind, body: untyped): CgNode =
-    let res {.inject.} = newStmt(k, info)
-    while tree[cr].kind != mnkEnd:
-      body
-    leave(tree, cr)
-    res
-
-  case n.kind
-  of DefNodes:
-    defToIr(tree, env, cl, n, cr)
-  of mnkAsgn, mnkInit, mnkSwitch:
-    let
-      dst = lvalueToIr(tree, cl, cr)
-      (src, useFast) = sourceExprToIr(tree, cl, cr)
-    to (if useFast: cnkFastAsgn else: cnkAsgn), dst, src
-  of mnkRepeat:
-    to cnkRepeatStmt, body()
-  of mnkBlock:
-    cl.blocks.add n.label # push the label to the stack
-    let body = body()
-    cl.blocks.setLen(cl.blocks.len - 1) # pop block from the stack
-    to cnkBlockStmt, newLabelNode(cl.blocks.len.BlockId, info), body
-  of mnkTry:
-    let res = newStmt(cnkTryStmt, info, [body()])
-    assert n.len <= 2
-
-    for _ in 0..<n.len:
-      let it {.cursor.} = enter(tree, cr)
-
-      case it.kind
-      of mnkExcept:
-        for _ in 0..<it.len:
-          let br {.cursor.} = enter(tree, cr)
-          assert br.kind == mnkBranch
-
-          let excpt = newNode(cnkExcept, cr.info)
-          for j in 0..<br.len:
-            excpt.add tbExceptItem(tree, cl, cr)
-
-          excpt.add body()
-          res.add excpt
-
-          leave(tree, cr)
-
-      of mnkFinally:
-        res.add newTree(cnkFinally, cr.info, body())
-      else:
-        unreachable(it.kind)
-
-      leave(tree, cr)
-
-    leave(tree, cr)
-    res
-  of mnkBreak:
-    # find the stack index of the enclosing 'block' identified by the break's
-    # label; we use the index as the ID
-    var idx = cl.blocks.high
-    while idx >= 0 and cl.blocks[idx] != n.label:
-      dec idx
-    newStmt(cnkBreakStmt, info, [newLabelNode(BlockId idx, info)])
-  of mnkReturn:
-    newNode(cnkReturnStmt, info)
-  of mnkVoid:
-    var res = exprToIr(tree, cl, cr)
-    if res.typ.isEmptyType():
-      # a void expression doesn't need to be discarded
-      discard
-    else:
-      res = newStmt(cnkVoidStmt, info, [res])
-    leave(tree, cr)
-    res
-  of mnkIf:
-    to cnkIfStmt, valueToIr(tree, cl, cr), body()
-  of mnkRaise:
-    # the operand can either be empty or an lvalue expression
-    to cnkRaiseStmt:
-      case tree[cr].kind
-      of mnkNone: atomToIr(tree, cl, cr)
-      else:       lvalueToIr(tree, cl, cr)
-  of mnkCase:
-    caseToIr(tree, env, cl, n, cr)
-  of mnkAsm:
-    toList cnkAsmStmt:
-      res.add valueToIr(tree, cl, cr)
-  of mnkEmit:
-    toList cnkEmitStmt:
-      res.add valueToIr(tree, cl, cr)
-  of mnkStmtList:
-    toList cnkStmtList:
-      res.kids.addIfNotEmpty stmtToIr(tree, env, cl, cr)
-  of mnkScope:
-    toSingleNode scopeToIr(tree, env, cl, cr)
-  of mnkDestroy:
-    unreachable("a 'destroy' that wasn't lowered")
-  of AllNodeKinds - StmtNodes:
-    unreachable(n.kind)
-
-proc caseToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl, n: MirNode,
-              cr: var TreeCursor): CgNode =
-  assert n.kind == mnkCase
-  result = newStmt(cnkCaseStmt, cr.info, [valueToIr(tree, cl, cr)])
-  for j in 0..<n.len:
-    let br {.cursor.} = enter(tree, cr)
-
-    result.add newTree(cnkBranch, cr.info)
-    if br.len > 0:
-      for x in 0..<br.len:
-        assert tree[cr].kind in {mnkConst, mnkLiteral}
-        result[^1].add atomToIr(tree, cl, cr)
-
-    result[^1].add bodyToIr(tree, env, cl, cr)
-    leave(tree, cr)
-
-  leave(tree, cr)
-
-proc exprToIr(tree: MirBody, cl: var TranslateCl,
-              cr: var TreeCursor): CgNode =
-  ## Translates a MIR expression to the corresponding CG IR representation.
-  ## Moves the cursor to the next tree item.
-  let n {.cursor.} = get(tree, cr)
-  let info = cr.info
-
-  template op(kind: CgNodeKind, e: CgNode): CgNode =
-    let r = newOp(kind, info, n.typ, e)
-    leave(tree, cr)
-    r
-
-  template treeOp(k: CgNodeKind, body: untyped): CgNode =
-    let res {.inject.} = newExpr(k, info, n.typ)
-    while tree[cr].kind != mnkEnd:
-      body
-    leave(tree, cr)
-    res
-
-  case n.kind
-  of Atoms:
-    atomToIr(n, cl, info)
-  of mnkPathVariant, mnkPathArray, mnkPathConv, mnkPathNamed, mnkPathPos:
-    lvalueToIr(tree, cl, n, cr)
-  of mnkCast:
-    op cnkCast, valueToIr(tree, cl, cr)
-  of mnkConv:
-    op cnkConv, valueToIr(tree, cl, cr)
-  of mnkStdConv:
-    op cnkHiddenConv, valueToIr(tree, cl, cr)
-  of mnkToSlice:
-    treeOp cnkToSlice:
-      res.add valueToIr(tree, cl, cr)
-  of mnkAddr:
-    op cnkAddr, lvalueToIr(tree, cl, cr)
-  of mnkDeref:
-    op cnkDeref, atomToIr(tree, cl, cr)
-  of mnkView:
-    op cnkHiddenAddr, lvalueToIr(tree, cl, cr)
-  of mnkDerefView:
-    op cnkDerefView, atomToIr(tree, cl, cr)
-  of mnkObjConstr:
-    assert n.typ.skipTypes(abstractVarRange).kind in {tyObject, tyRef}
-    treeOp cnkObjConstr:
-      let f = newFieldNode(get(tree, cr).field)
-      res.add newTree(cnkBinding, cr.info, [f, argToIr(tree, cl, cr)[1]])
-  of mnkConstr:
-    let typ = n.typ.skipTypes(abstractVarRange)
-
-    let kind =
-      case typ.kind
-      of tySet:               cnkSetConstr
-      of tyArray, tySequence: cnkArrayConstr
-      of tyTuple:             cnkTupleConstr
-      of tyProc:
-        assert typ.callConv == ccClosure
-        cnkClosureConstr
-      else:
-        unreachable(typ.kind)
-
-    treeOp kind:
-      res.add argToIr(tree, cl, cr)[1]
-  of mnkCall, mnkCheckedCall:
-    callToIr(tree, cl, n, cr)
-  of UnaryOps:
-    const Map = [mnkNeg: cnkNeg]
-    treeOp Map[n.kind]:
-      res.add valueToIr(tree, cl, cr)
-  of BinaryOps:
-    const Map = [mnkAdd: cnkAdd, mnkSub: cnkSub,
-                 mnkMul: cnkMul, mnkDiv: cnkDiv, mnkModI: cnkModI]
-    treeOp Map[n.kind]:
-      res.kids = @[valueToIr(tree, cl, cr), valueToIr(tree, cl, cr)]
-  of mnkCopy, mnkMove, mnkSink:
-    # translation of assignments needs to handle all modifiers
-    unreachable("loose assignment modifier")
-  of AllNodeKinds - ExprKinds - {mnkNone}:
-    unreachable(n.kind)
-
-proc genDefFor(sym: sink CgNode): CgNode =
-  ## Produces the statement tree of a definition for the given symbol-like
-  ## node. Globals use an assignment.
-  case sym.kind
-  of cnkLocal:
-    newStmt(cnkDef, sym.info, [sym, newEmpty()])
-  of cnkGlobal:
-    # emulate the default-initialization behaviour
-    newStmt(cnkAsgn, sym.info, [sym, newDefaultCall(sym.info, sym.typ)])
-  else:
-    unreachable()
-
-proc scopeToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
-               cr: var TreeCursor, allowExpr = false): seq[CgNode] =
-  let
-    ends =
-      if allowExpr: {mnkEnd} + Atoms
-      else:         {mnkEnd}
-    prev = cl.defs.len
-    prevInUnscoped = cl.inUnscoped
-
-  # a scope is entered, meaning that we're no longer in an unscoped context
-  cl.inUnscoped = false
-
-  var stmts: seq[CgNode]
-  # translate all statements:
-  while cr.hasNext(tree) and tree[cr].kind notin ends:
-    stmts.addIfNotEmpty stmtToIr(tree, env, cl, cr)
-
-  if cr.hasNext(tree) and tree[cr].kind == mnkEnd:
-    leave(tree, cr) # close the sub-tree
-
-  if cl.defs.len > prev:
-    # insert all the lifted defs at the start
-    for i in countdown(cl.defs.high, prev):
-      stmts.insert genDefFor(move cl.defs[i])
-
-    # "pop" the elements that were added as part of this scope:
-    cl.defs.setLen(prev)
-
-  cl.inUnscoped = prevInUnscoped
-
-  result = stmts
-
-proc tb(tree: MirBody, env: MirEnv, cl: var TranslateCl,
-        start: NodePosition): CgNode =
-  ## Translate `tree` to the corresponding ``CgNode`` representation.
-  var cr = TreeCursor(pos: start.uint32)
-  var nodes = scopeToIr(tree, env, cl, cr, allowExpr=true)
-  if cr.hasNext(tree):
-    # the tree must be an expression; the last node is required to be an atom
-    let x = atomToIr(tree, cl, cr)
-    if nodes.len == 0:
-      x
-    else:
-      nodes.add x
-      newExpr(cnkStmtListExpr, unknownLineInfo, nodes[^1].typ, nodes)
-  else:
-    # it's a statement list
-    toSingleNode nodes
-
-proc generateIR*(graph: ModuleGraph, idgen: IdGenerator, env: MirEnv,
-                 owner: PSym,
-                 body: sink MirBody): Body =
-  ## Generates the ``CgNode`` IR corresponding to the input MIR `body`,
-  ## using `idgen` to provide new IDs when creating symbols.
-  var cl = TranslateCl(graph: graph, idgen: idgen, owner: owner)
-  if owner.kind in routineKinds:
-    # setup the locals and associated mappings for the parameters
-    template add(v: PSym) =
-      let s = v
-      cl.localsMap[s.id] = cl.locals.add initLocal(s)
-
-    let sig =
-      if owner.kind == skMacro: owner.internal
-      else:                     owner.typ
-
-    # result variable:
-    if sig[0].isEmptyType():
-      # always reserve a slot for the result variable, even if the latter is
-      # not present
-      discard cl.locals.add(Local())
-    else:
-      add(owner.ast[resultPos].sym)
-
-    # normal parameters:
-    for i in 1..<sig.len:
-      add(sig.n[i].sym)
-
-    if sig.callConv == ccClosure:
-      # environment parameter
-      add(owner.ast[paramsPos][^1].sym)
-
-  result = Body()
-  result.code = tb(body, env, cl, NodePosition 0)
-  result.locals = cl.locals
diff --git a/compiler/backend/cgirutils.nim b/compiler/backend/cgirutils.nim
index b5f361b401f..f5e0813ffea 100644
--- a/compiler/backend/cgirutils.nim
+++ b/compiler/backend/cgirutils.nim
@@ -59,7 +59,7 @@ proc treeRepr*(n: CgNode): string =
     of cnkMagic:
       result.add "magic: "
       result.add $n.magic
-    of cnkEmpty, cnkInvalid, cnkType, cnkAstLit, cnkNilLit, cnkReturnStmt,
+    of cnkEmpty, cnkInvalid, cnkType, cnkAstLit, cnkNilLit,
        cnkResume:
       discard
     of cnkWithOperand:
diff --git a/compiler/backend/jsbackend.nim b/compiler/backend/jsbackend.nim
index da2d9f132db..6c3cc7e1dbd 100644
--- a/compiler/backend/jsbackend.nim
+++ b/compiler/backend/jsbackend.nim
@@ -115,8 +115,7 @@ proc generateCodeForMain(globals: PGlobals, graph: ModuleGraph, m: BModule,
 
   let owner = m.module
   genTopLevelStmt(globals, m):
-    canonicalize(graph, m.idgen, globals.env, owner, body, TranslationConfig(),
-                 legacy=false)
+    canonicalize(graph, m.idgen, globals.env, owner, body, TranslationConfig())
 
 proc generateCode*(graph: ModuleGraph, mlist: sink ModuleList) =
   ## Entry point into the JS backend. Generates the code for all modules and
diff --git a/compiler/backend/jsgen.nim b/compiler/backend/jsgen.nim
index 1b95ed3c651..cf91e59e97f 100644
--- a/compiler/backend/jsgen.nim
+++ b/compiler/backend/jsgen.nim
@@ -207,14 +207,8 @@ func analyseIfAddressTaken(n: CgNode, addrTaken: var PackedSet[LocalId]) =
   ## that have their address taken in `addrTaken`.
   proc skipAllConv(n: CgNode): CgNode {.nimcall.} =
     var n {.cursor.} = n
-    while true:
-      case n.kind
-      of cnkLvalueConv, cnkObjDownConv, cnkObjUpConv:
-        n = n.operand
-      of cnkStmtListExpr:
-        n = n[^1]
-      else:
-        break
+    while n.kind in {cnkLvalueConv, cnkObjDownConv, cnkObjUpConv}:
+      n = n.operand
 
     result = n
 
@@ -1189,11 +1183,6 @@ proc genAddr(p: PProc, n: CgNode, r: var TCompRes) =
   of cnkObjUpConv, cnkObjDownConv:
     # object up-/down-conversions are no-ops
     genAddr(p, n.operand, r)
-  of cnkStmtListExpr:
-    for i in 0..<n.len-1:
-      genStmt(p, n[i])
-
-    genAddr(p, n[^1], r)
   else:
     internalError(p.config, n.info, "genAddr: " & $n.kind)
 
@@ -2677,8 +2666,8 @@ proc gen(p: PProc, n: CgNode, r: var TCompRes) =
   of cnkJoinStmt, cnkEnd, cnkLoopStmt, cnkContinueStmt:
     discard "terminators or endings for which no special handling is needed"
   of cnkInvalid, cnkMagic, cnkRange, cnkBinding, cnkLeave, cnkTargetList,
-     cnkResume, cnkBranch, cnkAstLit, cnkLabel, cnkStmtListExpr, cnkStmtList,
-     cnkField, cnkLegacyNodes, cnkCaseStmt:
+     cnkResume, cnkBranch, cnkAstLit, cnkLabel, cnkStmtList, cnkCaseStmt,
+     cnkField:
     internalError(p.config, n.info, "gen: unknown node type: " & $n.kind)
 
 proc newModule*(g: ModuleGraph; module: PSym): BModule =
diff --git a/compiler/mir/mirbridge.nim b/compiler/mir/mirbridge.nim
index 19b58d19467..c83a5ef4f33 100644
--- a/compiler/mir/mirbridge.nim
+++ b/compiler/mir/mirbridge.nim
@@ -10,7 +10,6 @@ import
   compiler/backend/[
     cgir,
     cgirgen,
-    cgirgen_legacy,
     cgirutils
   ],
   compiler/front/[
@@ -77,8 +76,7 @@ proc echoOutput*(config: ConfigRef, owner: PSym, body: Body) =
       config.writeln(treeRepr(body.code))
 
 proc canonicalize*(graph: ModuleGraph, idgen: IdGenerator, env: var MirEnv,
-                   owner: PSym, body: PNode, config: TranslationConfig;
-                   legacy=false): Body =
+                   owner: PSym, body: PNode, config: TranslationConfig): Body =
   ## Legacy routine. Translates the body `body` of the procedure `owner` to
   ## MIR code, and the MIR code to ``CgNode`` IR.
   echoInput(graph.config, owner, body)
@@ -87,8 +85,5 @@ proc canonicalize*(graph: ModuleGraph, idgen: IdGenerator, env: var MirEnv,
   echoMir(graph.config, owner, body)
 
   # step 2: generate the ``CgNode`` tree
-  if legacy:
-    result = cgirgen_legacy.generateIR(graph, idgen, env, owner, body)
-  else:
-    result = cgirgen.generateIR(graph, idgen, env, owner, body)
+  result = cgirgen.generateIR(graph, idgen, env, owner, body)
   echoOutput(graph.config, owner, result)
\ No newline at end of file
diff --git a/compiler/vm/vmgen.nim b/compiler/vm/vmgen.nim
index 8aeafa6d87a..fce9c2500b4 100644
--- a/compiler/vm/vmgen.nim
+++ b/compiler/vm/vmgen.nim
@@ -3187,8 +3187,8 @@ proc gen(c: var TCtx; n: CgNode; dest: var TDest) =
   of cnkAsmStmt, cnkEmitStmt:
     unused(c, n, dest)
   of cnkInvalid, cnkMagic, cnkRange, cnkBranch,
-     cnkBinding, cnkLabel, cnkStmtListExpr, cnkField, cnkToSlice,
-     cnkLegacyNodes, cnkResume, cnkTargetList, cnkLeave:
+     cnkBinding, cnkLabel, cnkField, cnkToSlice,
+     cnkResume, cnkTargetList, cnkLeave:
     unreachable(n.kind)
 
 proc initProc(c: TCtx, owner: PSym, body: sink Body): BProc =

From 7fd1110e09ea2b1c34f35f9415b682e618da2f2c Mon Sep 17 00:00:00 2001
From: Clyybber <darkmine956@gmail.com>
Date: Wed, 13 Mar 2024 02:43:29 +0100
Subject: [PATCH 032/169] Unify tree equivalence checking procedures (#1233)

## Summary

Unify tree equivalence checking procedures in the compiler by way of a
template that generates these procedures. This fixes an issue where
differing comments between a forward declaration and its implementation
broke the comparison. It also fixes a bug where VM constant
deduplication ignored differences between node literals that differ
only in their comments.

## Details

* The various tree equivalence checking procedures across the compiler
now all use a common template, `makeTreeEquivalenceProc`.
* `nkCommentStmt` nodes' equality is now **ignored** in
`exprStructuralEquivalent` and `exprStructuralEquivalentStrictSym`,
fixing an issue where differing comments could prevent matching forward
declarations; see the test added in
`tests/lang_callable/generics/tforwardgeneric.nim`
* `nkCommentStmt` nodes' equality is now **checked for** in
`cmpNodeCnst`, fixing an issue where constants containing NimNodes were
incorrectly deduplicated; see the test added in
`tests/lang_callable/macros/tmacros_various.nim`
* Removed `trees.sameTree`, as it was dead code
* Added comments explaining preexisting issues with `nkFloatLiterals`
and `nkNimNodeLit` equality checking

---------

Co-authored-by: Saem Ghani <saemghani+github@gmail.com>
Co-authored-by: zerbina <100542850+zerbina@users.noreply.github.com>
---
 compiler/ast/trees.nim                        | 110 +++++++++---------
 compiler/ast/types.nim                        |   6 +
 compiler/backend/cbackend.nim                 |   2 +-
 compiler/ic/replayer.nim                      |   4 +-
 compiler/sem/guards.nim                       |  33 ++----
 compiler/sem/patterns.nim                     |  26 ++---
 compiler/sem/procfind.nim                     |   1 +
 compiler/sem/semfold.nim                      |   2 +-
 compiler/vm/vm.nim                            |   5 +-
 compiler/vm/vmcompilerserdes.nim              |   2 +-
 compiler/vm/vmgen.nim                         |  33 ++----
 .../generics/tforwardgeneric.nim              |  18 ++-
 .../lang_callable/macros/tmacros_various.nim  |  18 +++
 13 files changed, 134 insertions(+), 126 deletions(-)

diff --git a/compiler/ast/trees.nim b/compiler/ast/trees.nim
index da324808325..317ec8896e7 100644
--- a/compiler/ast/trees.nim
+++ b/compiler/ast/trees.nim
@@ -44,61 +44,63 @@ proc sameFloatIgnoreNan(a, b: BiggestFloat): bool {.inline.} =
   ## ignores NaN semantics, but ensures 0.0 == -0.0, see #13730
   cast[uint64](a) == cast[uint64](b) or a == b
 
-proc exprStructuralEquivalent*(a, b: PNode; strictSymEquality=false): bool =
-  if a == b:
-    result = true
-  elif (a != nil) and (b != nil) and (a.kind == b.kind):
-    case a.kind
-    of nkSym:
-      if strictSymEquality:
-        result = a.sym == b.sym
-      else:
-        # don't go nuts here: same symbol as string is enough:
-        result = a.sym.name.id == b.sym.name.id
-    of nkIdent: result = a.ident.id == b.ident.id
-    of nkIntLiterals: result = a.intVal == b.intVal
-    of nkFloatLiterals: result = sameFloatIgnoreNan(a.floatVal, b.floatVal)
-    of nkStrLiterals: result = a.strVal == b.strVal
-    of nkCommentStmt: result = a.comment == b.comment
-    of nkEmpty, nkNilLit, nkType: result = true
-    of nkError:
-      unreachable()
-    of nkWithSons:
-      if a.len == b.len:
-        for i in 0..<a.len:
-          if not exprStructuralEquivalent(a[i], b[i],
-                                          strictSymEquality): return
-        result = true
+template makeTreeEquivalenceProc*(
+  name, relaxedKindCheck, symCheck, floatCheck, typeCheck, commentCheck) {.dirty.} =
+  ## Defines a tree equivalence checking procedure.
+  ## This skeleton is shared between all recursive
+  ## `PNode` equivalence checks in the compiler code base
+  ## It might be possible to unify more of them with each other.
+  proc name(a, b: PNode): bool =
+    result = false
+    if a == b:
+      result = true
+    elif a != nil and b != nil and (a.kind == b.kind or relaxedKindCheck):
+      case a.kind
+      of nkError:           unreachable()
+      of nkEmpty, nkNilLit: result = true
+      of nkSym:             result = symCheck
+      of nkIdent:           result = a.ident.id == b.ident.id
+      of nkIntLiterals:     result = a.intVal == b.intVal
+      of nkFloatLiterals:   result = floatCheck
+        # XXX: Using float equality, even if partially tamed through
+        #      sameFloatIgnoreNan, causes inconsistencies due to it
+        #      lacking the substition and reflexivity property.
+      of nkStrLiterals:     result = a.strVal == b.strVal
+      of nkType:            result = typeCheck
+      of nkCommentStmt:     result = commentCheck
+      # XXX: nkNimNodeLit should probably always be checked strictly.
+      of nkWithSons:
+        if a.len == b.len:
+          for i in 0..<a.len:
+            if not name(a[i], b[i]): return false
+          result = true
 
-proc sameTree*(a, b: PNode): bool =
-  if a == b:
-    result = true
-  elif a != nil and b != nil and a.kind == b.kind:
-    if a.flags != b.flags: return
-    if a.info.line != b.info.line: return
-    if a.info.col != b.info.col:
-      return                  #if a.info.fileIndex <> b.info.fileIndex then exit;
-    case a.kind
-    of nkSym:
-      # don't go nuts here: same symbol as string is enough:
-      result = a.sym.name.id == b.sym.name.id
-    of nkIdent: result = a.ident.id == b.ident.id
-    of nkIntLiterals:
-      result = a.intVal == b.intVal and
-               a.intLitBase == b.intLitBase
-    of nkFloatLiterals:
-      result = sameFloatIgnoreNan(a.floatVal, b.floatVal) and
-               a.floatLitBase == b.floatLitBase
-    of nkStrLiterals: result = a.strVal == b.strVal
-    of nkCommentStmt: result = a.comment == b.comment
-    of nkEmpty, nkNilLit, nkType: result = true
-    of nkError:
-      unreachable()
-    of nkWithSons:
-      if a.len == b.len:
-        for i in 0..<a.len:
-          if not sameTree(a[i], b[i]): return
-        result = true
+makeTreeEquivalenceProc(exprStructuralEquivalent,
+  relaxedKindCheck = false,
+  symCheck     = a.sym.name.id == b.sym.name.id, # same symbol as string is enough
+  floatCheck   = sameFloatIgnoreNan(a.floatVal, b.floatVal),
+  typeCheck    = true,
+  commentCheck = true
+)
+export exprStructuralEquivalent
+
+makeTreeEquivalenceProc(exprStructuralEquivalentStrictSym,
+  relaxedKindCheck = false,
+  symCheck     = a.sym == b.sym,
+  floatCheck   = sameFloatIgnoreNan(a.floatVal, b.floatVal),
+  typeCheck    = true,
+  commentCheck = true
+)
+export exprStructuralEquivalentStrictSym
+
+makeTreeEquivalenceProc(exprStructuralEquivalentStrictSymAndComm,
+  relaxedKindCheck = false,
+  symCheck     = a.sym == b.sym,
+  floatCheck   = sameFloatIgnoreNan(a.floatVal, b.floatVal),
+  typeCheck    = true,
+  commentCheck = a.comment == b.comment
+)
+export exprStructuralEquivalentStrictSymAndComm
 
 proc getMagic*(op: PNode): TMagic =
   if op == nil: return mNone
diff --git a/compiler/ast/types.nim b/compiler/ast/types.nim
index 4479cb96d37..92e7b05be53 100644
--- a/compiler/ast/types.nim
+++ b/compiler/ast/types.nim
@@ -652,6 +652,10 @@ proc sameTypeOrNil*(a, b: PType, flags: TTypeCmpFlags = {}): bool =
     else: result = sameType(a, b, flags)
 
 proc equalParam(a, b: PSym): TParamsEquality =
+  ## Returns whether parameters `a` and `b` are considered equal.
+  ## Note that this operation is not commutative, so when comparing
+  ## a forward declaration to an implementation, ensure `a` is the
+  ## param from the forward declaration.
   if sameTypeOrNil(a.typ, b.typ, {ExactTypeDescValues}) and
       exprStructuralEquivalent(a.constraint, b.constraint):
     if a.ast == b.ast:
@@ -660,6 +664,8 @@ proc equalParam(a, b: PSym): TParamsEquality =
       if exprStructuralEquivalent(a.ast, b.ast): result = paramsEqual
       else: result = paramsIncompatible
     elif a.ast != nil:
+      # This means default values for parameters don't have to be
+      # repeated when the proc was forward declared
       result = paramsEqual
     elif b.ast != nil:
       result = paramsIncompatible
diff --git a/compiler/backend/cbackend.nim b/compiler/backend/cbackend.nim
index 45e7aeb5bc4..4e9d34bb1bb 100644
--- a/compiler/backend/cbackend.nim
+++ b/compiler/backend/cbackend.nim
@@ -503,4 +503,4 @@ proc generateCode*(graph: ModuleGraph, g: BModuleList, mlist: sink ModuleList) =
     # code generation for the module is done; its C code will not change
     # anymore beyond this point
     # future direction: this part is going to be turned into an iterator
-    # yielding the C file's content
\ No newline at end of file
+    # yielding the C file's content
diff --git a/compiler/ic/replayer.nim b/compiler/ic/replayer.nim
index 6c8f1a1cd16..44f44ec0adf 100644
--- a/compiler/ic/replayer.nim
+++ b/compiler/ic/replayer.nim
@@ -101,7 +101,7 @@ proc replayStateChanges*(module: PSym; g: ModuleGraph) =
         else:
           block search:
             for existing in g.cacheSeqs[destKey]:
-              if exprStructuralEquivalent(existing, val, strictSymEquality = true):
+              if exprStructuralEquivalentStrictSymAndComm(existing, val):
                 break search
             g.cacheSeqs[destKey].add val
       of "add":
@@ -193,4 +193,4 @@ proc replayLibs*(g: ModuleGraph, module: int) =
   if module >= g.libs.len:
     g.libs.setLen(module + 1)
 
-  g.libs[module] = loadLibs(g.config, g.cache, g.packed, module)
\ No newline at end of file
+  g.libs[module] = loadLibs(g.config, g.cache, g.packed, module)
diff --git a/compiler/sem/guards.nim b/compiler/sem/guards.nim
index 74c1c838609..2d3f31f6652 100644
--- a/compiler/sem/guards.nim
+++ b/compiler/sem/guards.nim
@@ -441,30 +441,15 @@ proc sameOpr(a, b: PSym): bool =
   of someDiv: result = b.magic in someDiv
   else: result = a == b
 
-proc sameTree*(a, b: PNode): bool =
-  result = false
-  if a == b:
-    result = true
-  elif a != nil and b != nil and a.kind == b.kind:
-    case a.kind
-    of nkError:
-      unreachable()
-    of nkSym:
-      result = a.sym == b.sym
-      if not result and a.sym.magic != mNone:
-        result = a.sym.magic == b.sym.magic or sameOpr(a.sym, b.sym)
-    of nkIdent: result = a.ident.id == b.ident.id
-    of nkIntLiterals: result = a.intVal == b.intVal
-    of nkFloatLiterals: result = a.floatVal == b.floatVal
-    of nkStrLiterals: result = a.strVal == b.strVal
-    of nkType: result = a.typ == b.typ
-    of nkEmpty, nkNilLit, nkCommentStmt:
-      result = true # Ignore comments
-    of nkWithSons:
-      if a.len == b.len:
-        for i in 0..<a.len:
-          if not sameTree(a[i], b[i]): return
-        result = true
+makeTreeEquivalenceProc(sameTree,
+  relaxedKindCheck = false,
+  symCheck     = sameOpr(a.sym, b.sym) or
+    (a.sym.magic != mNone and a.sym.magic == b.sym.magic),
+  floatCheck   = a.floatVal == b.floatVal,
+  typeCheck    = a.typ == b.typ,
+  commentCheck = true # ignore comments
+)
+export sameTree
 
 proc hasSubTree(n, x: PNode): bool =
   if n.sameTree(x): result = true
diff --git a/compiler/sem/patterns.nim b/compiler/sem/patterns.nim
index 391f19b2f9e..dead41b9ab9 100644
--- a/compiler/sem/patterns.nim
+++ b/compiler/sem/patterns.nim
@@ -60,24 +60,14 @@ proc canonKind(n: PNode): TNodeKind =
 proc sameKinds(a, b: PNode): bool {.inline.} =
   result = a.kind == b.kind or a.canonKind == b.canonKind
 
-proc sameTrees*(a, b: PNode): bool =
-  if sameKinds(a, b):
-    case a.kind
-    of nkSym: result = a.sym == b.sym
-    of nkIdent: result = a.ident.id == b.ident.id
-    of nkIntLiterals: result = a.intVal == b.intVal
-    of nkFloatLiterals: result = a.floatVal == b.floatVal
-    of nkStrLiterals: result = a.strVal == b.strVal
-    of nkError:
-      unreachable()
-    of nkEmpty, nkNilLit, nkCommentStmt:
-      result = true # Ignore comments
-    of nkType: result = sameTypeOrNil(a.typ, b.typ)
-    of nkWithSons:
-      if a.len == b.len:
-        for i in 0..<a.len:
-          if not sameTrees(a[i], b[i]): return
-        result = true
+makeTreeEquivalenceProc(sameTrees,
+  relaxedKindCheck = sameKinds(a, b),
+  symCheck     = a.sym == b.sym,
+  floatCheck   = a.floatVal == b.floatVal,
+  typeCheck    = sameTypeOrNil(a.typ, b.typ),
+  commentCheck = true # Ignore comments
+)
+export sameTrees
 
 proc inSymChoice(sc, x: PNode): bool =
   if sc.kind == nkClosedSymChoice:
diff --git a/compiler/sem/procfind.nim b/compiler/sem/procfind.nim
index cd8f4609cc3..2b47f60f909 100644
--- a/compiler/sem/procfind.nim
+++ b/compiler/sem/procfind.nim
@@ -58,6 +58,7 @@ proc searchForProcAux(c: PContext, scope: PScope, fn: PSym): PSym =
         return
       of paramsIncompatible:
         localReport(c.config, fn.info, reportSym(rsemAmbiguousCall, fn))
+          # TODO: Should be rsemDefaultParamIsIncompatible
 
         return
       of paramsNotEqual:
diff --git a/compiler/sem/semfold.nim b/compiler/sem/semfold.nim
index 875f6f3fd6e..7a1125f3da2 100644
--- a/compiler/sem/semfold.nim
+++ b/compiler/sem/semfold.nim
@@ -379,7 +379,7 @@ proc evalOp*(m: TMagic, n, a, b, c: PNode; idgen: IdGenerator; g: ModuleGraph):
     result.typ = n.typ
   of mEqProc:
     result = newIntNodeT(toInt128(ord(
-        exprStructuralEquivalent(a, b, strictSymEquality=true))), n, idgen, g)
+        exprStructuralEquivalentStrictSym(a, b))), n, idgen, g)
   else: discard
 
 proc getConstIfExpr(c: PSym, n: PNode; idgen: IdGenerator; g: ModuleGraph): PNode =
diff --git a/compiler/vm/vm.nim b/compiler/vm/vm.nim
index f36289117fa..67301e53a1c 100644
--- a/compiler/vm/vm.nim
+++ b/compiler/vm/vm.nim
@@ -1550,8 +1550,7 @@ proc rawExecute(c: var TCtx, t: var VmThread, pc: var int): YieldReason =
     of opcEqNimNode:
       decodeBC(rkInt)
       regs[ra].intVal =
-        ord(exprStructuralEquivalent(regs[rb].nimNode, regs[rc].nimNode,
-                                     strictSymEquality=true))
+        ord(exprStructuralEquivalentStrictSymAndComm(regs[rb].nimNode, regs[rc].nimNode))
     of opcSameNodeType:
       decodeBC(rkInt)
       # TODO: Look into me!
@@ -2841,7 +2840,7 @@ proc rawExecute(c: var TCtx, t: var VmThread, pc: var int): YieldReason =
       else:
         block search:
           for existing in g.cacheSeqs[destKey]:
-            if exprStructuralEquivalent(existing, val, strictSymEquality=true):
+            if exprStructuralEquivalentStrictSymAndComm(existing, val):
               break search
           g.cacheSeqs[destKey].add val
       recordIncl(c, c.debug[pc], destKey, val)
diff --git a/compiler/vm/vmcompilerserdes.nim b/compiler/vm/vmcompilerserdes.nim
index ae3bda4ab40..0a58623284c 100644
--- a/compiler/vm/vmcompilerserdes.nim
+++ b/compiler/vm/vmcompilerserdes.nim
@@ -25,7 +25,7 @@ import
 
 # XXX: the function signatures are a bit cumbersome here
 
-from compiler/ast/trees import exprStructuralEquivalent, cyclicTree
+from compiler/ast/trees import cyclicTree
 
 const SkipSet = abstractRange + {tyStatic} - {tyTypeDesc}
 
diff --git a/compiler/vm/vmgen.nim b/compiler/vm/vmgen.nim
index fce9c2500b4..31ccf2a6f19 100644
--- a/compiler/vm/vmgen.nim
+++ b/compiler/vm/vmgen.nim
@@ -40,7 +40,8 @@ import
     renderer,
     types,
     ast,
-    lineinfos
+    lineinfos,
+    trees
   ],
   compiler/backend/[
     cgir
@@ -807,26 +808,16 @@ template cmpFloatRep(a, b: BiggestFloat): bool =
   # if a.floatVal == 0.0: result = cast[uint64](a.floatVal) == cast[uint64](b.floatVal)
   # else: result = a.floatVal == b.floatVal
 
-func cmpNodeCnst(a, b: PNode): bool {.inline.} =
-  ## Compares two trees for structural equality, also taking the type of
-  ## ``nkType`` nodes into account. This procedure is used to prevent the same
-  ## AST from being added as a node constant more than once
-  if a == b:
-    return true
-  elif a.kind == b.kind:
-    case a.kind
-    of nkSym:           result = a.sym == b.sym
-    of nkIdent:         result = a.ident.id == b.ident.id
-    of nkEmpty:         result = true
-    of nkType:          result = a.typ == b.typ
-    of nkStrKinds:      result = a.strVal == b.strVal
-    of nkIntKinds:      result = a.intVal == b.intVal
-    of nkFloatLiterals: result = cmpFloatRep(a.floatVal, b.floatVal)
-    else:
-      if a.len == b.len:
-        for i in 0..<a.len:
-          if not cmpNodeCnst(a[i], b[i]): return
-        result = true
+# Compares two trees for structural equality, also taking the type of
+# ``nkType`` nodes into account. This procedure is used to prevent the same
+# AST from being added as a node constant more than once
+makeTreeEquivalenceProc(cmpNodeCnst,
+  relaxedKindCheck = false,
+  symCheck     = a.sym == b.sym,
+  floatCheck   = cmpFloatRep(a.floatVal, b.floatVal),
+  typeCheck    = a.typ == b.typ,
+  commentCheck = a.comment == b.comment
+)
 
 template makeCnstFunc(name, vType, aKind, valName, cmp) {.dirty.} =
   proc name(c: var TCtx, val: vType): int =
diff --git a/tests/lang_callable/generics/tforwardgeneric.nim b/tests/lang_callable/generics/tforwardgeneric.nim
index 953b301ed57..cfdb9535085 100644
--- a/tests/lang_callable/generics/tforwardgeneric.nim
+++ b/tests/lang_callable/generics/tforwardgeneric.nim
@@ -34,4 +34,20 @@ block unresolved_generic_param_in_body:
   forwarded[int]()
 
   proc forwarded[T]() = # complete the definition
-    doAssert ($T) == "int"
\ No newline at end of file
+    doAssert ($T) == "int"
+
+# Differing comments must not prevent forward declaration
+template noop(a: untyped): untyped = a
+
+proc comm[T](arg = ( noop (;
+    ## comment
+    true
+  )
+ ) )
+proc comm[T](arg = ( noop (;
+    ## this comment is different
+    true
+  )
+ ) ) = discard
+
+comm[bool](true)
diff --git a/tests/lang_callable/macros/tmacros_various.nim b/tests/lang_callable/macros/tmacros_various.nim
index 056246caaec..5d7d62dffb1 100644
--- a/tests/lang_callable/macros/tmacros_various.nim
+++ b/tests/lang_callable/macros/tmacros_various.nim
@@ -10,6 +10,8 @@ Infix
       Ident "cint"
   NilLit
 macrocache ok
+CommentStmt "comment 1"
+CommentStmt "comment 2"
 '''
 
   output: '''
@@ -328,3 +330,19 @@ block: # bug #15118
 
   block:
     flop("b")
+
+block:
+  # Ensure nkCommentStmt equality is not ignored when vmgen.cmpNodeCnst
+  # is used to deduplicate NimNode constants, so that `CommentStmt "comment 2"`
+  # is not counted as a duplicate of `CommentStmt "comment 1"` and
+  # incorrectly optimized to point at the `Comment "comment 1"` node
+
+  proc createComment(s: string): NimNode =
+    result = nnkCommentStmt.newNimNode()
+    result.strVal = s
+
+  const C1 = (1, createComment("comment 1"))
+  const C2 = (1, createComment("comment 2"))
+  static:
+    echo treeRepr(C1[1])
+    echo treeRepr(C2[1])

From a4a32d586de88b10dc69bd5063f2a0bea1c992f1 Mon Sep 17 00:00:00 2001
From: Nixfreak <nixfreak@gmail.com>
Date: Wed, 13 Mar 2024 10:59:33 -0500
Subject: [PATCH 033/169] Link to `style_guide.html` in `intern.rst` (#1050)

## Summary

`nep1.html` was renamed to `style_guide.html`, but the reference
to it in `intern.rst` wasn't updated, resulting in a broken link.
This is fixed now.

---------

Co-authored-by: Clyybber <darkmine956@gmail.com>
Co-authored-by: zerbina <100542850+zerbina@users.noreply.github.com>
---
 doc/intern.rst | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/doc/intern.rst b/doc/intern.rst
index f8bb074e456..f71c7b10c8d 100644
--- a/doc/intern.rst
+++ b/doc/intern.rst
@@ -250,7 +250,7 @@ The new runtime is active `when defined(nimV2)`.
 Coding Guidelines
 =================
 
-* We follow |NimSkull|'s official style guide, see `<nep1.html>`_.
+* We follow |NimSkull|'s official style guide, see `<style_guide.html>`_.
 * Max line length is 100 characters.
 * Provide spaces around binary operators if that enhances readability.
 * Use a space after a colon, but not before it.

From 5fd1189f63378363723cc021d630da79d72b3020 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Wed, 13 Mar 2024 20:22:16 +0100
Subject: [PATCH 034/169] std/dynlib: fix `loadLibPatterns` having unknown
 effects (#1237)

## Summary

The `loadLibPattern` procedure was erroneously inferred to have
unknown effects (`RootEffect`), making it unusable in `.tags: []`
procedures. This is now fixed.

## Details

`loadLibPattern` calls `loadLib`, which is only forward-declared at
that point, so effect inference falls back to assuming that
`loadLibPattern` can have unknown effects.

Since `loadLib`, as well as the other forward-declared procedures,
don't have effects in practice, this is now explicitly specified
on the forward declarations.
---
 lib/pure/dynlib.nim      | 10 ++++++----
 tests/stdlib/tdynlib.nim | 21 +++++++++++++++++++++
 2 files changed, 27 insertions(+), 4 deletions(-)
 create mode 100644 tests/stdlib/tdynlib.nim

diff --git a/lib/pure/dynlib.nim b/lib/pure/dynlib.nim
index 6c6c11ac12c..df950709fea 100644
--- a/lib/pure/dynlib.nim
+++ b/lib/pure/dynlib.nim
@@ -48,22 +48,24 @@ import std/strutils
 type
   LibHandle* = pointer ## A handle to a dynamically loaded library.
 
-proc loadLib*(path: string, globalSymbols = false): LibHandle {.gcsafe.}
+{.pragma: noeffects, gcsafe, raises: [], tags: [].}
+
+proc loadLib*(path: string, globalSymbols = false): LibHandle {.noeffects.}
   ## Loads a library from `path`. Returns nil if the library could not
   ## be loaded.
 
-proc loadLib*(): LibHandle {.gcsafe.}
+proc loadLib*(): LibHandle {.noeffects.}
   ## Gets the handle from the current executable. Returns nil if the
   ## library could not be loaded.
 
-proc unloadLib*(lib: LibHandle) {.gcsafe.}
+proc unloadLib*(lib: LibHandle) {.noeffects.}
   ## Unloads the library `lib`.
 
 proc raiseInvalidLibrary*(name: cstring) {.noinline, noreturn.} =
   ## Raises a `LibraryError` exception.
   raise newException(LibraryError, "could not find symbol: " & $name)
 
-proc symAddr*(lib: LibHandle, name: cstring): pointer {.gcsafe.}
+proc symAddr*(lib: LibHandle, name: cstring): pointer {.noeffects.}
   ## Retrieves the address of a procedure/variable from `lib`. Returns nil
   ## if the symbol could not be found.
 
diff --git a/tests/stdlib/tdynlib.nim b/tests/stdlib/tdynlib.nim
new file mode 100644
index 00000000000..6eb3713670d
--- /dev/null
+++ b/tests/stdlib/tdynlib.nim
@@ -0,0 +1,21 @@
+discard """
+  targets: c
+  action: compile
+"""
+
+import std/dynlib
+
+# ensure that the dynlib procedures are GC safe and don't have effects
+proc dynlibProcsHaveNoEffects1() {.gcsafe, raises: [], tags: [].} =
+  discard loadLib("")
+  discard loadLib()
+  unloadLib(nil)
+  discard symAddr(nil, nil)
+
+  var candidates: seq[string]
+  libCandidates("", candidates)
+
+  discard loadLibPattern("")
+
+proc dynlibProcsHaveNoEffects2() {.gcsafe, tags: [].} =
+  discard checkedSymAddr(nil, nil)

From ae89c1099e1b83ca351c2cdde1808192b94cc9bd Mon Sep 17 00:00:00 2001
From: Clyybber <darkmine956@gmail.com>
Date: Fri, 15 Mar 2024 00:43:18 +0100
Subject: [PATCH 035/169] CI: Workaround leak sanitizer test failures due to
 high `vm.mmap_rnd_bits`  (#1242)

## Summary
Works around a leak sanitizer crash that occurs when `vm.mmap_rnd_bits`
is 32 bits by setting it to 28. The crash currently blocks all CI runs.

See https://github.com/actions/runner-images/issues/9491
---
 .github/workflows/leak.yml | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/.github/workflows/leak.yml b/.github/workflows/leak.yml
index 169955b98bd..753c6af9458 100644
--- a/.github/workflows/leak.yml
+++ b/.github/workflows/leak.yml
@@ -14,6 +14,10 @@ jobs:
     runs-on: ubuntu-latest
 
     steps:
+      - name: Decrease kernel address randomization
+        # Works around https://github.com/actions/runner-images/issues/9491
+        run: sudo sysctl vm.mmap_rnd_bits=28
+
       - uses: actions/checkout@v4
         with:
           fetch-depth: 0

From 82b3cea69c3c4ab36ff509d7809f4df1f3f8fa5f Mon Sep 17 00:00:00 2001
From: alaviss <leorize+oss@disroot.org>
Date: Thu, 14 Mar 2024 22:21:45 -0500
Subject: [PATCH 036/169] ci: pin Xcode and macOS SDK version (#1244)

## Summary
Recently we have seen an excessive amount of reproducibility failures
due to differences in SDK version between M1 jobs.

This PR pins both the Xcode version and the macOS SDK version to avoid
fluctuations caused by runner updates.

## Details
* M1 jobs appear to be flip-flopping between two macOS SDK versions:
14.0 and 14.2. This was found through manual analysis of the resulting
binaries with `llvm-otool`.
* GitHub's documentation suggests that a new 20240219 version of the M1
runner is still being rolled out. While the changelog does not show any
differences in Xcode configuration, we do observe these changes via our
reproducibility tests.
* GitHub's documentation also outlines that several SDK versions are
available, including 14.0 and 14.2. My speculation is that 14.2 was made
the default (either accidentally or intentionally) during the runner
updates. As such, pin the SDK back to 14.0 to remove this variable.

Fixes https://github.com/nim-works/nimskull/issues/1231
---
 .github/workflows/ci.yml | 60 ++++++++++++++++++++++++++++++++++++++++
 1 file changed, 60 insertions(+)

diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
index 254b7d74c39..6d3f31af1a3 100644
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@@ -155,6 +155,18 @@ jobs:
           Invoke-WebRequest https://curl.se/ca/cacert.pem -OutFile (Join-Path $binPath "cacert.pem")
         shell: pwsh
 
+      - name: Set Xcode version (macOS M1)
+        if: runner.os == 'macOS' && runner.arch == 'ARM64'
+        uses: maxim-lobanov/setup-xcode@v1
+        with:
+          xcode-version: "15.0.1"
+
+      - name: Set macOS SDK version (macOS M1)
+        if: runner.os == 'macOS' && runner.arch == 'ARM64'
+        run: |
+          sdkpath=$(xcrun --sdk macosx14.0 --show-sdk-path)
+          echo "SDKROOT=$sdkpath" >> "$GITHUB_ENV"
+
       - name: Build release binaries
         run: ./koch.py all-strict
 
@@ -207,6 +219,18 @@ jobs:
           sudo apt-get update
           sudo apt-get install "${deps[@]}"
 
+      - name: Set Xcode version (macOS M1)
+        if: runner.os == 'macOS' && runner.arch == 'ARM64'
+        uses: maxim-lobanov/setup-xcode@v1
+        with:
+          xcode-version: "15.0.1"
+
+      - name: Set macOS SDK version (macOS M1)
+        if: runner.os == 'macOS' && runner.arch == 'ARM64'
+        run: |
+          sdkpath=$(xcrun --sdk macosx14.0 --show-sdk-path)
+          echo "SDKROOT=$sdkpath" >> "$GITHUB_ENV"
+
       - name: Install dependencies (macOS)
         if: runner.os == 'macOS'
         run: |
@@ -259,6 +283,18 @@ jobs:
           $binPath | Out-File -Append $env:GITHUB_PATH
         shell: pwsh
 
+      - name: Set Xcode version (macOS M1)
+        if: runner.os == 'macOS' && runner.arch == 'ARM64'
+        uses: maxim-lobanov/setup-xcode@v1
+        with:
+          xcode-version: "15.0.1"
+
+      - name: Set macOS SDK version (macOS M1)
+        if: runner.os == 'macOS' && runner.arch == 'ARM64'
+        run: |
+          sdkpath=$(xcrun --sdk macosx14.0 --show-sdk-path)
+          echo "SDKROOT=$sdkpath" >> "$GITHUB_ENV"
+
       - uses: ./.github/actions/download-compiler
 
       - name: Enable annotations
@@ -333,6 +369,18 @@ jobs:
         if: runner.os == 'Windows'
         uses: ./git-src/.github/actions/setup-mingw
 
+      - name: Set Xcode version (macOS M1)
+        if: runner.os == 'macOS' && runner.arch == 'ARM64'
+        uses: maxim-lobanov/setup-xcode@v1
+        with:
+          xcode-version: "15.0.1"
+
+      - name: Set macOS SDK version (macOS M1)
+        if: runner.os == 'macOS' && runner.arch == 'ARM64'
+        run: |
+          sdkpath=$(xcrun --sdk macosx14.0 --show-sdk-path)
+          echo "SDKROOT=$sdkpath" >> "$GITHUB_ENV"
+
       - name: Download source archive
         uses: actions/download-artifact@v4
         with:
@@ -458,6 +506,18 @@ jobs:
           Copy-Item (Join-Path $binPath "libpcre.dll") -Destination bin
         shell: pwsh
 
+      - name: Set Xcode version (macOS M1)
+        if: runner.os == 'macOS' && runner.arch == 'ARM64'
+        uses: maxim-lobanov/setup-xcode@v1
+        with:
+          xcode-version: "15.0.1"
+
+      - name: Set macOS SDK version (macOS M1)
+        if: runner.os == 'macOS' && runner.arch == 'ARM64'
+        run: |
+          sdkpath=$(xcrun --sdk macosx14.0 --show-sdk-path)
+          echo "SDKROOT=$sdkpath" >> "$GITHUB_ENV"
+
       # Note: keep synchronized with source_binaries job
       - name: Build docs
         run: |

From 0ecf9a8ed0deef2e54f860d0e3c347bf58fd716a Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Fri, 15 Mar 2024 05:07:08 +0100
Subject: [PATCH 037/169] internal: fix an incorrect assertion (#1241)

## Summary

An assertion in the `injectdestructors` module was incorrect, which led
to the compiler aborting on `x.a = f()` assignments, where `a` is a
discriminator field.

## Details

Only raw lvalue expressions must not appear as the source operand of a
branch-switch assignment; rvalue expressions (which aren't included in
`ModifierNodes`) are okay.
---
 compiler/sem/injectdestructors.nim | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/compiler/sem/injectdestructors.nim b/compiler/sem/injectdestructors.nim
index b51ff3643cb..8b5330280f1 100644
--- a/compiler/sem/injectdestructors.nim
+++ b/compiler/sem/injectdestructors.nim
@@ -794,7 +794,9 @@ proc lowerBranchSwitch(bu: var MirBuilder, body: MirTree, graph: ModuleGraph,
     typ = body[target].field.typ
 
   assert body[target].kind == mnkPathVariant
-  assert body[stmt, 1].kind in ModifierNodes
+  # the source expression must either be an rvalue, or there must be a
+  # modifier present
+  assert body[stmt, 1].kind notin LvalueExprKinds
 
   let
     a = bu.wrapMutAlias(typ):

From 87e282a14648f1d3ed9e43298a82792b37ff4891 Mon Sep 17 00:00:00 2001
From: Clyybber <darkmine956@gmail.com>
Date: Fri, 15 Mar 2024 05:08:09 +0100
Subject: [PATCH 038/169] sem: remove float analysis from `sem/guards` (#1240)

## Summary

Remove float analysis from `sem/guards` since it's currently unsound.

## Details

`sem/guards` is only used for static bounds checking
(`--staticBoundChecks`), `not nil` checking, warning for checked field
accesses (`--warning:ProveField`), and accesses of fields annotated
with `{.guard: ...}`.
Since object variants with a `float` discriminator are invalid and
bound checks only concern integers, only conversions to float range
types would be affected under `--staticBoundChecks`.

It's not clear whether the analysis method used here can work with
floats without special treatment in a lot of cases, because float
equality lacks the substitution and reflexivity properties and the
comparison relations are not total.

---------

Co-authored-by: Saem Ghani <saemghani+github@gmail.com>
---
 compiler/sem/guards.nim | 24 ++++++++++++++++++------
 1 file changed, 18 insertions(+), 6 deletions(-)

diff --git a/compiler/sem/guards.nim b/compiler/sem/guards.nim
index 2d3f31f6652..bca5b672e4d 100644
--- a/compiler/sem/guards.nim
+++ b/compiler/sem/guards.nim
@@ -39,14 +39,22 @@ from compiler/ast/reports_sem import reportAst,
 from compiler/ast/report_enums import ReportKind
 
 const
-  someEq = {mEqI, mEqF64, mEqEnum, mEqCh, mEqB, mEqRef, mEqProc,
+  # Float operations are not analysed as
+  # it is currently unclear whether they
+  # can be analysed in a sound manner
+  # with the approach used here
+  someEq = {mEqI, mEqEnum, mEqCh, mEqB, mEqRef, mEqProc,
     mEqStr, mEqSet, mEqCString}
+    # `mEqF64` excluded here as it lacks the
+    # substition and reflexivity property
 
   # set excluded here as the semantics are vastly different:
-  someLe = {mLeI, mLeF64, mLeU, mLeEnum,
+  someLe = {mLeI, mLeU, mLeEnum,
             mLeCh, mLeB, mLePtr, mLeStr}
+    # `mLeF64` excluded here since it's not a total order
   someLt = {mLtI, mLtF64, mLtU, mLtEnum,
             mLtCh, mLtB, mLtPtr, mLtStr}
+    # `mLtF64` excluded here since it's not a strict total order
 
   someLen = {mLengthOpenArray, mLengthStr, mLengthArray, mLengthSeq}
 
@@ -55,10 +63,14 @@ const
   someHigh = {mHigh}
   # we don't list unsigned here because wrap around semantics suck for
   # proving anything:
-  someAdd = {mAddI, mAddF64, mSucc}
-  someSub = {mSubI, mSubF64, mPred}
-  someMul = {mMulI, mMulF64}
-  someDiv = {mDivI, mDivF64}
+  someAdd = {mAddI, mSucc}
+    # No `mAddF64` since float ops aren't analysed
+  someSub = {mSubI, mPred}
+    # No `mSubF64` since float ops aren't analysed
+  someMul = {mMulI}
+    # No `mMulF64` since float ops aren't analysed
+  someDiv = {mDivI}
+    # No `mDivF64` since float ops aren't analysed
   someMax = {mMaxI}
   someMin = {mMinI}
   someBinaryOp = someAdd+someSub+someMul+someMax+someMin

From 9549d7e455b3dffb81b118afbc08ad49ab9d5d81 Mon Sep 17 00:00:00 2001
From: Saem Ghani <saemghani+github@gmail.com>
Date: Thu, 14 Mar 2024 21:08:36 -0700
Subject: [PATCH 039/169] std/macros: const for nodes requiring special init
 (#1239)

## Summary

Introduce a constant `nnkRequireInitKinds` for all node kinds that
require special initialization, and therefore cannot be constructed via
`newNimNode`. This allows code importing `std/macros` that constructs
arbitrary nodes to filter out those kinds.

## Details

Added the exported constant to `std/macros`, as well as a test in
`tmacros` ensuring that every node kind not in the set can be created
via `newNimNode`.
---
 lib/core/macros.nim                                   |  4 ++++
 .../defer/tdefer_malformed_many_children.nim          |  2 +-
 tests/stdlib/metaprogramming/tmacros.nim              | 11 +++++++++++
 3 files changed, 16 insertions(+), 1 deletion(-)

diff --git a/lib/core/macros.nim b/lib/core/macros.nim
index 40d9efba1ff..9cbbba59394 100644
--- a/lib/core/macros.nim
+++ b/lib/core/macros.nim
@@ -149,9 +149,13 @@ type
 
 const
   nnkLiterals* = {nnkCharLit..nnkNilLit}
+    ## `NimNodeKind`s that represent syntax literals
   nnkCallKinds* = {nnkCall, nnkInfix, nnkPrefix, nnkPostfix, nnkCommand,
                    nnkCallStrLit}
   nnkPragmaCallKinds = {nnkExprColonExpr, nnkCall, nnkCallStrLit}
+  nnkRequireInitKinds* = {nnkError, nnkIdent, nnkSym, nnkType}
+    ## `NimNodeKind`s that require initialization and cannot be created via
+    ## general construction routines e.g. `newNimNode`.
 
 proc `==`*(a, b: NimNode): bool {.magic: "EqNimrodNode", noSideEffect.}
   ## Compare two Nim nodes. Return true if nodes are structurally
diff --git a/tests/lang_stmts/defer/tdefer_malformed_many_children.nim b/tests/lang_stmts/defer/tdefer_malformed_many_children.nim
index 9e9c9d8ebf3..324ba6b56d1 100644
--- a/tests/lang_stmts/defer/tdefer_malformed_many_children.nim
+++ b/tests/lang_stmts/defer/tdefer_malformed_many_children.nim
@@ -2,7 +2,7 @@ discard """
   description: "`defer` must have exactly one child node (macro input)."
   errormsg: "illformed AST"
   file: "macros.nim"
-  line: 618
+  line: 622
 """
 
 import std/macros
diff --git a/tests/stdlib/metaprogramming/tmacros.nim b/tests/stdlib/metaprogramming/tmacros.nim
index 8ec2f563426..8fce585e104 100644
--- a/tests/stdlib/metaprogramming/tmacros.nim
+++ b/tests/stdlib/metaprogramming/tmacros.nim
@@ -144,3 +144,14 @@ block: # extractDocCommentsAndRunnables
     
   proc c() {.checkComments("Hello world").} =
     ## Hello world
+
+block some_node_kinds_require_specialize_initialization:
+  ## ensure we can init all the rest as a "negative" test
+  const kindsNotRequiringInit = {low(NimNodeKind)..high(NimNodeKind)} -
+                                  nnkRequireInitKinds
+
+  static:
+    doAssert kindsNotRequiringInit.len > 0
+
+    for k in kindsNotRequiringInit.items:
+      discard newNimNode(k)

From f98e81760161ef3fe303999468fdfe97e4914aee Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sat, 16 Mar 2024 17:38:54 +0100
Subject: [PATCH 040/169] forbid hook routines raising exceptions (#1236)

## Summary

This is enforced as follows:
* if a hook routine potentially raises an exception, a compile-time
  error is reported
* if a hook routine raises a defect at run-time, the program panics

Exception effects of hooks side-step effect tracking for
procedures, and if a hook did raise at run-time, behaviour was
previously undefined. Disallowing hooks from raising exceptions
resolves both issues.

Performance of the produced executables also improves significantly
(depending on the code), as destroy hooks not being able to raise
results in better code generation.

## Details

The implementation is made up of three parts:
* statically enforcing that no exceptions are raised by hooks (in
  `sempass2`)
* preventing exceptions from exiting hooks at run-time (in `mirgen`/
  `liftdestructors`)
* support in the runtime for panicking on unhandled exceptions

### Static Detection

* for hooks, identified by the presence of the `sfOverriden` flag,
  `sempass2` tests against an empty `.raises` specification, ensuring
  that no (tracked) exceptions can be raised
* the existing exception specification is always replaced
* no error is reported when `.raises: []` was explicitly specified, to
  give precedence to the `can raise unlisted exception` error.
* the symbol of hooks is marked with `sfNeverRaises`, to enforce at
  run-time that no exceptions (defects) leave the routine

The meaning of `sfNeverRaises` is changed from being a hint/guarantee
to being a request.

### Enforcement

* `mirgen` wraps the body of `sfNeverRaises` procedures in a
  `try: ... except: nimUnhandledException()`
* elimination of unreachable code in `cgirgen` removes the `except` if
  it's not used in practice
* all synthesized hook procedures (`liftdestructors`) are flagged with
  `sfNeverRaises`; the `canRaise` tracking is removed

### Runtimes

* C runtime: `nimUnhandledException` displays the exception and quits
  the process
* node.js JS runtime: `nimUnhandledException` displays the exception
  and quits the process
* non-node.js JS runtime: `nimUnhandledException` re-raises the
  exception (there's currently no way to terminate the program)
* VM: `nimUnhandledException` is a  `vmop` that raises a
  `vmEvtUnhandledException` event, which aborts execution

### Standard Library and Tests

* fix the `Task` `=destroy` hook being inferred to raise exceptions
* fix `GC_fullCollect` being inferred to raise exceptions

### Tests

Three individual tests need to be adjusted to the language change:
* `tnew` and `gctest` use `debugEcho` instead of `write` (the former
  has no effects)
* `tarcmisc` has to cast away the raise effects of `Stream.close` for
  now

### Specification

The beginnings of a specification test category for hook routines is
added. At the moment, it only covers the exception behaviour.
---
 compiler/ast/report_enums.nim                 |  1 +
 compiler/front/cli_reporter.nim               |  3 ++
 compiler/mir/mirgen.nim                       | 19 +++++++++++
 compiler/sem/injectdestructors.nim            | 34 +------------------
 compiler/sem/liftdestructors.nim              | 11 ++----
 compiler/sem/sempass2.nim                     | 15 ++++++++
 compiler/vm/compilerbridge.nim                |  4 ++-
 compiler/vm/vm.nim                            | 18 ++--------
 compiler/vm/vmdeps.nim                        | 10 ++++++
 compiler/vm/vmops.nim                         | 12 +++++++
 lib/std/tasks.nim                             |  2 +-
 lib/system.nim                                |  3 ++
 lib/system/excpt.nim                          |  6 ++++
 lib/system/jssys.nim                          | 32 +++++++++++++++--
 lib/system/orc.nim                            |  4 +--
 tests/arc/tarcmisc.nim                        |  3 +-
 tests/arc/topt_no_cursor.nim                  | 14 ++++----
 tests/errmsgs/tprefer_raise_spec_error.nim    | 16 +++++++++
 tests/gc/gctest.nim                           |  3 +-
 tests/lang/s02_core/s99_hooks/README.md       | 21 ++++++++++++
 .../s99_hooks/s99_escaping_defects/README.md  |  3 ++
 .../s99_escaping_defects/t01_copy_hook.nim    | 17 ++++++++++
 .../s99_escaping_defects/t02_sink_hook.nim    | 17 ++++++++++
 .../s99_escaping_defects/t03_destroy_hook.nim | 17 ++++++++++
 .../s99_escaping_defects/t04_trace_hook.nim   | 17 ++++++++++
 .../t05_deepcopy_hook.nim                     | 16 +++++++++
 .../s02_core/s99_hooks/t99_cannot_raise.nim   | 30 ++++++++++++++++
 tests/misc/tnew.nim                           |  3 +-
 28 files changed, 274 insertions(+), 77 deletions(-)
 create mode 100644 tests/errmsgs/tprefer_raise_spec_error.nim
 create mode 100644 tests/lang/s02_core/s99_hooks/README.md
 create mode 100644 tests/lang/s02_core/s99_hooks/s99_escaping_defects/README.md
 create mode 100644 tests/lang/s02_core/s99_hooks/s99_escaping_defects/t01_copy_hook.nim
 create mode 100644 tests/lang/s02_core/s99_hooks/s99_escaping_defects/t02_sink_hook.nim
 create mode 100644 tests/lang/s02_core/s99_hooks/s99_escaping_defects/t03_destroy_hook.nim
 create mode 100644 tests/lang/s02_core/s99_hooks/s99_escaping_defects/t04_trace_hook.nim
 create mode 100644 tests/lang/s02_core/s99_hooks/s99_escaping_defects/t05_deepcopy_hook.nim
 create mode 100644 tests/lang/s02_core/s99_hooks/t99_cannot_raise.nim

diff --git a/compiler/ast/report_enums.nim b/compiler/ast/report_enums.nim
index d4da99e7f74..4b4afeeef41 100644
--- a/compiler/ast/report_enums.nim
+++ b/compiler/ast/report_enums.nim
@@ -423,6 +423,7 @@ type
     rsemCallingConventionMismatch
     rsemHasSideEffects
     rsemCantPassProcvar
+    rsemHookCannotRaise
     rsemUnlistedRaises
     rsemUnlistedEffects
     rsemOverrideSafetyMismatch
diff --git a/compiler/front/cli_reporter.nim b/compiler/front/cli_reporter.nim
index cee55b31a27..de634c0cc33 100644
--- a/compiler/front/cli_reporter.nim
+++ b/compiler/front/cli_reporter.nim
@@ -1303,6 +1303,9 @@ proc reportBody*(conf: ConfigRef, r: SemReport): string =
     of rsemXCannotRaiseY:
       result = "'$1' cannot raise '$2'" % [r.ast.render, r.raisesList.render]
 
+    of rsemHookCannotRaise:
+      result = "a hook routine is not allowed to raise. ($1)" % r.typ.render
+
     of rsemUnlistedRaises, rsemWarnUnlistedRaises:
       result.add("$1 can raise an unlisted exception: " % r.ast.render,
                  r.typ.render)
diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index 572b334956e..cbbfd5e1860 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -2058,6 +2058,10 @@ proc generateCode*(graph: ModuleGraph, env: var MirEnv, owner: PSym,
 
   c.scopeDepth = 1
   c.add MirNode(kind: mnkScope)
+  if sfNeverRaises in owner.flags:
+    c.add MirNode(kind: mnkTry, len: 1)
+    c.add MirNode(kind: mnkStmtList)
+
   if owner.kind in routineKinds:
     # add a 'def' for each ``sink`` parameter. This simplifies further
     # processing and analysis
@@ -2070,6 +2074,21 @@ proc generateCode*(graph: ModuleGraph, env: var MirEnv, owner: PSym,
           c.add MirNode(kind: mnkNone)
 
   gen(c, body)
+
+  if sfNeverRaises in owner.flags:
+    # if it's enforced that the procedure never raises, exceptions escaping
+    # the procedure terminate the program. This is achieved by wrapping the
+    # body in a catch-all exception handler
+    c.add endNode(mnkStmtList)
+    c.subTree MirNode(kind: mnkExcept, len: 1):
+      c.subTree mnkBranch:
+        c.subTree mnkVoid:
+          let p = c.graph.getCompilerProc("nimUnhandledException")
+          c.builder.buildCall c.env.procedures.add(p), p.typ,
+                              typeOrVoid(c, p.typ[0]):
+            discard
+    c.add endNode(mnkTry)
+
   c.add endNode(mnkScope)
 
   swap(c.env, env) # swap back
diff --git a/compiler/sem/injectdestructors.nim b/compiler/sem/injectdestructors.nim
index 8b5330280f1..8ad20cf2469 100644
--- a/compiler/sem/injectdestructors.nim
+++ b/compiler/sem/injectdestructors.nim
@@ -63,31 +63,6 @@
 ## subsequently turning the assignment into a move and thus making the
 ## assertion fail with an ``IndexDefect``.
 
-# XXX: there exists an effect-related problem with the lifetime-tracking hooks
-#      (i.e. ``=copy``, ``=sink``, ``=destroy``). The assignment rewriting and,
-#      to some degree, the destructor injection can be seen as a
-#      refinement/expansion/lowering and should thus not introduce (observable)
-#      side-effects (mutation of global state, exceptional control-flow, etc.) --
-#      it also violates the MIR specification. All three hooks are currently
-#      allowed to have side-effects, which violates the aforementioned rules.
-#      It also causes the concrete issue of cyclic dependencies: for example,
-#      the move analyser uses data-flow analysis (which requires a control-flow
-#      graph) in order to decide where to move and where to copy. If whether a
-#      copy or move is used affects the control-flow graph, the move analyser
-#      depends on its own output, which while possible to make work, would
-#      likely introduce a large amount of complexity.
-#      There are two possible solutions:
-#      1. disallow lifetime-tracking hooks from having any side-effects
-#      2. at least for the ``=copy`` and ``=sink`` hooks, each assignment
-#         could be said to have the union of the effects from both hooks.
-#         Those can be computed when generating the MIR code, as types and
-#         their type-bound operations are already figured out at that point.
-#         It's more complicated for ``=destroy`` hooks, since they are
-#         injected rather than being the result of an expansion. The current
-#         plan is to introduce the MIR concept of dedicated "scope finalizers",
-#         which could be used to attach the effects gathered from all possible
-#         destructor calls to
-
 # XXX: not being able to rewrite an assignment into a call to the copy hook
 #      because it is disabled is a semantic error, meaning that it should
 #      be detected and reported during semantic analysis, not as part of
@@ -527,14 +502,7 @@ template buildVoidCall*(bu: var MirBuilder, env: var MirEnv, p: PSym,
                        body: untyped) =
   let prc = p # prevent multi evaluation
   bu.subTree mnkVoid:
-    let kind =
-      if canRaise(optPanics in graph.config.globalOptions, prc.ast[namePos]):
-        mnkCheckedCall
-      else:
-        mnkCall
-
-    # XXX: injected procedures should not introduce new control-flow paths
-    bu.subTree MirNode(kind: kind, typ: getVoidType(graph)):
+    bu.subTree MirNode(kind: mnkCall, typ: getVoidType(graph)):
       bu.use toValue(env.procedures.add(prc), prc.typ)
       body
 
diff --git a/compiler/sem/liftdestructors.nim b/compiler/sem/liftdestructors.nim
index 7493f01316d..8c66b425416 100644
--- a/compiler/sem/liftdestructors.nim
+++ b/compiler/sem/liftdestructors.nim
@@ -57,7 +57,6 @@ type
     asgnForType: PType
     recurse: bool
     addMemReset: bool    # add wasMoved() call after destructor call
-    canRaise: bool
     filterDiscriminator: PSym  # we generating destructor for case branch
     c: PContext # c can be nil, then we are called from lambdalifting!
     idgen: IdGenerator
@@ -152,8 +151,6 @@ proc genContainerOf(c: var TLiftCtx; objType: PType, field, x: PSym): PNode =
 proc destructorCall(c: var TLiftCtx; op: PSym; x: PNode): PNode =
   var destroy = newTreeIT(nkCall, x.info, op.typ[0]):
     [newSymNode(op), genAddr(c, x)]
-  if sfNeverRaises notin op.flags:
-    c.canRaise = true
   if c.addMemReset:
     result = newTree(nkStmtList):
       [destroy, genBuiltin(c, mWasMoved,  "wasMoved", x)]
@@ -303,8 +300,6 @@ proc newHookCall(c: var TLiftCtx; op: PSym; x, y: PNode): PNode =
   #  localReport(c.config, x.info, "usage of '$1' is a user-defined error" % op.name.s)
   result = newNodeI(nkCall, x.info)
   result.add newSymNode(op)
-  if sfNeverRaises notin op.flags:
-    c.canRaise = true
   if op.typ.sons[1].kind == tyVar:
     result.add genAddr(c, x)
   else:
@@ -322,8 +317,6 @@ proc newHookCall(c: var TLiftCtx; op: PSym; x, y: PNode): PNode =
 proc newOpCall(c: var TLiftCtx; op: PSym; x: PNode): PNode =
   result = newTreeIT(nkCall, x.info, op.typ[0]):
     [newSymNode(op), x]
-  if sfNeverRaises notin op.flags:
-    c.canRaise = true
 
 proc newDeepCopyCall(c: var TLiftCtx; op: PSym; x, y: PNode): PNode =
   result = newAsgnStmt(x, newOpCall(c, op, y))
@@ -948,7 +941,7 @@ proc produceSym(g: ModuleGraph; c: PContext; typ: PType; kind: TTypeAttachedOp;
         # bug #19205: Do not forget to also copy the hidden type field:
         genTypeFieldCopy(a, typ, result.ast[bodyPos], d, src)
 
-  if not a.canRaise: incl result.flags, sfNeverRaises
+  incl result.flags, sfNeverRaises
   completePartialOp(g, idgen.module, typ, kind, result)
 
 
@@ -972,7 +965,7 @@ proc produceDestructorForDiscriminator*(g: ModuleGraph; typ: PType; field: PSym,
   result.ast[bodyPos].add v
   let placeHolder = newNodeIT(nkSym, info, getSysType(g, info, tyPointer))
   fillBody(a, typ, result.ast[bodyPos], d, placeHolder)
-  if not a.canRaise: incl result.flags, sfNeverRaises
+  incl result.flags, sfNeverRaises
 
 
 template liftTypeBoundOps*(c: PContext; typ: PType; info: TLineInfo) =
diff --git a/compiler/sem/sempass2.nim b/compiler/sem/sempass2.nim
index 74b6e2e2c89..d60c2146345 100644
--- a/compiler/sem/sempass2.nim
+++ b/compiler/sem/sempass2.nim
@@ -1788,6 +1788,21 @@ proc trackProc*(c: PContext; s: PSym, body: PNode) =
   else:
     effects[tagEffects] = t.tags
 
+  # ensure that user-provided hooks have no effects and don't raise
+  if sfOverriden in s.flags:
+    # if raising was explicitly disabled (i.e., via ``.raises: []``),
+    # exceptions, if any, were already reported; don't report errors again in
+    # that case
+    if raisesSpec.isNil or raisesSpec.len > 0:
+      let newSpec = newNodeI(nkArgList, s.info)
+      checkRaisesSpec(g, rsemHookCannotRaise, newSpec,
+                      t.exc, hints=off, nil)
+      # override the raises specification to prevent cascading errors:
+      effects[exceptionEffects] = newSpec
+
+    # enforce that no defects escape the routine at run-time:
+    s.flags.incl sfNeverRaises
+
   var mutationInfo = MutationInfo()
   var hasMutationSideEffect = false
   if {strictFuncs, views} * c.features != {}:
diff --git a/compiler/vm/compilerbridge.nim b/compiler/vm/compilerbridge.nim
index 6e147734924..27ee3988b7a 100644
--- a/compiler/vm/compilerbridge.nim
+++ b/compiler/vm/compilerbridge.nim
@@ -225,7 +225,9 @@ proc buildError(c: TCtx, thread: VmThread, event: sink VmEvent): ExecErrorReport
   ## Creates an `ExecErrorReport` with the `event` and a stack-trace for
   ## `thread`
   let stackTrace =
-    if event.kind == vmEvtUnhandledException:
+    if event.kind == vmEvtUnhandledException and event.trace.len > 0:
+      # HACK: an unhandled exception can be reported without providing a trace.
+      #       Ideally, that shouldn't happen
       createStackTrace(c, event.trace)
     else:
       createStackTrace(c, thread)
diff --git a/compiler/vm/vm.nim b/compiler/vm/vm.nim
index 67301e53a1c..cd22818da90 100644
--- a/compiler/vm/vm.nim
+++ b/compiler/vm/vm.nim
@@ -286,22 +286,8 @@ template toException(x: DerefFailureCode): untyped =
 
 proc reportException(c: TCtx; trace: sink VmRawStackTrace, raised: LocHandle) =
   ## Reports the exception represented by `raised` by raising a `VmError`
-
-  let name = $raised.getFieldHandle(1.fpos).deref().strVal
-  let msg = $raised.getFieldHandle(2.fpos).deref().strVal
-
-  # The reporter expects the exception as a deserialized PNode-tree. Only the
-  # 2nd (name) and 3rd (msg) field are actually used, so instead of running
-  # full deserialization (which is also not possible due to no `PType` being
-  # available), we just create the necessary parts manually
-
-  # TODO: the report should take the two strings directly instead
-  let empty = newNode(nkEmpty)
-  let ast = newTree(nkObjConstr,
-                    empty, # constructor type; unused
-                    empty, # unused
-                    newStrNode(nkStrLit, name),
-                    newStrNode(nkStrLit, msg))
+  let ast = toExceptionAst($raised.getFieldHandle(1.fpos).deref().strVal,
+                           $raised.getFieldHandle(2.fpos).deref().strVal)
   raiseVmError(VmEvent(kind: vmEvtUnhandledException, exc: ast, trace: trace))
 
 func cleanUpReg(r: var TFullReg, mm: var VmMemoryManager) =
diff --git a/compiler/vm/vmdeps.nim b/compiler/vm/vmdeps.nim
index 59918cdb2af..95318902f0d 100644
--- a/compiler/vm/vmdeps.nim
+++ b/compiler/vm/vmdeps.nim
@@ -428,3 +428,13 @@ proc errorReportToString*(c: ConfigRef, error: Report): string =
               # the report, so need to add `"Error: "`
               # manally to stay consistent with the old
               # output.
+
+proc toExceptionAst*(name, msg: sink string): PNode =
+  ## Creates the AST for an exception object, as expected by the report.
+  # TODO: the report should take the two strings directly instead
+  let empty = newNode(nkEmpty)
+  newTree(nkObjConstr,
+          empty, # constructor type; unused
+          empty, # unused
+          newStrNode(nkStrLit, name),
+          newStrNode(nkStrLit, msg))
diff --git a/compiler/vm/vmops.nim b/compiler/vm/vmops.nim
index 70201fd21ae..3d7db173587 100644
--- a/compiler/vm/vmops.nim
+++ b/compiler/vm/vmops.nim
@@ -170,6 +170,17 @@ proc prepareExceptionWrapper(a: VmArgs) {.nimcall.} =
                  deref(a.getHandle(1)).strVal,
                  a.mem.allocator)
 
+proc nimUnhandledExceptionWrapper(a: VmArgs) {.nimcall.} =
+  # setup the exception AST:
+  let
+    exc = a.heap[].tryDeref(a.currentException, noneType).value()
+    ast = toExceptionAst($exc.getFieldHandle(1.fpos).deref().strVal,
+                         $exc.getFieldHandle(2.fpos).deref().strVal)
+  # report the unhandled exception:
+  # XXX: the current stack-trace should be passed along, but we don't
+  #      have access to it here
+  raiseVmError(VmEvent(kind: vmEvtUnhandledException, exc: ast))
+
 proc prepareMutationWrapper(a: VmArgs) {.nimcall.} =
   discard "no-op"
 
@@ -247,6 +258,7 @@ iterator basicOps*(): Override =
   systemop(getCurrentExceptionMsg)
   systemop(getCurrentException)
   systemop(prepareException)
+  systemop(nimUnhandledException)
   systemop(prepareMutation)
   override("stdlib.system.closureIterSetupExc",
            setCurrentExceptionWrapper)
diff --git a/lib/std/tasks.nim b/lib/std/tasks.nim
index e2ea5377f43..ac18862228e 100644
--- a/lib/std/tasks.nim
+++ b/lib/std/tasks.nim
@@ -61,7 +61,7 @@ type
   Task* = object ## `Task` contains the callback and its arguments.
     callback: proc (args: pointer) {.nimcall, gcsafe.}
     args: pointer
-    destroy: proc (args: pointer) {.nimcall, gcsafe.}
+    destroy: proc (args: pointer) {.nimcall, gcsafe, raises: [].}
 
 
 proc `=copy`*(x: var Task, y: Task) {.error.}
diff --git a/lib/system.nim b/lib/system.nim
index 550b60ac13c..72927a6b123 100644
--- a/lib/system.nim
+++ b/lib/system.nim
@@ -2348,6 +2348,9 @@ elif isNimVmTarget:
   proc prepareException(e: ref Exception, ename: cstring) {.compilerproc.} =
     discard
 
+  proc nimUnhandledException() {.compilerproc.} =
+    discard
+
   proc closureIterSetupExc(e: ref Exception) {.compilerproc, inline.} =
     ## Used by the closure transformation pass for preparing for exception
     ## handling. Implemented as a callback.
diff --git a/lib/system/excpt.nim b/lib/system/excpt.nim
index 8603fce28b7..961d02da475 100644
--- a/lib/system/excpt.nim
+++ b/lib/system/excpt.nim
@@ -427,6 +427,12 @@ when true:
       currException = nil
       quit(1)
 
+proc nimUnhandledException() {.compilerproc, noreturn.} =
+  ## Called from generated code when propagation of an exception crosses a
+  ## routine boundary it shouldn't.
+  reportUnhandledError(currException)
+  quit(1)
+
 proc pushActiveException(e: sink(ref Exception)) =
   e.up = activeException
   activeException = e
diff --git a/lib/system/jssys.nim b/lib/system/jssys.nim
index 86b749c47ad..363d20a976a 100644
--- a/lib/system/jssys.nim
+++ b/lib/system/jssys.nim
@@ -115,8 +115,7 @@ proc writeStackTrace() =
 proc getStackTrace*(): string = rawWriteStackTrace()
 proc getStackTrace*(e: ref Exception): string = e.trace
 
-proc unhandledException(e: ref Exception) {.
-    compilerproc, asmNoStackFrame.} =
+proc unhandledExceptionString(e: ref Exception): string =
   var buf = ""
   if e.msg.len != 0:
     add(buf, "Error: unhandled exception: ")
@@ -128,7 +127,11 @@ proc unhandledException(e: ref Exception) {.
   add(buf, "]\n")
   when NimStackTrace:
     add(buf, rawWriteStackTrace())
-  let cbuf = cstring(buf)
+  result = buf
+
+proc unhandledException(e: ref Exception) {.
+    compilerproc, asmNoStackFrame.} =
+  let cbuf = cstring(unhandledExceptionString(e))
   framePtr = nil
   {.emit: """
   if (typeof(Error) !== "undefined") {
@@ -139,6 +142,29 @@ proc unhandledException(e: ref Exception) {.
   }
   """.}
 
+proc nimUnhandledException() {.compilerproc, asmNoStackFrame.} =
+  # |NimSkull| exceptions are turned into JavaScript errors for the purpose
+  # of better error messages
+  when defined(nodejs):
+    {.emit: """
+      if (lastJSError.m_type !== undefined) {
+        console.log(`toJSStr`(`unhandledExceptionString`(`lastJSError`)));
+      } else {
+        console.log('Error: unhandled exception: ', `lastJSError`)
+      }
+      process.exit(1);
+    """.}
+  else:
+    # it's currently not possible to truly panic (abort execution) for non-
+    # node.js JavaScript
+    {.emit: """
+      if (lastJSError.m_type !== undefined) {
+        `unhandledException`(lastJSError);
+      } else {
+        throw lastJSError;
+      }
+    """.}
+
 proc prepareException(e: ref Exception, ename: cstring) {.
     compilerproc, asmNoStackFrame.} =
   if e.name.isNil:
diff --git a/lib/system/orc.nim b/lib/system/orc.nim
index 38da71d9cda..ee44add02a0 100644
--- a/lib/system/orc.nim
+++ b/lib/system/orc.nim
@@ -27,7 +27,7 @@ const
   logOrc = defined(nimArcIds)
 
 type
-  TraceProc = proc (p, env: pointer) {.nimcall, benign.}
+  TraceProc = proc (p, env: pointer) {.nimcall, benign, raises: [], tags: [].}
   DisposeProc = proc (p: pointer) {.nimcall, benign.}
 
 template color(c): untyped = c.rc and colorMask
@@ -472,7 +472,7 @@ proc GC_prepareOrc*(): int {.inline.} = roots.len
 proc GC_partialCollect*(limit: int) =
   partialCollect(limit)
 
-proc GC_fullCollect* =
+proc GC_fullCollect*() {.raises: [].} =
   ## Forces a full garbage collection pass. With `--gc:orc` triggers the cycle
   ## collector. This is an alias for `GC_runOrc`.
   collectCycles()
diff --git a/tests/arc/tarcmisc.nim b/tests/arc/tarcmisc.nim
index 0e1dda7fb33..3747f624097 100644
--- a/tests/arc/tarcmisc.nim
+++ b/tests/arc/tarcmisc.nim
@@ -112,7 +112,8 @@ type
     x: int
 
 proc `=destroy`(x: var AObj) =
-  close(x.io)
+  {.cast(raises: []).}:
+    close(x.io)
   echo "closed"
 
 var x = B(io: newStringStream("thestream"))
diff --git a/tests/arc/topt_no_cursor.nim b/tests/arc/topt_no_cursor.nim
index 398a0fe593f..491fc9aefd3 100644
--- a/tests/arc/topt_no_cursor.nim
+++ b/tests/arc/topt_no_cursor.nim
@@ -33,17 +33,17 @@ scope:
   def_cursor _0: Node = target[]
   def_cursor _1: Node = _0[].parent
   def sibling: Node
-  =copy(name sibling, arg _1[].left) (raises)
+  =copy(name sibling, arg _1[].left)
   def_cursor _2: Node = sibling
   def saved: Node
-  =copy(name saved, arg _2[].right) (raises)
+  =copy(name saved, arg _2[].right)
   def_cursor _3: Node = sibling
   def_cursor _4: Node = saved
   def_cursor _6: Node = _4[].left
-  =copy(name _3[].right, arg _6) (raises)
+  =copy(name _3[].right, arg _6)
   def_cursor _5: Node = sibling
-  =sink(name _5[].parent, arg saved) (raises)
-  =destroy(name sibling) (raises)
+  =sink(name _5[].parent, arg saved)
+  =destroy(name sibling)
 -- end of expandArc ------------------------
 --expandArc: p1
 
@@ -130,7 +130,7 @@ scope:
 scope:
   try:
     def shadowScope: Scope
-    =copy(name shadowScope, arg c[].currentScope) (raises)
+    =copy(name shadowScope, arg c[].currentScope)
     rawCloseScope(arg c) (raises)
     scope:
       def_cursor _0: Scope = shadowScope
@@ -157,7 +157,7 @@ scope:
                   addInterfaceDecl(arg c, consume _6) (raises)
                 i = addI(arg i, arg 1) (raises)
   finally:
-    =destroy(name shadowScope) (raises)
+    =destroy(name shadowScope)
 -- end of expandArc ------------------------
 --expandArc: treturn
 
diff --git a/tests/errmsgs/tprefer_raise_spec_error.nim b/tests/errmsgs/tprefer_raise_spec_error.nim
new file mode 100644
index 00000000000..4d92f4de3f0
--- /dev/null
+++ b/tests/errmsgs/tprefer_raise_spec_error.nim
@@ -0,0 +1,16 @@
+discard """
+  description: '''
+    An error for violating the explicit `.raises` specification is preferred
+    over the error that hooks cannot raise
+  '''
+  errormsg: "doRaise() can raise an unlisted exception: ref CatchableError"
+  line: 16
+"""
+
+type Obj = object
+
+proc doRaise() =
+  raise CatchableError.newException("")
+
+proc `=copy`(a: var Obj, b: Obj) {.raises: [].} =
+  doRaise()
diff --git a/tests/gc/gctest.nim b/tests/gc/gctest.nim
index f241bfaf2f0..36138ce1f1d 100644
--- a/tests/gc/gctest.nim
+++ b/tests/gc/gctest.nim
@@ -60,8 +60,7 @@ proc caseTree(lvl: int = 0): PCaseNode =
 
 proc `=destroy`(n: var TNode) =
   assert(addr(n) != nil)
-  write(stdout, "finalizing: ")
-  writeLine(stdout, "not nil")
+  debugEcho "finalizing: not nil"
 
 var
   id: int = 1
diff --git a/tests/lang/s02_core/s99_hooks/README.md b/tests/lang/s02_core/s99_hooks/README.md
new file mode 100644
index 00000000000..786bff439da
--- /dev/null
+++ b/tests/lang/s02_core/s99_hooks/README.md
@@ -0,0 +1,21 @@
+## What belongs here
+
+This section contains tests related to hook procedures, that is, procedures:
+- to which calls are statically inserted by the compiler
+- that are invoked by the runtime at run-time
+
+This should cover:
+- syntax
+- restrictions on the routine definitions
+- restrictions on the run-time behaviour (if any)
+- where the hooks are injected
+
+## Assumptions
+
+- nothing beyond a single module/file
+- assertions may still be built-ins
+- user-defined types are supported and work
+- procedures and calls thereof work
+- `var T` is supported as a parameter's type
+- raising and catching exceptions work
+- tag effect tracking works
\ No newline at end of file
diff --git a/tests/lang/s02_core/s99_hooks/s99_escaping_defects/README.md b/tests/lang/s02_core/s99_hooks/s99_escaping_defects/README.md
new file mode 100644
index 00000000000..1538b39ff42
--- /dev/null
+++ b/tests/lang/s02_core/s99_hooks/s99_escaping_defects/README.md
@@ -0,0 +1,3 @@
+If a Defect is raised from a hook routine at run-time, the program immediately
+terminates (i.e., panics) and an unhandled exception is reported. This is the
+case for both automatic and explicit calls of the hooks.
\ No newline at end of file
diff --git a/tests/lang/s02_core/s99_hooks/s99_escaping_defects/t01_copy_hook.nim b/tests/lang/s02_core/s99_hooks/s99_escaping_defects/t01_copy_hook.nim
new file mode 100644
index 00000000000..af708b10886
--- /dev/null
+++ b/tests/lang/s02_core/s99_hooks/s99_escaping_defects/t01_copy_hook.nim
@@ -0,0 +1,17 @@
+discard """
+  description: "`=copy` hooks panic when a defect escapes"
+  outputsub: "Error: unhandled exception: error [Defect]"
+  exitcode: 1
+"""
+
+type Type = object
+
+proc `=copy`(a: var Type, b: Type) =
+  raise (ref Defect)(msg: "error")
+
+try:
+  var x: Type
+  `=copy`(x, Type())
+finally:
+  # finally sections are not reached and no cleanup is performed
+  doAssert false
diff --git a/tests/lang/s02_core/s99_hooks/s99_escaping_defects/t02_sink_hook.nim b/tests/lang/s02_core/s99_hooks/s99_escaping_defects/t02_sink_hook.nim
new file mode 100644
index 00000000000..e6f7af55f62
--- /dev/null
+++ b/tests/lang/s02_core/s99_hooks/s99_escaping_defects/t02_sink_hook.nim
@@ -0,0 +1,17 @@
+discard """
+  description: "`=sink` hooks panic when a defect escapes"
+  outputsub: "Error: unhandled exception: error [Defect]"
+  exitcode: 1
+"""
+
+type Type = object
+
+proc `=sink`(a: var Type, b: Type) =
+  raise (ref Defect)(msg: "error")
+
+try:
+  var x: Type
+  `=sink`(x, Type())
+finally:
+  # finally sections are not reached and no cleanup is performed
+  doAssert false
diff --git a/tests/lang/s02_core/s99_hooks/s99_escaping_defects/t03_destroy_hook.nim b/tests/lang/s02_core/s99_hooks/s99_escaping_defects/t03_destroy_hook.nim
new file mode 100644
index 00000000000..5433c981d39
--- /dev/null
+++ b/tests/lang/s02_core/s99_hooks/s99_escaping_defects/t03_destroy_hook.nim
@@ -0,0 +1,17 @@
+discard """
+  description: "`=destroy` hooks panic when a defect escapes"
+  outputsub: "Error: unhandled exception: error [Defect]"
+  exitcode: 1
+"""
+
+type Type = object
+
+proc `=destroy`(a: var Type) =
+  raise (ref Defect)(msg: "error")
+
+try:
+  var x: Type
+  `=destroy`(x)
+finally:
+  # finally sections are not reached and no cleanup is performed
+  doAssert false
diff --git a/tests/lang/s02_core/s99_hooks/s99_escaping_defects/t04_trace_hook.nim b/tests/lang/s02_core/s99_hooks/s99_escaping_defects/t04_trace_hook.nim
new file mode 100644
index 00000000000..65d62b289fc
--- /dev/null
+++ b/tests/lang/s02_core/s99_hooks/s99_escaping_defects/t04_trace_hook.nim
@@ -0,0 +1,17 @@
+discard """
+  description: "`=trace` hooks panic when a defect escapes"
+  outputsub: "Error: unhandled exception: error [Defect]"
+  exitcode: 1
+"""
+
+type Type = object
+
+proc `=trace`(a: var Type, p: pointer) =
+  raise (ref Defect)(msg: "error")
+
+try:
+  var x: Type
+  `=trace`(x, nil)
+finally:
+  # finally sections are not reached and no cleanup is performed
+  doAssert false
diff --git a/tests/lang/s02_core/s99_hooks/s99_escaping_defects/t05_deepcopy_hook.nim b/tests/lang/s02_core/s99_hooks/s99_escaping_defects/t05_deepcopy_hook.nim
new file mode 100644
index 00000000000..a4196256bc9
--- /dev/null
+++ b/tests/lang/s02_core/s99_hooks/s99_escaping_defects/t05_deepcopy_hook.nim
@@ -0,0 +1,16 @@
+discard """
+  description: "`=deepcopy` hooks panic when a defect escapes"
+  outputsub: "Error: unhandled exception: error [Defect]"
+  exitcode: 1
+"""
+
+type Type = ref object
+
+proc `=deepcopy`(a: Type): Type =
+  raise (ref Defect)(msg: "error")
+
+try:
+  var x = `=deepcopy`(Type())
+finally:
+  # finally sections are not reached and no cleanup is performed
+  doAssert false
diff --git a/tests/lang/s02_core/s99_hooks/t99_cannot_raise.nim b/tests/lang/s02_core/s99_hooks/t99_cannot_raise.nim
new file mode 100644
index 00000000000..0232aeed375
--- /dev/null
+++ b/tests/lang/s02_core/s99_hooks/t99_cannot_raise.nim
@@ -0,0 +1,30 @@
+discard """
+  description: '''
+    Hook routines are not allowed to raise exception. If they're inferred to
+    raise, a compile-time error is reported.
+  '''
+  action: reject
+  matrix: "--errorMax:5"
+"""
+
+type Type = object
+
+proc `=copy`(a: var Type, b: Type) =
+  raise (ref CatchableError)() #[tt.Error
+  ^ a hook routine is not allowed to raise. (ref CatchableError)]#
+
+proc `=sink`(a: var Type, b: Type) =
+  raise (ref CatchableError)() #[tt.Error
+  ^ a hook routine is not allowed to raise. (ref CatchableError)]#
+
+proc `=destroy`(a: var Type) =
+  raise (ref CatchableError)() #[tt.Error
+  ^ a hook routine is not allowed to raise. (ref CatchableError)]#
+
+proc `=trace`(a: var Type, env: pointer) =
+  raise (ref CatchableError)() #[tt.Error
+  ^ a hook routine is not allowed to raise. (ref CatchableError)]#
+
+proc `=deepCopy`(a: ref Type): ref Type =
+  raise (ref CatchableError)() #[tt.Error
+  ^ a hook routine is not allowed to raise. (ref CatchableError)]#
diff --git a/tests/misc/tnew.nim b/tests/misc/tnew.nim
index 318fa644be3..1c44bc7b457 100644
--- a/tests/misc/tnew.nim
+++ b/tests/misc/tnew.nim
@@ -20,8 +20,7 @@ type
   TStressTest = ref array[0..45, array[1..45, TNode]]
 
 proc `=destroy`(n: var TNode) =
-  write(stdout, n.data)
-  write(stdout, " is now freed\n")
+  debugEcho n.data, " is now freed"
 
 proc newNode(data: int, le, ri: PNode): PNode =
   new(result)

From 8a55ef7ca560444d80ca06ae14b2a9a986c1305b Mon Sep 17 00:00:00 2001
From: Clyybber <darkmine956@gmail.com>
Date: Sun, 17 Mar 2024 12:05:29 +0100
Subject: [PATCH 041/169] sem: `NimNode` equality respects `nkType`'s type
 (#1245)

## Summary
`exprStructuralEquivalentStrictSymAndComm` no longer ignores type
equality for `nkType` nodes.
This affects ``macros.`==` `` for NimNodes and `macrocache.incl`
(and `ic`).

## Details
A test using ``macros.`==` `` has been added.
---
 compiler/ast/trees.nim                        |  2 +-
 .../lang_callable/macros/tmacros_various.nim  | 40 +++++++++++++++++++
 2 files changed, 41 insertions(+), 1 deletion(-)

diff --git a/compiler/ast/trees.nim b/compiler/ast/trees.nim
index 317ec8896e7..24473ece706 100644
--- a/compiler/ast/trees.nim
+++ b/compiler/ast/trees.nim
@@ -97,7 +97,7 @@ makeTreeEquivalenceProc(exprStructuralEquivalentStrictSymAndComm,
   relaxedKindCheck = false,
   symCheck     = a.sym == b.sym,
   floatCheck   = sameFloatIgnoreNan(a.floatVal, b.floatVal),
-  typeCheck    = true,
+  typeCheck    = a.typ == b.typ,
   commentCheck = a.comment == b.comment
 )
 export exprStructuralEquivalentStrictSymAndComm
diff --git a/tests/lang_callable/macros/tmacros_various.nim b/tests/lang_callable/macros/tmacros_various.nim
index 5d7d62dffb1..39802860453 100644
--- a/tests/lang_callable/macros/tmacros_various.nim
+++ b/tests/lang_callable/macros/tmacros_various.nim
@@ -12,6 +12,8 @@ Infix
 macrocache ok
 CommentStmt "comment 1"
 CommentStmt "comment 2"
+false
+false
 '''
 
   output: '''
@@ -346,3 +348,41 @@ block:
   static:
     echo treeRepr(C1[1])
     echo treeRepr(C2[1])
+
+block:
+  # Ensure nkType equality is not ignored by `==` for NimNode
+  macro checkEq(a, b: typed) =
+    echo a == b
+
+  type Exception1 = object of Exception
+  type Exception2 = object of Exception
+  checkEq (;
+    try:
+      discard
+    except Exception1:
+      discard
+  ), (;
+    try:
+      discard
+    except Exception2:
+      discard
+  )
+
+  macro checkEqOfTry(a, b: typed) =
+    echo a[0][1][1] == b[0][1][1]
+
+  checkEqOfTry (;
+    block:
+      type E = object of Exception1
+      try:
+        discard
+      except E:
+        discard
+  ), (;
+    block:
+      type E = object of Exception2
+      try:
+        discard
+      except E:
+        discard
+  )

From 8d0db1d38140f25044b7d7d4fdad4b741f9edf4e Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Mon, 18 Mar 2024 00:48:08 +0100
Subject: [PATCH 042/169] make locals' lifetimes bounded by lexical scope for
 `if` (#1247)

## Summary

Temporaries and locals that start their storage duration within
`if`/`elif` condition expressions are now destroyed, if necessary,
at the end of the `if`/`elif` branch, not at the end of the `if`'s
enclosing scope. This makes the end of their storage duration
consistent with the end of their lexical scope.

## Details

Making the storage duration end at the end of the `if`/`elif` is
achieved by `mirgen` wrapping the code for each `nkElifBranch` in a
`scope`.

### `while` Lowering

Each `nkElifBranch` being wrapped in a (lifetime) scope means that
lowering `while cond` into `while true: (if not cond: break; body)`
no longer works, since locals and temporaries starting their
storage duration during evaluation of the `cond` expression would
be destroyed at the end of the `if`, instead of at the end of the
`while`'s body.

To ensure correct and expected lifetimes, `cond` is first assigned
to a temporary, which the `if` then uses for branching. For
example, `while (let x = y; x > 1): body` is lowered by `transf`
into:
```nim
while true:
  let tmp = (let x = y; x > 1)
  if not tmp:
    break
  body
```

Turning `while cond` into `while true: (if cond: body else: break)`
would work too, but it was decided against, because:
* it, currently, results in worse cursor inference results (meaning
  more copies)
* it expands to more MIR code (more work for data-flow analysis)
---
 compiler/mir/mirgen.nim                   | 13 ++--
 compiler/sem/transf.nim                   | 16 +++-
 tests/arc/tcontrolflow.nim                |  7 +-
 tests/arc/topt_cursor.nim                 | 21 +++---
 tests/arc/topt_no_cursor.nim              | 90 ++++++++++++-----------
 tests/arc/topt_refcursors.nim             | 24 +++---
 tests/arc/topt_wasmoved_destroy_pairs.nim | 65 ++++++++--------
 7 files changed, 136 insertions(+), 100 deletions(-)

diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index cbbfd5e1860..b2e0aa7b930 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -1459,12 +1459,13 @@ proc genIf(c: var TCtx, n: PNode, dest: Destination) =
 
   template genElifBranch(branch: PNode, extra: untyped) =
     ## Generates the code for a single ``nkElif(Branch|Expr)``
-    let v = genUse(c, branch[0])
-    c.subTree mnkIf:
-      c.use v
-      c.scope:
-        genBranch(c, branch.lastSon, dest)
-        extra
+    c.scope:
+      let v = genUse(c, branch[0])
+      c.subTree mnkIf:
+        c.use v
+        c.scope:
+          genBranch(c, branch.lastSon, dest)
+          extra
 
   if n.len == 1:
     # an ``if`` statement/expression with a single branch. Don't emit the
diff --git a/compiler/sem/transf.nim b/compiler/sem/transf.nim
index 829171cb34c..0728f544adb 100644
--- a/compiler/sem/transf.nim
+++ b/compiler/sem/transf.nim
@@ -373,9 +373,9 @@ proc transformWhile(c: PTransf; n: PNode): PNode =
       loop[0] = newIntTypeNode(1, c.graph.getSysType(info, tyBool))
       loop[0].info = info
 
-      # XXX: we need to help ``closureiters`` (which doesn't support 'yield' in
-      #      if conditions...) here and unpack complex condition expressions;
-      #      'yield' in 'while' conditions would not work otherwise
+      # unwrap the statement list expression. It helps with the following
+      # lowering, and it's also necessary for the closure iterator
+      # transformation
       var preamble = PNode(nil)
       if cond.kind in {nkStmtListExpr, nkStmtList}:
         preamble = newNodeI(nkStmtList, info, cond.len - 1)
@@ -384,6 +384,16 @@ proc transformWhile(c: PTransf; n: PNode): PNode =
 
         cond = cond[^1]
 
+      # all definitions part of the condition expression are part of the while's
+      # scope, placing the expression into the if's condition slot would thus
+      # result in incorrect scoping
+      if not isAtom(cond):
+        let tmp = newTemp(c, cond.typ, cond.info)
+        if preamble.isNil:
+          preamble = newTree(nkStmtList)
+        preamble.add newTree(nkLetSection, newIdentDefs(tmp, cond))
+        cond = tmp
+
       let exit =
         newTreeI(nkIfStmt, info,
           newTreeI(nkElifBranch, info,
diff --git a/tests/arc/tcontrolflow.nim b/tests/arc/tcontrolflow.nim
index 80cc2b187eb..fd99f9141a9 100644
--- a/tests/arc/tcontrolflow.nim
+++ b/tests/arc/tcontrolflow.nim
@@ -1,12 +1,12 @@
 discard """
   output: '''begin A
 elif
-end A
 destroyed
+end A
 begin false
 if
-end false
 destroyed
+end false
 begin true
 if
 end true
@@ -19,6 +19,9 @@ true
 # we use the -d:danger switch to detect uninitialized stack
 # slots more reliably (there shouldn't be any, of course).
 
+# XXX: the test here need to be improved and turned into a proper
+#      specification
+
 type
   Foo = object
     id: int
diff --git a/tests/arc/topt_cursor.nim b/tests/arc/topt_cursor.nim
index 2085b3c17d9..4f4cb9f59ff 100644
--- a/tests/arc/topt_cursor.nim
+++ b/tests/arc/topt_cursor.nim
@@ -7,10 +7,11 @@ scope:
   try:
     def_cursor x: (string, int) = <D0>
     block L0:
-      if cond:
-        scope:
-          x = <D1>
-          break L0
+      scope:
+        if cond:
+          scope:
+            x = <D1>
+            break L0
       scope:
         x = <D2>
     def_cursor _0: (string, int) = x
@@ -35,11 +36,13 @@ scope:
               while true:
                 scope:
                   def_cursor _1: File = f
-                  def _2: bool = readLine(arg _1, name res) (raises)
-                  def _3: bool = not(arg _2)
-                  if _3:
-                    scope:
-                      break L0
+                  def :tmp: bool = readLine(arg _1, name res) (raises)
+                  scope:
+                    def_cursor _2: bool = :tmp
+                    def _3: bool = not(arg _2)
+                    if _3:
+                      scope:
+                        break L0
                   scope:
                     scope:
                       def_cursor x: string = res
diff --git a/tests/arc/topt_no_cursor.nim b/tests/arc/topt_no_cursor.nim
index 491fc9aefd3..1dc6bcab5a4 100644
--- a/tests/arc/topt_no_cursor.nim
+++ b/tests/arc/topt_no_cursor.nim
@@ -98,11 +98,13 @@ scope:
           while true:
             scope:
               def_cursor _1: int = i
-              def _2: bool = ltI(arg _1, arg L)
-              def _3: bool = not(arg _2)
-              if _3:
-                scope:
-                  break L0
+              def :tmp: bool = ltI(arg _1, arg L)
+              scope:
+                def_cursor _2: bool = :tmp
+                def _3: bool = not(arg _2)
+                if _3:
+                  scope:
+                    break L0
               scope:
                 scope:
                   try:
@@ -110,12 +112,13 @@ scope:
                     def line: lent string = borrow a[_4]
                     def_cursor _5: string = line[]
                     def splitted: seq[string] = split(arg _5, arg " ", arg -1) (raises)
-                    def_cursor _6: string = splitted[0]
-                    def _7: bool = eqStr(arg _6, arg "opt")
-                    if _7:
-                      scope:
-                        def_cursor _10: string = splitted[1]
-                        =copy(name lan_ip, arg _10)
+                    scope:
+                      def_cursor _6: string = splitted[0]
+                      def _7: bool = eqStr(arg _6, arg "opt")
+                      if _7:
+                        scope:
+                          def_cursor _10: string = splitted[1]
+                          =copy(name lan_ip, arg _10)
                     def_cursor _8: string = lan_ip
                     echo(arg type(array[0..0, string]), arg _8) (raises)
                     def_cursor _9: string = splitted[1]
@@ -143,11 +146,13 @@ scope:
           while true:
             scope:
               def_cursor _2: int = i
-              def _3: bool = ltI(arg _2, arg L)
-              def _4: bool = not(arg _3)
-              if _4:
-                scope:
-                  break L0
+              def :tmp: bool = ltI(arg _2, arg L)
+              scope:
+                def_cursor _3: bool = :tmp
+                def _4: bool = not(arg _3)
+                if _4:
+                  scope:
+                    break L0
               scope:
                 scope:
                   def_cursor _5: int = i
@@ -164,14 +169,15 @@ scope:
 scope:
   try:
     def x: sink string
-    def_cursor _0: sink string = x
-    def _1: int = lengthStr(arg _0)
-    def _2: bool = eqI(arg _1, arg 2)
-    if _2:
-      scope:
-        result := move x
-        wasMoved(name x)
-        return
+    scope:
+      def_cursor _0: sink string = x
+      def _1: int = lengthStr(arg _0)
+      def _2: bool = eqI(arg _1, arg 2)
+      if _2:
+        scope:
+          result := move x
+          wasMoved(name x)
+          return
     def_cursor _3: sink string = x
     def _4: int = lengthStr(arg _3)
     def _5: string = $(arg _4) (raises)
@@ -189,14 +195,15 @@ scope:
     this[].isValid = fileExists(arg _0) (raises)
     def _1: tuple[dir: string, front: string]
     block L0:
-      def_cursor _2: string = this[].value
-      def _3: bool = dirExists(arg _2) (raises)
-      if _3:
-        scope:
-          def _4: string
-          =copy(name _4, arg this[].value)
-          _1 := construct (consume _4, consume "")
-          break L0
+      scope:
+        def_cursor _2: string = this[].value
+        def _3: bool = dirExists(arg _2) (raises)
+        if _3:
+          scope:
+            def _4: string
+            =copy(name _4, arg this[].value)
+            _1 := construct (consume _4, consume "")
+            break L0
       scope:
         try:
           def_cursor _5: string = this[].value
@@ -214,15 +221,16 @@ scope:
           =destroy(name _6)
     def par: tuple[dir: string, front: string] = move _1
     block L1:
-      def_cursor _10: string = par.0
-      def _11: bool = dirExists(arg _10) (raises)
-      if _11:
-        scope:
-          def_cursor _12: string = par.0
-          def_cursor _13: string = par.1
-          def _14: seq[string] = getSubDirs(arg _12, arg _13) (raises)
-          =sink(name this[].matchDirs, arg _14)
-          break L1
+      scope:
+        def_cursor _10: string = par.0
+        def _11: bool = dirExists(arg _10) (raises)
+        if _11:
+          scope:
+            def_cursor _12: string = par.0
+            def_cursor _13: string = par.1
+            def _14: seq[string] = getSubDirs(arg _12, arg _13) (raises)
+            =sink(name this[].matchDirs, arg _14)
+            break L1
       scope:
         def _15: seq[string] = construct ()
         =sink(name this[].matchDirs, arg _15)
diff --git a/tests/arc/topt_refcursors.nim b/tests/arc/topt_refcursors.nim
index 20b5823ee66..e0d466b1f3e 100644
--- a/tests/arc/topt_refcursors.nim
+++ b/tests/arc/topt_refcursors.nim
@@ -11,11 +11,13 @@ scope:
         scope:
           def_cursor _0: Node = it
           def _1: bool = eqRef(arg _0, arg nil)
-          def _2: bool = not(arg _1)
-          def _3: bool = not(arg _2)
-          if _3:
-            scope:
-              break L0
+          def :tmp: bool = not(arg _1)
+          scope:
+            def_cursor _2: bool = :tmp
+            def _3: bool = not(arg _2)
+            if _3:
+              scope:
+                break L0
           scope:
             def_cursor _4: Node = it
             def_cursor _5: string = _4[].s
@@ -29,11 +31,13 @@ scope:
         scope:
           def_cursor _7: Node = jt
           def _8: bool = eqRef(arg _7, arg nil)
-          def _9: bool = not(arg _8)
-          def _10: bool = not(arg _9)
-          if _10:
-            scope:
-              break L1
+          def :tmp: bool = not(arg _8)
+          scope:
+            def_cursor _9: bool = :tmp
+            def _10: bool = not(arg _9)
+            if _10:
+              scope:
+                break L1
           scope:
             def_cursor _11: Node = jt
             def_cursor ri: Node = _11[].ri
diff --git a/tests/arc/topt_wasmoved_destroy_pairs.nim b/tests/arc/topt_wasmoved_destroy_pairs.nim
index 3e23ce3ee25..2d21d939f5b 100644
--- a/tests/arc/topt_wasmoved_destroy_pairs.nim
+++ b/tests/arc/topt_wasmoved_destroy_pairs.nim
@@ -8,11 +8,12 @@ scope:
   def b: seq[seq[int]]
   def x: seq[int] = f() (raises)
   block L0:
-    if cond:
-      scope:
-        def _0: seq[int] = move x
-        add(name a, consume _0)
-        break L0
+    scope:
+      if cond:
+        scope:
+          def _0: seq[int] = move x
+          add(name a, consume _0)
+          break L0
     scope:
       def _1: seq[int] = move x
       add(name b, consume _1)
@@ -35,29 +36,33 @@ scope:
           while true:
             scope:
               def_cursor _0: int = i
-              def _1: bool = ltI(arg _0, arg b)
-              def _2: bool = not(arg _1)
-              if _2:
-                scope:
-                  break L0
+              def :tmp: bool = ltI(arg _0, arg b)
+              scope:
+                def_cursor _1: bool = :tmp
+                def _2: bool = not(arg _1)
+                if _2:
+                  scope:
+                    break L0
               scope:
                 scope:
                   def_cursor i: int = i
-                  def _3: bool = eqI(arg i, arg 2)
-                  if _3:
-                    scope:
-                      return
+                  scope:
+                    def _3: bool = eqI(arg i, arg 2)
+                    if _3:
+                      scope:
+                        return
                   def _4: seq[int]
                   =copy(name _4, arg x)
                   add(name a, consume _4)
                 i = addI(arg i, arg 1) (raises)
     block L1:
-      if cond:
-        scope:
-          def _5: seq[int] = move x
-          wasMoved(name x)
-          add(name a, consume _5)
-          break L1
+      scope:
+        if cond:
+          scope:
+            def _5: seq[int] = move x
+            wasMoved(name x)
+            add(name a, consume _5)
+            break L1
       scope:
         def _6: seq[int] = move x
         wasMoved(name x)
@@ -72,17 +77,19 @@ scope:
   try:
     def str: string
     def x: string = boolToStr(arg cond)
-    if cond:
-      scope:
-        return
+    scope:
+      if cond:
+        scope:
+          return
     def _0: string = boolToStr(arg cond)
     str := move _0
-    def _1: bool = not(arg cond)
-    if _1:
-      scope:
-        result := move str
-        wasMoved(name str)
-        return
+    scope:
+      def _1: bool = not(arg cond)
+      if _1:
+        scope:
+          result := move str
+          wasMoved(name str)
+          return
   finally:
     =destroy(name x)
     =destroy(name str)

From 63b2a528a03dc6703c5f7a9980c3bdc4b77cbce1 Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Tue, 19 Mar 2024 14:03:16 +0000
Subject: [PATCH 043/169] build(deps): Bump softprops/action-gh-release from
 2.0.3 to 2.0.4 (#1250)

Bumps

[softprops/action-gh-release](https://github.com/softprops/action-gh-release)
from 2.0.3 to 2.0.4.
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a

href="https://github.com/softprops/action-gh-release/releases">softprops/action-gh-release's
releases</a>.</em></p>
<blockquote>
<h2>v2.0.4</h2>
<ul>
<li>Minor follow up to <a

href="https://redirect.github.com/softprops/action-gh-release/pull/417">#417</a>.
<a

href="https://redirect.github.com/softprops/action-gh-release/pull/425">#425</a></li>
</ul>
</blockquote>
</details>
<details>
<summary>Changelog</summary>
<p><em>Sourced from <a

href="https://github.com/softprops/action-gh-release/blob/master/CHANGELOG.md">softprops/action-gh-release's
changelog</a>.</em></p>
<blockquote>
<h2>2.0.4</h2>
<ul>
<li>Minor follow up to <a

href="https://redirect.github.com/softprops/action-gh-release/pull/417">#417</a>.
<a

href="https://redirect.github.com/softprops/action-gh-release/pull/425">#425</a></li>
</ul>
</blockquote>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a

href="https://github.com/softprops/action-gh-release/commit/9d7c94cfd0a1f3ed45544c887983e9fa900f0564"><code>9d7c94c</code></a>
build</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/6ffed59e5547e6594ba7b3e49883af40801fa1df"><code>6ffed59</code></a>
followup to <a

href="https://redirect.github.com/softprops/action-gh-release/issues/417">#417</a>
(<a

href="https://redirect.github.com/softprops/action-gh-release/issues/425">#425</a>)</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/1ce812a7bd7fa6c191ed3334eeace31579a98f25"><code>1ce812a</code></a>
package script for updating git tag</li>
<li>See full diff in <a

href="https://github.com/softprops/action-gh-release/compare/v2.0.3...v2.0.4">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility

score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=softprops/action-gh-release&package-manager=github_actions&previous-version=2.0.3&new-version=2.0.4)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase` .

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 .github/workflows/publisher.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/publisher.yml b/.github/workflows/publisher.yml
index e87c1367b16..121528719c9 100644
--- a/.github/workflows/publisher.yml
+++ b/.github/workflows/publisher.yml
@@ -101,7 +101,7 @@ jobs:
 
       - id: release
         name: Create pre-release
-        uses: softprops/action-gh-release@v2.0.3
+        uses: softprops/action-gh-release@v2.0.4
         with:
           prerelease: true
           files: ${{ steps.release-files.outputs.result }}

From 8ca0787a6bac322b79915640c1cfb9178bdd4099 Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Tue, 19 Mar 2024 14:05:35 +0000
Subject: [PATCH 044/169] build(deps): Bump dawidd6/action-download-artifact
 from 3.1.2 to 3.1.4 (#1251)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bumps

[dawidd6/action-download-artifact](https://github.com/dawidd6/action-download-artifact)
from 3.1.2 to 3.1.4.
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a

href="https://github.com/dawidd6/action-download-artifact/releases">dawidd6/action-download-artifact's
releases</a>.</em></p>
<blockquote>
<h2>v3.1.4</h2>
<h2>What's Changed</h2>
<ul>
<li>build(deps): bump adm-zip from 0.5.10 to 0.5.12 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/dawidd6/action-download-artifact/pull/282">dawidd6/action-download-artifact#282</a></li>
<li>build(deps): bump <code>@​actions/artifact</code> from 2.1.2 to
2.1.4 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/dawidd6/action-download-artifact/pull/280">dawidd6/action-download-artifact#280</a></li>
<li>fix: accept expired artifacts with documentation url by <a
href="https://github.com/wdconinc"><code>@​wdconinc</code></a> in <a

href="https://redirect.github.com/dawidd6/action-download-artifact/pull/283">dawidd6/action-download-artifact#283</a></li>
</ul>
<h2>New Contributors</h2>
<ul>
<li><a href="https://github.com/wdconinc"><code>@​wdconinc</code></a>
made their first contribution in <a

href="https://redirect.github.com/dawidd6/action-download-artifact/pull/283">dawidd6/action-download-artifact#283</a></li>
</ul>
<p><strong>Full Changelog</strong>: <a

href="https://github.com/dawidd6/action-download-artifact/compare/v3...v3.1.4">https://github.com/dawidd6/action-download-artifact/compare/v3...v3.1.4</a></p>
<h2>v3.1.3</h2>
<h2>What's Changed</h2>
<ul>
<li>node_modules: upgrade by <a
href="https://github.com/dawidd6"><code>@​dawidd6</code></a> in <a

href="https://redirect.github.com/dawidd6/action-download-artifact/pull/276">dawidd6/action-download-artifact#276</a></li>
<li>build(deps): bump <code>@​actions/artifact</code> from 2.1.1 to
2.1.2 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/dawidd6/action-download-artifact/pull/277">dawidd6/action-download-artifact#277</a></li>
</ul>
<p><strong>Full Changelog</strong>: <a

href="https://github.com/dawidd6/action-download-artifact/compare/v3.1.2...v3.1.3">https://github.com/dawidd6/action-download-artifact/compare/v3.1.2...v3.1.3</a></p>
</blockquote>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a

href="https://github.com/dawidd6/action-download-artifact/commit/09f2f74827fd3a8607589e5ad7f9398816f540fe"><code>09f2f74</code></a>
fix: accept expired artifacts with documentation url (<a

href="https://redirect.github.com/dawidd6/action-download-artifact/issues/283">#283</a>)</li>
<li><a

href="https://github.com/dawidd6/action-download-artifact/commit/4a559bae55614d2dc605c9fc1250c5222f31a731"><code>4a559ba</code></a>
build(deps): bump <code>@​actions/artifact</code> from 2.1.2 to 2.1.4
(<a

href="https://redirect.github.com/dawidd6/action-download-artifact/issues/280">#280</a>)</li>
<li><a

href="https://github.com/dawidd6/action-download-artifact/commit/ffef66c3dd64b1f902eebb69e1fbdada641808b7"><code>ffef66c</code></a>
build(deps): bump adm-zip from 0.5.10 to 0.5.12 (<a

href="https://redirect.github.com/dawidd6/action-download-artifact/issues/282">#282</a>)</li>
<li><a

href="https://github.com/dawidd6/action-download-artifact/commit/a430ac5786b39ad5869da25a98130624d2ce340c"><code>a430ac5</code></a>
build(deps): bump <code>@​actions/artifact</code> from 2.1.1 to 2.1.2
(<a

href="https://redirect.github.com/dawidd6/action-download-artifact/issues/277">#277</a>)</li>
<li><a

href="https://github.com/dawidd6/action-download-artifact/commit/0a65e2546f0b341289d1b51568985835a6dfe495"><code>0a65e25</code></a>
node_modules: upgrade (<a

href="https://redirect.github.com/dawidd6/action-download-artifact/issues/276">#276</a>)</li>
<li>See full diff in <a

href="https://github.com/dawidd6/action-download-artifact/compare/v3.1.2...v3.1.4">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility

score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=dawidd6/action-download-artifact&package-manager=github_actions&previous-version=3.1.2&new-version=3.1.4)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase` .

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 .github/workflows/publisher.yml | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/.github/workflows/publisher.yml b/.github/workflows/publisher.yml
index 121528719c9..6e60bbb202a 100644
--- a/.github/workflows/publisher.yml
+++ b/.github/workflows/publisher.yml
@@ -30,7 +30,7 @@ jobs:
 
       # Download the latest instance of artifacts from a build done previously
       - name: Download generated docs
-        uses: dawidd6/action-download-artifact@v3.1.2
+        uses: dawidd6/action-download-artifact@v3.1.4
         with:
           workflow: ci.yml
           workflow_conclusion: success
@@ -40,7 +40,7 @@ jobs:
           path: doc/html
 
       - name: Download generated source archive
-        uses: dawidd6/action-download-artifact@v3.1.2
+        uses: dawidd6/action-download-artifact@v3.1.4
         with:
           workflow: ci.yml
           workflow_conclusion: success
@@ -50,7 +50,7 @@ jobs:
           path: release-staging
 
       - name: Download generated release binaries
-        uses: dawidd6/action-download-artifact@v3.1.2
+        uses: dawidd6/action-download-artifact@v3.1.4
         with:
           workflow: ci.yml
           workflow_conclusion: success
@@ -61,7 +61,7 @@ jobs:
           path: release-staging
 
       - name: Download release manifest tool
-        uses: dawidd6/action-download-artifact@v3.1.2
+        uses: dawidd6/action-download-artifact@v3.1.4
         with:
           workflow: ci.yml
           workflow_conclusion: success

From 19b0b9f8b6b9cf8f854f53f53f0013de26604fe4 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Thu, 21 Mar 2024 19:13:44 +0100
Subject: [PATCH 045/169] fix(sem): crash with forward-declared `=destroy` hook
 (#1252)

## Summary

Fix the compiler crashing when using a type with an, at that point,
forward-declared `=destroy` hook.

## Details

If the `=destroy` hook is forward-declared, its body is an `nkEmpty`
node, which caused a `FieldDefect` error in
`liftdestructors.createTypeBoundOps`, where the body AST is expected
to support `len`.

To resolve the issue, the `getBody(...).len` access is guarded by first
checking that the destroy hook is not overridden (indicated by the
`sfOverriden` flag); only overridden hooks can be forward-declared.
This works because `sfOverriden` implies that the attached-to type
already has the `tfHasAsgn` flag included.
---
 compiler/sem/liftdestructors.nim              |  4 ++-
 .../tforward_declared_destructor.nim          | 27 +++++++++++++++++++
 2 files changed, 30 insertions(+), 1 deletion(-)
 create mode 100644 tests/lang_objects/destructor/tforward_declared_destructor.nim

diff --git a/compiler/sem/liftdestructors.nim b/compiler/sem/liftdestructors.nim
index 8c66b425416..5712b14c2b9 100644
--- a/compiler/sem/liftdestructors.nim
+++ b/compiler/sem/liftdestructors.nim
@@ -1062,7 +1062,9 @@ proc createTypeBoundOps(g: ModuleGraph; c: PContext; orig: PType; info: TLineInf
       setAttachedOp(g, idgen.module, orig, k, getAttachedOp(g, canon, k))
 
   let op = getAttachedOp(g, orig, attachedDestructor)
-  if op != nil and getBody(g, op).len != 0:
+  # if the destructor is overridden, the ``tfHasAsgn`` flag was already
+  # included
+  if op != nil and sfOverriden notin op.flags and getBody(g, op).len != 0:
     #or not isTrival(orig.assignment) or
     # not isTrival(orig.sink):
     orig.flags.incl tfHasAsgn
diff --git a/tests/lang_objects/destructor/tforward_declared_destructor.nim b/tests/lang_objects/destructor/tforward_declared_destructor.nim
new file mode 100644
index 00000000000..73ccce83a9e
--- /dev/null
+++ b/tests/lang_objects/destructor/tforward_declared_destructor.nim
@@ -0,0 +1,27 @@
+discard """
+  description: '''
+    Regression test for a forward-declared destroy hook causing a compiler
+    crash when hooks are requested before the forward-declaration is
+    completed
+  '''
+"""
+
+# note: the comments refer to implementation details that were present at the
+# time of writing
+
+type
+  Object* = object
+
+# it's important that the destroy hook is forward-declared here
+proc `=destroy`(x: var Object)
+
+# use `Object` in a way so that no hooks are requested before `p` is
+# instantiated
+proc test(x: Object) =
+  # request hooks for the type with the still-forward-declared destroy hook,
+  # resulting in a compiler crash
+  var x = x
+
+# finish the forward declaration
+proc `=destroy`(x: var Object) =
+  discard

From 658e9b21eca216015de3a10bb9bc3e30748bdcf5 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sat, 23 Mar 2024 22:27:53 +0100
Subject: [PATCH 046/169] fix: exception handler not entered for indirect calls
 (#1254)

## Summary

Fix exception handlers sometimes being ignored for indirect calls when
building with `--panics:on`.

Fixes https://github.com/nim-works/nimskull/issues/1253

## Details

The `canRaise` procedure treated callables with a `tyProc` without an
exception effect list as not being able to raise, which is incorrect.
No exception effect list means that the exception effects are unknown,
not that there are none.

When panics are enabled, the result of `canRaise` decides whether a
routine call is a checked call (one that can potentially raise).
Procedural values with a type without an explicit `.raises`
specification have no exception effect list, so calls of them were
treated as not raising, leading to the enclosing exception handlers
being elided, if there are no other statements potentially entering the
handler.

`canRaise` is changed to conservatively consider a missing exception
effect list to mean "can raise". In addition, the procedure is
partially refactored to use a case statement, making it not ignore
invalid `tyProc` types anymore.
---
 compiler/ast/ast_query.nim                | 22 ++++++++++++++-------
 tests/exception/tindirect_call_raises.nim | 24 +++++++++++++++++++++++
 2 files changed, 39 insertions(+), 7 deletions(-)
 create mode 100644 tests/exception/tindirect_call_raises.nim

diff --git a/compiler/ast/ast_query.nim b/compiler/ast/ast_query.nim
index 8b613c6c876..5c4ac058d35 100644
--- a/compiler/ast/ast_query.nim
+++ b/compiler/ast/ast_query.nim
@@ -641,14 +641,22 @@ proc canRaise(fn: PNode): bool =
     result = false
   elif fn.kind == nkSym and fn.sym.magic == mEcho:
     result = true
-  else:
-    # TODO check for n having sons? or just return false for now if not
-    if fn.typ != nil and fn.typ.n != nil and fn.typ.n[0].kind == nkSym:
-      result = false
+  elif fn.typ != nil and fn.typ.kind == tyProc:
+    let effects {.cursor.} = fn.typ.n[0]
+    case effects.kind
+    of nkSym:
+      result = false # callable has no effects
+    of nkEffectList:
+      # if the effects were either not computed yet or there's no explicit
+      # specification, assume that the procedure can raise
+      result = effects.len < effectListLen or
+               effects[exceptionEffects].isNil or
+               effects[exceptionEffects].len > 0
     else:
-      result = fn.typ != nil and fn.typ.n != nil and ((fn.typ.n[0].len < effectListLen) or
-        (fn.typ.n[0][exceptionEffects] != nil and
-        fn.typ.n[0][exceptionEffects].safeLen > 0))
+      unreachable(effects.kind)
+  else:
+    # fn doesn't seem to be something callable, assume not raising
+    result = false
 
 proc canRaise*(panicsEnabled: bool, n: PNode): bool =
   ## 'true' if a call with `n` as the callee can exit via exceptional control-
diff --git a/tests/exception/tindirect_call_raises.nim b/tests/exception/tindirect_call_raises.nim
new file mode 100644
index 00000000000..7616c932f8b
--- /dev/null
+++ b/tests/exception/tindirect_call_raises.nim
@@ -0,0 +1,24 @@
+discard """
+  description: '''
+    Regression test for indirect calls of callables without explicit `.raises`
+    specification being treated as not being able to raise.
+
+    Refer to https://github.com/nim-works/nimskull/issues/1253
+  '''
+  matrix: "--panics:on"
+  output: "caught"
+"""
+
+# important: the procedural type must have no explicit `.raises` specification
+type Proc = proc () {.nimcall.}
+
+proc test(x: Proc) =
+  try:
+    x()
+  except CatchableError:
+    # the exception raised from `x` was previously not caught
+    echo "caught"
+
+test(proc() =
+  raise CatchableError.newException("")
+)

From 1ee8666282c3af48beaad59a11fb68b6399dea9e Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Thu, 28 Mar 2024 22:17:24 +0100
Subject: [PATCH 047/169] mir: use `Local` instead of `PSym` for locals (#1258)

## Summary

For parameters and locals, replace `PSym` with `LocalId` -- the actual
data (name, type, etc.) is stored separately as a list of `Local`s. The
idea is to:
* remove another difference between the MIR and CGIR
* remove another `PSym` usage from the MIR (less GC'ed type usage, less
  coupling between sem and the mid-/back-end)

## Details

### MIR

* `mnkParam` and `mnkLocal` nodes store a `LocalId`; the `SymbolLike`
  set is removed
* the list of `Local`s is stored in `MirBody` (looked up via `LocalId`)
* the `Local` type and `resultId` constant are moved from the `cgir` to
  the `mirbodies` module
* new locals are registered through a `MirBuilder` instance
* the pretty-printing procedures accept an optional `ptr MirBody`; it's
  needed for rendering the original names of the locals/parameters

### New Container: `PartialStore`

* `PartialStore` is intended for recording additions to a `Store` out-
  of-place
* upon finishing recording additions, a `PartialStore` can either be
  dropped or joined with the `Store` it was forked from

### Translation

* `mirgen` translates `PSym`s to `Local`, in the same way as `cgirgen`
  previously did
* `cgirgen` is still responsible for creating `Local`s for temporaries
* when manually creating `MirBody`s, a slot for the result variable has
  to be reserved
---
 compiler/backend/backends.nim      |  17 +++--
 compiler/backend/cgir.nim          |  29 ++------
 compiler/backend/cgirgen.nim       |  60 ++---------------
 compiler/mir/analysis.nim          |   6 +-
 compiler/mir/mirbodies.nim         |  34 +++++++++-
 compiler/mir/mirchangesets.nim     |  10 ++-
 compiler/mir/mirconstr.nim         |  31 +++++++--
 compiler/mir/mirgen.nim            |  88 +++++++++++++++++++++---
 compiler/mir/mirpasses.nim         |  14 ++--
 compiler/mir/mirtrees.nim          |   8 +--
 compiler/mir/utils.nim             | 103 +++++++++++++++++------------
 compiler/sem/aliasanalysis.nim     |   6 +-
 compiler/sem/injectdestructors.nim |  15 ++---
 compiler/utils/containers.nim      |  39 +++++++++++
 compiler/vm/vmjit.nim              |   9 ++-
 tests/compiler/ttreechangesets.nim |   4 +-
 16 files changed, 301 insertions(+), 172 deletions(-)

diff --git a/compiler/backend/backends.nim b/compiler/backend/backends.nim
index b2cbf3fdf9a..c0ad7ff81a2 100644
--- a/compiler/backend/backends.nim
+++ b/compiler/backend/backends.nim
@@ -332,7 +332,7 @@ proc process(body: var MirBody, prc: PSym, graph: ModuleGraph,
 
     if graph.config.arcToExpand.hasKey(prc.name.s):
       graph.config.msgWrite("--expandArc: " & prc.name.s & "\n")
-      graph.config.msgWrite(render(body.code, addr env))
+      graph.config.msgWrite(render(body.code, addr env, addr body))
       graph.config.msgWrite("\n-- end of expandArc ------------------------\n")
 
   let target =
@@ -383,14 +383,16 @@ proc produceFragmentsForGlobals(
     # the fragments need to be wrapped in scopes; some MIR passes depend
     # on this
     if bu.front.len == 0:
+      discard bu.addLocal(Local()) # empty result slot
       bu.add(m.add(n)): MirNode(kind: mnkScope)
 
   func finish(bu: sink MirBuilder, m: var SourceMap, n: PNode
-             ): MirTree {.nimcall.} =
+             ): auto {.nimcall.} =
     if bu.front.len > 0:
       bu.setSource(m.add(n))
       bu.add endNode(mnkScope)
-    result = finish(bu)
+    # we're creating a body here, so there is no list of locals yet
+    result = finish(bu, default(Store[LocalId, Local]))
 
   var init, deinit: MirBuilder
 
@@ -420,8 +422,10 @@ proc produceFragmentsForGlobals(
         deinit.setSource(result.deinit.source.add(it[0]))
         genDestroy(deinit, graph, env, toValue(global, s.typ))
 
-  result.init.code = finish(init, result.init.source, graph.emptyNode)
-  result.deinit.code = finish(deinit, result.deinit.source, graph.emptyNode)
+  (result.init.code, result.init.locals) =
+    finish(init, result.init.source, graph.emptyNode)
+  (result.deinit.code, result.deinit.locals) =
+    finish(deinit, result.deinit.source, graph.emptyNode)
 
 # ----- dynlib handling -----
 
@@ -512,6 +516,7 @@ proc produceLoader(graph: ModuleGraph, m: Module, data: var DiscoveryData,
   extname.typ = graph.getSysType(lib.path.info, tyCstring)
 
   var bu = initBuilder(result.source.add(path))
+  discard bu.addLocal(Local()) # empty result slot
 
   let dest =
     if sym.kind in routineKinds:
@@ -562,7 +567,7 @@ proc produceLoader(graph: ModuleGraph, m: Module, data: var DiscoveryData,
         bu.emitByVal tmp
 
   bu.add endNode(mnkScope)
-  result.code = finish(bu)
+  (result.code, result.locals) = finish(bu, result.locals)
 
 # ----- discovery and queueing logic -----
 
diff --git a/compiler/backend/cgir.nim b/compiler/backend/cgir.nim
index a19ac5e1704..23bfa39e1e0 100644
--- a/compiler/backend/cgir.nim
+++ b/compiler/backend/cgir.nim
@@ -12,12 +12,18 @@ import
     lineinfos
   ],
   compiler/mir/[
+    mirbodies,
     mirtrees
   ],
   compiler/utils/[
     containers
   ]
 
+# compatibility exports for symbols originally defined here
+export Local
+export LocalId
+export resultId
+
 type
   CgNodeKind* = enum
     cnkInvalid ## the node is uninitialized
@@ -156,28 +162,10 @@ const
   cnkLiterals* = {cnkIntLit, cnkUIntLit, cnkFloatLit, cnkStrLit}
 
 type
-  Local* = object
-    ## Static information about a local variable. Initialized prior to code
-    ## generation and only read (but not written) by the code generators.
-    typ*: PType
-    alignment*: uint32
-    flags*: TSymFlags
-    isImmutable*: bool
-      ## whether the local is expected to not be mutated, from a high-level
-      ## language perspective. Note that this doesn't meant that it really
-      ## isn't mutated, rather this information is intended to help the
-      ## the code generators optimize
-    # future direction: merge `flags` and `isImmutable` into a single set of
-    # flags
-    name*: PIdent
-      ## either the user-defined name or 'nil'
-
   BlockId* = distinct uint32
     ## Identifies a block within another block -- the IDs are **not** unique
     ## within a ``Body``. An outermost block has ID 0, a block within the
     ## block ID 1, etc.
-  LocalId* = distinct uint32
-    ## Identifies a local within a procedure.
 
   CgNode* {.acyclic.} = ref object
     ## A node in the tree structure representing code during the code
@@ -213,10 +201,6 @@ type
     locals*: Store[LocalId, Local] ## all locals belonging to the body
     code*: CgNode
 
-const
-  resultId* = LocalId(0)
-    ## the ID of the local representing the ``result`` variable
-
 func len*(n: CgNode): int {.inline.} =
   n.kids.len
 
@@ -273,7 +257,6 @@ proc newOp*(kind: CgNodeKind; info: TLineInfo, typ: PType,
 func newLocalRef*(id: LocalId, info: TLineInfo, typ: PType): CgNode =
   CgNode(kind: cnkLocal, info: info, typ: typ, local: id)
 
-proc `==`*(x, y: LocalId): bool {.borrow.}
 proc `==`*(x, y: BlockId): bool {.borrow.}
 
 proc merge*(dest: var Body, source: Body): CgNode =
diff --git a/compiler/backend/cgirgen.nim b/compiler/backend/cgirgen.nim
index 4c6af0a160d..53dfb49fd61 100644
--- a/compiler/backend/cgirgen.nim
+++ b/compiler/backend/cgirgen.nim
@@ -60,9 +60,6 @@ type
 
     tempMap: SeqMap[TempId, LocalId]
       ## maps a ``TempId`` to the ID of the local created for it
-    localsMap: Table[int, LocalId]
-      ## maps a sybmol ID to the corresponding local. Needed because normal
-      ## local variables reach here as ``PSym``s
     blocks: seq[tuple[input, actual: LabelId]]
       ## the stack of enclosing blocks for the currently processed node
 
@@ -251,13 +248,6 @@ proc newDefaultCall(info: TLineInfo, typ: PType): CgNode =
   ## Produces the tree for a ``default`` magic call.
   newExpr(cnkCall, info, typ, [newMagicNode(mDefault, info)])
 
-proc initLocal(s: PSym): Local =
-  ## Inits a ``Local`` with the data from `s`.
-  result = Local(typ: s.typ, flags: s.flags, isImmutable: (s.kind == skLet),
-                 name: s.name)
-  if s.kind in {skVar, skLet, skForVar}:
-    result.alignment = s.alignment.uint32
-
 proc wrapInHiddenAddr(cl: TranslateCl, n: CgNode): CgNode =
   ## Restores the ``cnkHiddenAddr`` around lvalue expressions passed to ``var``
   ## parameters. The code-generators operating on ``CgNode``-IR depend on the
@@ -333,9 +323,7 @@ proc atomToIr(n: MirNode, cl: TranslateCl, info: TLineInfo): CgNode =
   of mnkConst:
     CgNode(kind: cnkConst, info: info, typ: n.typ, cnst: n.cnst)
   of mnkLocal, mnkParam:
-    # paramaters are treated like locals in the code generators
-    assert n.sym.id in cl.localsMap
-    newLocalRef(cl.localsMap[n.sym.id], info, n.sym.typ)
+    newLocalRef(n.local, info, cl.locals[n.local].typ)
   of mnkTemp:
     newLocalRef(cl.tempMap[n.temp], info, n.typ)
   of mnkAlias:
@@ -364,11 +352,7 @@ proc tbExceptItem(tree: MirBody, cl: var TranslateCl, cr: var TreeCursor
                  ): CgNode =
   let n {.cursor.} = get(tree, cr)
   case n.kind
-  of mnkLocal:
-    # the 'except' branch acts as a definition for the local
-    let id = cl.locals.add initLocal(n.sym)
-    cl.localsMap[n.sym.id] = id
-    newLocalRef(id, cr.info, n.typ)
+  of mnkLocal: newLocalRef(n.local, cr.info, n.typ)
   of mnkType:  newTypeNode(cr.info, n.typ)
   else:        unreachable()
 
@@ -534,15 +518,8 @@ proc defToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
 
   case entity.kind
   of mnkLocal:
-    # translate the ``PSym`` to a ``Local`` and establish a mapping
-    let
-      sym = entity.sym
-      id = cl.locals.add initLocal(sym)
-
-    assert sym.id notin cl.localsMap, "re-definition of local"
-    cl.localsMap[sym.id] = id
-
-    def = newLocalRef(id, info, entity.typ)
+    let id = entity.local
+    def = newLocalRef(id, info, cl.locals[id].typ)
   of mnkParam:
     # ignore 'def's for parameters
     def = newEmpty()
@@ -1165,33 +1142,8 @@ proc generateIR*(graph: ModuleGraph, idgen: IdGenerator, env: MirEnv,
                  body: sink MirBody): Body =
   ## Generates the ``CgNode`` IR corresponding to the input MIR `body`,
   ## using `idgen` to provide new IDs when creating symbols.
-  var cl = TranslateCl(graph: graph, idgen: idgen, owner: owner)
-  if owner.kind in routineKinds:
-    # setup the locals and associated mappings for the parameters
-    template add(v: PSym) =
-      let s = v
-      cl.localsMap[s.id] = cl.locals.add initLocal(s)
-
-    let sig =
-      if owner.kind == skMacro: owner.internal
-      else:                     owner.typ
-
-    # result variable:
-    if sig[0].isEmptyType():
-      # always reserve a slot for the result variable, even if the latter is
-      # not present
-      discard cl.locals.add(Local())
-    else:
-      add(owner.ast[resultPos].sym)
-
-    # normal parameters:
-    for i in 1..<sig.len:
-      add(sig.n[i].sym)
-
-    if sig.callConv == ccClosure:
-      # environment parameter
-      add(owner.ast[paramsPos][^1].sym)
-
+  var cl = TranslateCl(graph: graph, idgen: idgen, owner: owner,
+                       locals: move body.locals)
   # enable translation:
   cl.isActive = true
 
diff --git a/compiler/mir/analysis.nim b/compiler/mir/analysis.nim
index f815d493586..01282bd7e21 100644
--- a/compiler/mir/analysis.nim
+++ b/compiler/mir/analysis.nim
@@ -206,7 +206,7 @@ func isLastWrite*(tree: MirTree, cfg: DataFlowGraph, span: Subgraph, loc: Path,
 
   result = (true, state.exit, state.escapes)
 
-func computeAliveOp*[T: PSym | GlobalId | TempId](
+func computeAliveOp*[T: LocalId | GlobalId | TempId](
   tree: MirTree, loc: T, op: Opcode, n: OpValue): AliveState =
   ## Computes the state of `loc` at the *end* of the given operation. The
   ## operands are expected to *not* alias with each other. The analysis
@@ -217,8 +217,8 @@ func computeAliveOp*[T: PSym | GlobalId | TempId](
       n.kind == mnkTemp and n.temp == loc
     elif T is GlobalId:
       n.kind == mnkGlobal and n.global == loc
-    elif T is PSym:
-      n.kind in {mnkLocal, mnkParam} and n.sym.id == loc.id
+    elif T is LocalId:
+      n.kind in {mnkLocal, mnkParam} and n.local == loc
     else:
       {.error.}
 
diff --git a/compiler/mir/mirbodies.nim b/compiler/mir/mirbodies.nim
index 8195adb942b..a6cac04050d 100644
--- a/compiler/mir/mirbodies.nim
+++ b/compiler/mir/mirbodies.nim
@@ -8,9 +8,30 @@ import
   compiler/mir/[
     mirtrees,
     sourcemaps
+  ],
+  compiler/utils/[
+    containers
   ]
 
 type
+  Local* = object
+    ## Static information about a local location ('let' or 'var'). Not modified
+    ## after initialization.
+    typ*: PType
+      ## type of the local
+    alignment*: uint32
+      ## alignment of the location, measured in bytes. 0 means "use default"
+    flags*: TSymFlags
+    isImmutable*: bool
+      ## whether the local was originally defined with ``let``. Used for
+      ## optimization purposes
+    # future direction: merge `flags` and `isImmutable` into a single set of
+    # flags
+    name*: PIdent
+      ## either the user-defined name or 'nil'
+
+  Locals* = Store[LocalId, Local]
+
   MirBody* = object
     ## A ``MirBody`` represents a self-contained piece of MIR code. This can
     ## either be:
@@ -22,11 +43,22 @@ type
     ## In each case, ``MirBody`` stores all the local data referenced and
     ## needed by the body's MIR code. It also store additional information
     ## associated with a body, such as how far the lowering is along.
+    locals*: Locals
+      ## all locals part of the body
     source*: SourceMap
     code*: MirTree
 
+const
+  resultId* = LocalId(0)
+    ## the ID of the result variable. A slot for the result variable is always
+    ## reserved, even if there is no result variable for a body
+
 func `[]`*(body: MirBody, n: NodePosition): lent MirNode {.inline.} =
   body.code[n]
 
 func sourceFor*(body: MirBody, n: NodePosition): PNode {.inline.} =
-  body.source[body.code[n].info]
\ No newline at end of file
+  body.source[body.code[n].info]
+
+func `[]`*(body: MirBody, id: LocalId): lent Local {.inline.} =
+  ## Returns the local corresponding to `id`.
+  body.locals[id]
diff --git a/compiler/mir/mirchangesets.nim b/compiler/mir/mirchangesets.nim
index ed038118479..e005a0fe48c 100644
--- a/compiler/mir/mirchangesets.nim
+++ b/compiler/mir/mirchangesets.nim
@@ -9,12 +9,17 @@ import
     mirtrees,
     sourcemaps,
     treechangesets
+  ],
+  compiler/utils/[
+    containers
   ]
 
 type
   Changeset* = object
     ## Represents a set of changes to be applied to a ``MirBody``.
     inner: TreeChangeset
+    locals: PartialStore[LocalId, Local]
+      ## new locals to be added on changeset application
     numTemps: uint32
       ## keeps track of the number of temporaries. Exchanged with
       ## the created builder, where it's used for allocating new IDs
@@ -46,6 +51,7 @@ template remove*(c: var Changeset, tree: MirTree, at: NodePosition) =
 func initChangeset*(body: MirBody): Changeset =
   ## Sets up a changeset for `body`. The changeset either needs to be
   ## discarded, or applied to the same ``MirBody`` instance it was created for.
+  result = Changeset(locals: fork(body.locals))
   # compute the next ID to use for new temporaries:
   for i, n in body.code.pairs:
     if n.kind in DefNodes and
@@ -58,12 +64,13 @@ func initBuilder(c: var Changeset, buffer: var MirNodeSeq,
   ## ``finishBuilder`` call.
   result = initBuilder(info, move buffer)
   swap(c.numTemps, result.numTemps)
+  swap(c.locals, result.locals)
 
 func finishBuilder(c: var Changeset, buffer: var MirNodeSeq,
                    bu: sink MirBuilder) =
   # move the ID counter and buffer back into the changeset
   swap(c.numTemps, bu.numTemps)
-  buffer = finish(bu)
+  (buffer, c.locals) = finish(bu)
 
 template insert*(c: var Changeset, tree: MirTree, at, source: NodePosition,
                  name: untyped, body: untyped) =
@@ -90,3 +97,4 @@ template replaceMulti*(c: var Changeset, tree: MirTree, at: NodePosition,
 func apply*(body: var MirBody, c: sink Changeset) =
   ## Applies the changeset `c` to `body`.
   apply(body.code, prepare(move c.inner))
+  join(body.locals, move c.locals)
diff --git a/compiler/mir/mirconstr.nim b/compiler/mir/mirconstr.nim
index 120515f6cdb..fb5747b8274 100644
--- a/compiler/mir/mirconstr.nim
+++ b/compiler/mir/mirconstr.nim
@@ -5,9 +5,11 @@ import
     ast_types
   ],
   compiler/mir/[
-    mirtrees
+    mirtrees,
+    mirbodies
   ],
   compiler/utils/[
+    containers,
     idioms
   ],
   experimental/[
@@ -51,6 +53,8 @@ type
       ## the ID of the meta-data to associate with all added nodes (that
       ## don't have an explicitly assigned source ID)
 
+    locals*: PartialStore[LocalId, Local]
+      ## new locals created with the builder
     numTemps*: uint32
       ## tracks the number of existing temporaries. Used for allocating new
       ## IDs.
@@ -91,8 +95,9 @@ func toValue*(id: GlobalId, typ: PType): Value =
 func toValue*(id: ProcedureId, typ: PType): Value =
   Value(node: MirNode(kind: mnkProc, typ: typ, prc: id))
 
-func toValue*(kind: range[mnkParam..mnkLocal], sym: PSym): Value =
-  Value(node: MirNode(kind: kind, typ: sym.typ, sym: sym))
+func toValue*(kind: range[mnkParam..mnkLocal], id: LocalId,
+              typ: PType): Value =
+  Value(node: MirNode(kind: kind, typ: typ, local: id))
 
 # --------- MirBuffer interface ----------
 
@@ -250,6 +255,10 @@ func setSource*(bu: var MirBuilder, id: SourceId) =
     # now change the active ID
     bu.currentSourceId = id
 
+func addLocal*(bu: var MirBuilder, data: sink Local): LocalId {.inline.} =
+  ## Adds a new local to the body and returns the ID to address it with.
+  bu.locals.add data
+
 func add*(bu: var MirBuilder, n: sink MirNode) {.inline.} =
   ## Emits `n` to the node buffers.
   bu.front.add n
@@ -440,8 +449,9 @@ func materializeMove*(bu: var MirBuilder, loc: Value): Value =
   bu.wrapTemp loc.typ:
     bu.move loc
 
-func finish*(bu: sink MirBuilder): MirTree =
-  ## Consumes `bu` and returns the finished tree.
+func finish*(bu: sink MirBuilder): auto =
+  ## Low-level procedure that consumes `bu` and returns the finished tree
+  ## and partial store of the locals.
   if bu.swapped:
     swap(bu.front, bu.back)
     bu.swapped = false
@@ -449,4 +459,13 @@ func finish*(bu: sink MirBuilder): MirTree =
   assert bu.back.len == 0, "staging buffer is not empty"
   # make sure all nodes have their info IDs assigned:
   apply(bu.front, bu.currentSourceId)
-  result = move bu.front.nodes
+  result = (move bu.front.nodes, move bu.locals)
+
+func finish*(bu: sink MirBuilder, locals: sink Store[LocalId, Local]): auto =
+  ## Returns the finished tree from `bu`, plus `locals` joined with the locals
+  ## created with the builder. `locals` must be the store the `bu` was initially
+  ## set-up with.
+  let (tree, partial) = finish(bu)
+  result = (tree, move locals)
+  # join the partial store into the base store:
+  join(result[1], partial)
diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index b2e0aa7b930..a5f497da1d6 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -151,6 +151,8 @@ type
 
     blocks: seq[Block] ## the stack of active ``block``s. Used for looking up
                        ## break targets
+    localsMap: Table[int, LocalId]
+      ## maps symbol IDs of locals to the corresponding ``LocalId``
 
     sp: SourceProvider
 
@@ -253,6 +255,22 @@ template useSource(bu: var MirBuilder, sp: var SourceProvider,
     bu.setSource(prev[1])
     swap(prev, sp.active)
 
+# -------------- Symbol translation --------------
+
+func localToMir(s: PSym): Local =
+  Local(typ: s.typ, flags: s.flags,
+        isImmutable: s.kind in {skLet, skForVar},
+        name: s.name,
+        alignment:
+          if s.kind in {skVar, skLet, skForVar}:
+            s.alignment.uint32
+          else:
+            0
+        )
+
+template paramToMir(s: PSym): Local =
+  localToMir(s)
+
 # -------------- builder/convenience routines -------------
 
 template add(c: var TCtx, n: MirNode) =
@@ -285,6 +303,16 @@ template emitByName(c: var TCtx, eff: EffectKind, body: untyped) =
     c.subTree MirNode(kind: mnkTag, effect: eff):
       body
 
+template addLocal(c: var TCtx, local: Local): LocalId =
+  c.builder.addLocal(local)
+
+func addLocal(c: var TCtx, s: PSym): LocalId =
+  ## Translates `s` to its MIR representation, registers it with body, and
+  ## establishes a mapping.
+  assert s.id notin c.localsMap
+  result = c.addLocal(localToMir(s))
+  c.localsMap[s.id] = result
+
 proc empty(c: var TCtx, n: PNode): MirNode =
   MirNode(kind: mnkNone, typ: n.typ)
 
@@ -296,18 +324,18 @@ func nameNode(c: var TCtx, s: PSym): MirNode =
   of skTemp:
     # temporaries are always locals, even if marked with the ``sfGlobal``
     # flag
-    MirNode(kind: mnkLocal, typ: s.typ, sym: s)
+    MirNode(kind: mnkLocal, typ: s.typ, local: c.localsMap[s.id])
   of skConst:
     MirNode(kind: mnkConst, typ: s.typ, cnst: c.env.constants.add(s))
   of skParam:
-    MirNode(kind: mnkParam, typ: s.typ, sym: s)
+    MirNode(kind: mnkParam, typ: s.typ, local: LocalId(1 + s.position))
   of skResult:
-    MirNode(kind: mnkLocal, typ: s.typ, sym: s)
+    MirNode(kind: mnkLocal, typ: s.typ, local: resultId)
   of skVar, skLet, skForVar:
     if sfGlobal in s.flags:
       MirNode(kind: mnkGlobal, typ: s.typ, global: c.env.globals.add(s))
     else:
-      MirNode(kind: mnkLocal, typ: s.typ, sym: s)
+      MirNode(kind: mnkLocal, typ: s.typ, local: c.localsMap[s.id])
   else:
     unreachable(s.kind)
 
@@ -1262,6 +1290,10 @@ proc genLocDef(c: var TCtx, n: PNode, val: PNode) =
       # the definition doesn't imply default intialization
       discard
   else:
+    if kind == pirLocal:
+      # translate the symbol of the local:
+      discard c.addLocal(s)
+
     c.buildStmt (if sfCursor in s.flags: mnkDefCursor else: mnkDef):
       c.add nameNode(c, s)
       if hasInitializer:
@@ -1541,7 +1573,8 @@ proc genExceptBranch(c: var TCtx, n: PNode, dest: Destination) =
         # ``T as a`` doesn't get transformed to just ``T`` if ``T`` is the
         # type of an imported exception -- the local's name is used at the
         # MIR level
-        c.add MirNode(kind: mnkLocal, typ: tn[2].typ, sym: tn[2].sym)
+        let id = c.addLocal(tn[2].sym)
+        c.add MirNode(kind: mnkLocal, typ: tn[2].typ, local: id)
       else:
         unreachable()
 
@@ -2037,6 +2070,29 @@ proc generateCode*(graph: ModuleGraph, env: var MirEnv,
   # move the state back into the output parameters:
   swapState()
 
+proc addParams(c: var TCtx, prc: PSym, signature: PType) =
+  ## Translates the result variable and the parameters (taken from `signature`)
+  ## to their MIR representation and adds them to the list of locals.
+  template add(x: Local) =
+    discard c.addLocal(x)
+
+  # result variable:
+  if signature[0].isEmptyType():
+    # always reserve a slot for the result variable, even if the latter is
+    # not present
+    add Local()
+  else:
+    add localToMir(prc.ast[resultPos].sym)
+
+  # parameters:
+  let params = signature.n
+  for i in 1..<params.len:
+    add paramToMir(params[i].sym)
+
+  if signature.callConv == ccClosure:
+    # environment parameter
+    add paramToMir(prc.ast[paramsPos][^1].sym)
+
 proc generateCode*(graph: ModuleGraph, env: var MirEnv, owner: PSym,
                    config: TranslationConfig,  body: PNode): MirBody =
   ## Generates the full MIR body for the given AST `body`.
@@ -2064,15 +2120,27 @@ proc generateCode*(graph: ModuleGraph, env: var MirEnv, owner: PSym,
     c.add MirNode(kind: mnkStmtList)
 
   if owner.kind in routineKinds:
+    # the procedure backing a macro has its own internal signature; use that
+    # beyond this point
+    let signature =
+      if owner.kind == skMacro:
+        owner.internal
+      else:
+        owner.typ
+
+    addParams(c, owner, signature)
     # add a 'def' for each ``sink`` parameter. This simplifies further
     # processing and analysis
-    let params = owner.typ.n
+    let params = signature.n
     for i in 1..<params.len:
       let s = params[i].sym
       if s.typ.isSinkTypeForParam():
         c.subTree mnkDef:
-          c.add MirNode(kind: mnkParam, typ: s.typ, sym: s)
+          c.add nameNode(c, s)
           c.add MirNode(kind: mnkNone)
+  else:
+    # reserve the result slot:
+    discard c.addLocal(Local())
 
   gen(c, body)
 
@@ -2095,8 +2163,8 @@ proc generateCode*(graph: ModuleGraph, env: var MirEnv, owner: PSym,
   swap(c.env, env) # swap back
 
   # move the buffers into the result body
-  MirBody(source: move c.sp.map,
-          code: finish(move c.builder))
+  let (code, locals) = finish(move c.builder, default(Store[LocalId, Local]))
+  MirBody(locals: locals, source: move c.sp.map, code: code)
 
 proc constDataToMir*(env: var MirEnv, n: PNode): MirTree =
   ## Translates the construction expression AST `n` representing some
@@ -2144,4 +2212,4 @@ proc constDataToMir*(env: var MirEnv, n: PNode): MirTree =
   # push and pop the content so that ``constToMirAux`` places the nodes into
   # the staging buffer, which is necessary for after-the-fact type patching
   bu.pop(bu.push(constToMirAux(bu, env, n)))
-  bu.finish()
+  bu.finish()[0]
diff --git a/compiler/mir/mirpasses.nim b/compiler/mir/mirpasses.nim
index 74ba5c7076c..2ee8f47b147 100644
--- a/compiler/mir/mirpasses.nim
+++ b/compiler/mir/mirpasses.nim
@@ -380,7 +380,7 @@ proc extractStringLiterals(tree: MirTree, env: var MirEnv,
       changes.replaceMulti(tree, i, bu):
         bu.use toValue(c, tree[i].typ)
 
-proc injectResultInit(tree: MirTree, resultVar: PSym, changes: var Changeset) =
+proc injectResultInit(tree: MirTree, resultTyp: PType, changes: var Changeset) =
   ## Injects a default-initialization for the result variable, if deemed
   ## necessary by data-flow analysis.
   ##
@@ -393,7 +393,7 @@ proc injectResultInit(tree: MirTree, resultVar: PSym, changes: var Changeset) =
   # future direction: once possible, extend this pass to apply to all local
   # variables
   func isResult(tree: MirTree, n: OpValue): bool =
-    tree[n].kind == mnkLocal and tree[n].sym.kind == skResult
+    tree[n].kind == mnkLocal and tree[n].local == resultId
 
   func requiresInit(tree: MirTree): bool =
     let
@@ -429,8 +429,8 @@ proc injectResultInit(tree: MirTree, resultVar: PSym, changes: var Changeset) =
     let at = tree.child(NodePosition 0, 0)
     changes.insert(tree, at, at, bu):
       bu.subTree mnkInit:
-        bu.use toValue(mnkLocal, resultVar)
-        bu.buildMagicCall mDefault, resultVar.typ:
+        bu.use toValue(mnkLocal, resultId, resultTyp)
+        bu.buildMagicCall mDefault, resultTyp:
           discard
 
 proc injectProfilerCalls(tree: MirTree, graph: ModuleGraph, env: var MirEnv,
@@ -476,11 +476,11 @@ proc applyPasses*(body: var MirBody, prc: PSym, env: var MirEnv,
       preventRvo(body.code, c)
 
   batch:
-    if target == targetC and (prc.kind in routineKinds) and
-       (sfNoInit notin prc.flags) and not prc.typ[0].isEmptyType():
+    if target == targetC and body[resultId].typ != nil and
+       (sfNoInit notin body[resultId].flags):
       # the procedure has a result variable and initialization of it is
       # allowed
-      injectResultInit(body.code, prc.ast[resultPos].sym, c)
+      injectResultInit(body.code, body[resultId].typ, c)
 
     lowerSwap(body.code, c)
     if target == targetVm:
diff --git a/compiler/mir/mirtrees.nim b/compiler/mir/mirtrees.nim
index 5db9af07b8a..30cd6cfd523 100644
--- a/compiler/mir/mirtrees.nim
+++ b/compiler/mir/mirtrees.nim
@@ -11,7 +11,7 @@ import
   ]
 
 type
-  LocalId {.used.} = distinct uint32
+  LocalId* = distinct uint32
     ## Identifies a local inside a code fragment
   GlobalId* = distinct uint32
     ## Identifies a global across all MIR code
@@ -277,7 +277,7 @@ type
     of mnkConst:
       cnst*: ConstId
     of mnkParam, mnkLocal:
-      sym*: PSym
+      local*: LocalId
     of mnkField, mnkPathNamed, mnkPathVariant:
       field*: PSym
     of mnkLiteral:
@@ -344,9 +344,6 @@ const
     ## Assignment modifiers. Nodes that can only appear directly in the source
     ## slot of assignments.
 
-  SymbolLike* = {mnkParam, mnkLocal}
-    ## Nodes for which the `sym` field is available
-
   ConstrTreeNodes* = {mnkConstr, mnkObjConstr, mnkLiteral, mnkProc,
                       mnkArg, mnkField, mnkEnd}
     ## Nodes that can appear in the MIR subset used for constant expressions.
@@ -378,6 +375,7 @@ const
   CallKinds* = {mnkCall, mnkCheckedCall}
 
 func `==`*(a, b: SourceId): bool {.borrow.}
+func `==`*(a, b: LocalId): bool {.borrow.}
 func `==`*(a, b: TempId): bool {.borrow.}
 func `==`*(a, b: LabelId): bool {.borrow.}
 func `==`*(a, b: ConstId): bool {.borrow.}
diff --git a/compiler/mir/utils.nim b/compiler/mir/utils.nim
index b408c47c9b3..03fbd70b053 100644
--- a/compiler/mir/utils.nim
+++ b/compiler/mir/utils.nim
@@ -15,6 +15,7 @@ import
     typesrenderer,
   ],
   compiler/mir/[
+    mirbodies,
     mirenv,
     mirtrees
   ]
@@ -32,8 +33,8 @@ func `$`(n: MirNode): string =
     result.add " global: "
     result.addInt n.global.uint32
   of mnkParam, mnkLocal:
-    result.add " sym: "
-    result.add $n.sym.name.s
+    result.add " local: "
+    result.addInt n.local.uint32
   of mnkField, mnkPathNamed, mnkPathVariant:
     result.add " field:"
     result.add $n.field.name.s
@@ -120,7 +121,10 @@ proc treeRepr*(tree: MirTree, pos = NodePosition(0)): string =
 # ------- MIR pretty printer --------
 
 type
-  EnvPtr = ptr MirEnv
+  RenderCtx = object
+    ## Contextual immutable data for the renderer.
+    env: ptr MirEnv   ## may be nil
+    body: ptr MirBody ## may be nil
 
 template treeParam(): untyped =
   ## Expands to ``nodes`` or ``tree``, depending on how the parameter is
@@ -135,30 +139,42 @@ func next(tree: MirTree, i: var int): lent MirNode =
   result = tree[i]
   inc i
 
-func addName[I](result: var string, id: I, open: string, env: EnvPtr) =
-  if env.isNil:
+func addName[I](result: var string, id: I, open: string, c: RenderCtx) =
+  if c.env.isNil:
     # just render the ID
     result.add open
     result.addInt id.uint32
     result.add ">"
   else:
-    result.add env[][id].name.s
+    result.add c.env[][id].name.s
 
-proc singleToStr(n: MirNode, result: var string, env: EnvPtr) =
+func addLocalName(result: var string, id: LocalId, open: string,
+                  c: RenderCtx) =
+  if c.body.isNil:
+    # render just the ID
+    result.add open
+    result.addInt id.uint32
+    result.add ">"
+  else:
+    result.add c.body[][id].name.s
+
+proc singleToStr(n: MirNode, result: var string, c: RenderCtx) =
   case n.kind
-  of SymbolLike:
-    result.add n.sym.name.s
+  of mnkParam:
+    result.addLocalName(n.local, "<Param", c)
+  of mnkLocal:
+    result.addLocalName(n.local, "<L", c)
   of mnkConst:
     if isAnon(n.cnst):
       result.add "<D" # "D" for "Data"
       result.addInt extract(n.cnst).uint32
       result.add ">"
     else:
-      result.addName(n.cnst, "<C", env)
+      result.addName(n.cnst, "<C", c)
   of mnkGlobal:
-    result.addName(n.global, "<G", env)
+    result.addName(n.global, "<G", c)
   of mnkProc:
-    result.addName(n.prc, "<P", env)
+    result.addName(n.prc, "<P", c)
   of mnkTemp, mnkAlias:
     result.add "_" & $n.temp.int
   of mnkNone:
@@ -172,17 +188,17 @@ proc singleToStr(n: MirNode, result: var string, env: EnvPtr) =
   of AllNodeKinds - Atoms:
     result.add "<error: " & $n.kind & ">"
 
-proc singleToStr(tree: MirTree, i: var int, result: var string, env: EnvPtr) =
-  singleToStr(next(tree, i), result, env)
+proc singleToStr(tree: MirTree, i: var int, result: var string, c: RenderCtx) =
+  singleToStr(next(tree, i), result, c)
 
 template singleToStr() =
-  singleToStr(treeParam(), i, result, env)
+  singleToStr(treeParam(), i, result, c)
 
 template valueToStr() =
   mixin valueToStr
-  valueToStr(treeParam(), i, result, env)
+  valueToStr(treeParam(), i, result, c)
 
-proc valueToStr(nodes: MirTree, i: var int, result: var string, env: EnvPtr) =
+proc valueToStr(nodes: MirTree, i: var int, result: var string, c: RenderCtx) =
   template tree(start: string, body: untyped) =
     result.add start
     body
@@ -217,11 +233,11 @@ proc valueToStr(nodes: MirTree, i: var int, result: var string, env: EnvPtr) =
       singleToStr()
       result.add "[]"
   of AtomNodes:
-    singleToStr(n, result, env)
+    singleToStr(n, result, c)
   else:
     result.add "<error: " & $n.kind & ">"
 
-proc calleeToStr(tree: MirTree, i: var int, result: var string, env: EnvPtr) =
+proc calleeToStr(tree: MirTree, i: var int, result: var string, c: RenderCtx) =
   case tree[i].kind
   of mnkMagic:
     # cut off the 'm' prefix and use a lowercase first character
@@ -232,7 +248,7 @@ proc calleeToStr(tree: MirTree, i: var int, result: var string, env: EnvPtr) =
   else:
     valueToStr()
 
-proc argToStr(tree: MirTree, i: var int, result: var string, env: EnvPtr) =
+proc argToStr(tree: MirTree, i: var int, result: var string, c: RenderCtx) =
   var n {.cursor.} = next(tree, i)
   case n.kind
   of mnkArg:     result.add "arg "
@@ -251,9 +267,9 @@ proc argToStr(tree: MirTree, i: var int, result: var string, env: EnvPtr) =
   inc i # skip the end node
 
 template argToStr() =
-  argToStr(treeParam(), i, result, env)
+  argToStr(treeParam(), i, result, c)
 
-proc exprToStr(nodes: MirTree, i: var int, result: var string, env: EnvPtr) =
+proc exprToStr(nodes: MirTree, i: var int, result: var string, c: RenderCtx) =
   template tree(start: string, body: untyped) =
     result.add start
     inc i # skip the start node
@@ -304,14 +320,14 @@ proc exprToStr(nodes: MirTree, i: var int, result: var string, env: EnvPtr) =
       result.add ")"
   of mnkCall:
     tree "":
-      calleeToStr(nodes, i, result, env)
+      calleeToStr(nodes, i, result, c)
       result.add "("
       commaSeparated:
         argToStr()
       result.add ")"
   of mnkCheckedCall:
     tree "":
-      calleeToStr(nodes, i, result, env)
+      calleeToStr(nodes, i, result, c)
       result.add "("
       commaSeparated:
         argToStr()
@@ -344,28 +360,28 @@ proc exprToStr(nodes: MirTree, i: var int, result: var string, env: EnvPtr) =
     inc i
 
 template exprToStr() =
-  exprToStr(nodes, i, result, env)
+  exprToStr(nodes, i, result, c)
 
 proc renderNameWithType(tree: MirTree, i: var int, result: var string,
-                        env: EnvPtr) =
+                        c: RenderCtx) =
   let n {.cursor.} = next(tree, i)
-  singleToStr(n, result, env)
+  singleToStr(n, result, c)
   result.add ": "
   result.add typeToString(n.typ)
 
 proc renderList(tree: MirTree, i: var int, indent: int, result: var string,
-                env: EnvPtr)
+                c: RenderCtx)
 
 template renderList(indent: int) =
   mixin renderList
-  renderList(treeParam(), i, indent, result, env)
+  renderList(treeParam(), i, indent, result, c)
 
 template stmtToStr(indent: int) =
   mixin stmtToStr
-  stmtToStr(treeParam(), i, indent, result, env)
+  stmtToStr(treeParam(), i, indent, result, c)
 
 proc stmtToStr(nodes: MirTree, i: var int, indent: int, result: var string,
-               env: EnvPtr) =
+               c: RenderCtx) =
   template tree(str: string, body: untyped) =
     result.add repeat("  ", indent)
     result.add str
@@ -382,7 +398,7 @@ proc stmtToStr(nodes: MirTree, i: var int, indent: int, result: var string,
   case n.kind
   of mnkDef, mnkDefUnpack:
     tree "def ":
-      renderNameWithType(nodes, i, result, env)
+      renderNameWithType(nodes, i, result, c)
       if nodes[i].kind != mnkNone:
         result.add " = "
         exprToStr()
@@ -391,19 +407,19 @@ proc stmtToStr(nodes: MirTree, i: var int, indent: int, result: var string,
     result.add "\n"
   of mnkDefCursor:
     tree "def_cursor ":
-      renderNameWithType(nodes, i, result, env)
+      renderNameWithType(nodes, i, result, c)
       result.add " = "
       exprToStr()
     result.add "\n"
   of mnkBind:
     tree "bind ":
-      renderNameWithType(nodes, i, result, env)
+      renderNameWithType(nodes, i, result, c)
       result.add " = "
       valueToStr()
     result.add "\n"
   of mnkBindMut:
     tree "bind_mut ":
-      renderNameWithType(nodes, i, result, env)
+      renderNameWithType(nodes, i, result, c)
       result.add " = "
       valueToStr()
     result.add "\n"
@@ -506,23 +522,26 @@ proc stmtToStr(nodes: MirTree, i: var int, indent: int, result: var string,
   i += ord(n.kind in SubTreeNodes)
 
 proc renderList(tree: MirTree, i: var int, indent: int, result: var string,
-                env: EnvPtr) =
+                c: RenderCtx) =
   while i < tree.len and tree[i].kind != mnkEnd:
     stmtToStr(indent)
 
-proc exprToStr*(tree: MirTree, n: NodePosition, env: EnvPtr = nil): string =
+proc exprToStr*(tree: MirTree, n: NodePosition; env: ptr MirEnv = nil;
+                body: ptr MirBody = nil): string =
   ## Renders the expression at `n` into a human-readable text representation.
   var i = n.int
-  exprToStr(tree, i, result, env)
+  exprToStr(tree, i, result, RenderCtx(env: env, body: body))
 
-proc stmtToStr*(tree: MirTree, n: NodePosition, env: EnvPtr = nil): string =
+proc stmtToStr*(tree: MirTree, n: NodePosition; env: ptr MirEnv = nil;
+                body: ptr MirBody = nil): string =
   ## Renders the statement at `n` into a human-readable text representation.
   var i = n.int
-  stmtToStr(tree, i, 0, result, env)
+  stmtToStr(tree, i, 0, result, RenderCtx(env: env, body: body))
 
-proc render*(tree: MirTree, env: EnvPtr = nil): string =
+proc render*(tree: MirTree; env: ptr MirEnv = nil;
+             body: ptr MirBody = nil): string =
   ## Renders `tree` into a human-readable text representation. The output is
   ## meant for debugging and tracing and is not guaranteed to have a stable
   ## format.
   var i = 0
-  renderList(tree, i, 0, result, env)
+  renderList(tree, i, 0, result, RenderCtx(env: env, body: body))
diff --git a/compiler/sem/aliasanalysis.nim b/compiler/sem/aliasanalysis.nim
index de0d638cfd2..698cec09b52 100644
--- a/compiler/sem/aliasanalysis.nim
+++ b/compiler/sem/aliasanalysis.nim
@@ -60,8 +60,8 @@ type
     long: seq[PathInstr]
 
 const
-  Roots = {mnkProc, mnkConst, mnkGlobal, mnkTemp, mnkCall, mnkDeref,
-           mnkDerefView} + SymbolLike
+  Roots = {mnkProc, mnkConst, mnkGlobal, mnkParam, mnkLocal, mnkTemp, mnkCall,
+           mnkDeref, mnkDerefView}
   PathOps = {mnkPathPos, mnkPathNamed, mnkPathArray, mnkPathConv,
              mnkPathVariant}
 
@@ -71,7 +71,7 @@ func isSameRoot(an, bn: MirNode): bool =
 
   case an.kind
   of mnkParam, mnkLocal:
-    result = an.sym.id == bn.sym.id
+    result = an.local == bn.local
   of mnkProc:
     result = an.prc == bn.prc
   of mnkConst:
diff --git a/compiler/sem/injectdestructors.nim b/compiler/sem/injectdestructors.nim
index 8ad20cf2469..7a5396a5094 100644
--- a/compiler/sem/injectdestructors.nim
+++ b/compiler/sem/injectdestructors.nim
@@ -171,7 +171,7 @@ func toName(n: MirNode): EntityName =
   result.a[0] = n.kind.int
   result.a[1] =
     case n.kind
-    of SymbolLike: n.sym.id
+    of mnkParam, mnkLocal: n.local.int
     of mnkGlobal:  n.global.int
     of mnkTemp:    n.temp.int
     else:          unreachable(n.kind)
@@ -257,11 +257,10 @@ func initEntityDict(tree: MirTree, dfg: DataFlowGraph): EntityDict =
       let t =
         case entity.kind
         of mnkParam:
-          assert isSinkTypeForParam(entity.sym.typ)
-          entity.sym.typ
+          assert isSinkTypeForParam(entity.typ)
+          entity.typ
         of mnkLocal:
-          assert sfCursor notin entity.sym.flags
-          entity.sym.typ
+          entity.typ
         of mnkTemp, mnkGlobal:
           entity.typ
         else:
@@ -345,7 +344,7 @@ func requiresDestruction(tree: MirTree, cfg: DataFlowGraph,
   let r =
     case entity.kind
     of mnkParam, mnkLocal:
-      computeAlive(entity.sym, computeAliveOp[PSym])
+      computeAlive(entity.local, computeAliveOp[LocalId])
     of mnkGlobal:
       computeAlive(entity.global, computeAliveOp[GlobalId])
     of mnkTemp:
@@ -419,7 +418,7 @@ func isAlive(tree: MirTree, cfg: DataFlowGraph,
     let scope =
       # XXX: the way the ``result`` variable is detected here is a hack. It
       #      should be treated as any other local in the context of the MIR
-      if tree[root].kind in SymbolLike and tree[root].sym.kind == skResult:
+      if tree[root].kind == mnkLocal and tree[root].local == resultId:
         cfg.subgraphFor(NodePosition(0) .. NodePosition(tree.high))
       else:
         var exists: bool
@@ -459,7 +458,7 @@ func needsReset(tree: MirTree, cfg: DataFlowGraph, ar: AnalysisResults,
   #      procedure's body should be encoded by inserting a special 'use'
   #      operation that has a control-flow dependency on *all* other
   #      operations
-  if tree[root].kind in SymbolLike and tree[root].sym.kind == skResult:
+  if tree[root].kind == mnkLocal and tree[root].local == resultId:
     return true
 
   var exists: bool
diff --git a/compiler/utils/containers.nim b/compiler/utils/containers.nim
index 2431571a48e..52db2872898 100644
--- a/compiler/utils/containers.nim
+++ b/compiler/utils/containers.nim
@@ -19,6 +19,20 @@ type
     ## integer-like ID. The container is append-only
     data: seq[T]
 
+  PartialStore*[I; T] = object
+    ## Used for adding items to an existing `Store <#Store>`_ without directly
+    ## modifying said object nor requiring access to it.
+    ##
+    ## The usual usage pattern is:
+    ## 1. fork a partial store from a `Store <#Store>`_ object
+    ## 2. add items to the partial store
+    ## 3. once done, join the partial store with the store it was forked from
+    ##
+    ## It's also legal to add items to a partial store that wasn't forked from
+    ## a store. In this case, it can only be joined into empty stores.
+    data: seq[T]
+    base: I
+
   Checkpoint* = distinct int
     ## Represents the state of a ``Store`` at some point in time.
 
@@ -160,6 +174,31 @@ func rewind*(s: var Store, p: Checkpoint) =
   assert p.int <= s.data.len, "illegal rewind"
   s.data.setLen(p.int)
 
+# ---------- PartialStore API -----------
+
+func fork*[I;T](s: Store[I, T]): PartialStore[I, T] =
+  ## Creates a new partial table that can later be joined back (via
+  ## `join <#join,Store,PartialStore>`_) into `s`.
+  PartialStore[I, T](base: nextId(s))
+
+func add*[I;T](s: var PartialStore[I, T], item: sink T): I =
+  ## Adds `item` to `s`, returning the ID to later query it with.
+  s.data.add(item)
+  result = I(ord(s.data.high) + ord(s.base))
+
+func `[]`*[I;T](s: PartialStore[I, T], id: I): lent T {.inline.} =
+  ## Returns the item associated with `id`.
+  s.data[ord(id) - ord(s.base)]
+
+func join*[I;T](s: var Store[I, T], other: sink PartialStore[I, T]) =
+  ## Adds all items from `other` to `s`. `s` has to have the same number of
+  ## items it had when `other` was forked from it.
+  assert s.nextId() == other.base, "containers are out of sync"
+  let offset = s.data.len
+  s.data.setLen(offset + other.data.len)
+  for i, it in other.data.mpairs:
+    s.data[offset + i] = move it
+
 # ---------- OrdinalSeq API ------------
 
 template base*[I; T](x: OrdinalSeq[I, T]): seq[T] =
diff --git a/compiler/vm/vmjit.nim b/compiler/vm/vmjit.nim
index 1b9a96a6e11..dbd2f972444 100644
--- a/compiler/vm/vmjit.nim
+++ b/compiler/vm/vmjit.nim
@@ -44,6 +44,9 @@ import
   compiler/sem/[
     transf
   ],
+  compiler/utils/[
+    containers
+  ],
   compiler/vm/[
     identpatterns,
     vmaux,
@@ -150,8 +153,12 @@ proc generateMirCode(c: var TCtx, env: var MirEnv, n: PNode;
     result = generateCode(c.graph, env, c.module, selectOptions(c), n)
   else:
     var bu: MirBuilder
+     # add an empty local so that the result slot is occupied:
+    discard bu.addLocal(Local())
+    # XXX: ^^ this is a hack, and yet another reason to remove expression
+    #      support from the JIT
     generateCode(c.graph, env, selectOptions(c), n, bu, result.source)
-    result.code = finish(bu)
+    (result.code, result.locals) = finish(bu, default(Store[LocalId, Local]))
 
 proc generateIR(c: var TCtx, env: MirEnv, body: sink MirBody): Body =
   backends.generateIR(c.graph, c.idgen, env, c.module, body)
diff --git a/tests/compiler/ttreechangesets.nim b/tests/compiler/ttreechangesets.nim
index 10ed10d98fb..8cab8415fe8 100644
--- a/tests/compiler/ttreechangesets.nim
+++ b/tests/compiler/ttreechangesets.nim
@@ -112,7 +112,7 @@ block insert_shared_start:
   bu.add temp(0)
   bu.subTree mnkStmtList: discard
   bu.add temp(3)
-  var tree = finish(bu)
+  var (tree, _) = finish(bu)
 
   test(tree, [temp(0), temp(1), temp(2), temp(3)]):
     c.replace 1, temp(2)
@@ -138,7 +138,7 @@ block insert_shared_end:
   bu.add temp(0)
   bu.subTree mnkStmtList: discard
   bu.add temp(3)
-  var tree = finish(bu)
+  var (tree, _) = finish(bu)
 
   test(tree, [temp(0), temp(1), temp(2), temp(3)]):
     c.replace 1, temp(1)

From b22f33d6b7642c610525d85ae36f40cb0db979e5 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Fri, 29 Mar 2024 23:45:36 +0100
Subject: [PATCH 048/169] fix: VM crash with implicit object conversion (#1259)

## Summary

Fix a bug with `cgirgen` where incorrect CGIR was produced for implicit
object conversions involving generic types, resulting in an internal VM
error when using the VM backend or running code at compile-time.

## Details

In `cgirgen.handleSpecialConv`, type skipping was missing when testing
whether the element type of a pointer-like type is an object type,
resulting in the conversion not being detected as an object conversion.
Code generators for which the distinction between a plain lvalue
conversion and an object conversion matters (such as `vmgen`) therefore
produced wrong code.

`handleSpecialConv` is changed such that the types are skipped
properly. The object up- or down-conversion node now also uses the
correct line information.
---
 compiler/backend/cgirgen.nim                  | 33 ++++++-------------
 .../lang_callable/generics/tobjecttyperel.nim |  4 ---
 2 files changed, 10 insertions(+), 27 deletions(-)

diff --git a/compiler/backend/cgirgen.nim b/compiler/backend/cgirgen.nim
index 53dfb49fd61..871bf331bbe 100644
--- a/compiler/backend/cgirgen.nim
+++ b/compiler/backend/cgirgen.nim
@@ -260,18 +260,16 @@ proc wrapInHiddenAddr(cl: TranslateCl, n: CgNode): CgNode =
     #      level
     n
 
-proc genObjConv(n: CgNode, a, b, t: PType): CgNode =
-  ## Depending on the relationship between `a` and `b`, wraps `n` in either an
-  ## up- or down-conversion. `t` is the type to use for the resulting
-  ## expression
-  let diff = inheritanceDiff(b, a)
-  #echo "a: ", a.sym.name.s, "; b: ", b.sym.name.s
-  #assert diff != 0 and diff != high(int), "redundant or illegal conversion"
+proc genObjConv(n: CgNode, to: PType, info: TLineInfo): CgNode =
+  ## Depending on the type relationship between `n` and `to`, wraps `n` in
+  ## either an up- or down-conversion. Returns `nil` if no up- or down-
+  ## conversion is needed.
+  let diff = inheritanceDiff(to.skipTypes(skipPtrs), n.typ.skipTypes(skipPtrs))
   if diff == 0:
     return nil
   result = newOp(
     if diff < 0: cnkObjUpConv else: cnkObjDownConv,
-    n.info, t): n
+    info, to): n
 
 func disable(cl: var TranslateCl) {.inline.} =
   cl.isActive = false
@@ -288,21 +286,10 @@ proc handleSpecialConv(c: ConfigRef, n: CgNode, info: TLineInfo,
   ## between the source type (i.e. that of `n`) and the destination type.
   ## If it is, generates the conversion operation IR and returns it -- nil
   ## otherwise
-  let
-    orig = dest
-    source = n.typ.skipTypes(abstractVarRange)
-    dest = dest.skipTypes(abstractVarRange)
-
-  case dest.kind
-  of tyObject:
-    assert source.kind == tyObject
-    genObjConv(n, source, dest, orig)
-  of tyRef, tyPtr, tyVar, tyLent:
-    assert source.kind == dest.kind
-    if source.base.kind == tyObject:
-      genObjConv(n, source.base, dest.base, orig)
-    else:
-      nil
+  if dest.skipTypes(skipPtrs - {tyDistinct}).kind == tyObject:
+    # if the destination is an object (or ptr/ref object), it must be an
+    # object conversion
+    genObjConv(n, dest, info)
   else:
     nil
 
diff --git a/tests/lang_callable/generics/tobjecttyperel.nim b/tests/lang_callable/generics/tobjecttyperel.nim
index 04d6f6cfafb..80fe23459c2 100644
--- a/tests/lang_callable/generics/tobjecttyperel.nim
+++ b/tests/lang_callable/generics/tobjecttyperel.nim
@@ -1,8 +1,4 @@
 discard """
-  knownIssue.vm: '''
-    Fails for the VM target because ``cgirgen`` emits the incorrect conversion
-    operator for ``ref`` types involving generics.
-  '''
   output: '''(peel: 0, color: 15)
 (color: 15)
 17

From 7fd704ba71ef3ecb43055b5dfc091d03b78888bf Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sat, 30 Mar 2024 01:37:58 +0100
Subject: [PATCH 049/169] mir: use `Local` for temporaries (#1260)

## Summary

In the MIR, temporaries are now real locals that use `Local` and
`LocalId`. Previously, they only existed as IDs (`TempId`), which were
then materialized into real locals by `cgirgen`.

This further shrinks down `cgirgen`, preparing for its eventual
removal. Having temporaries and normal locals use the same `MirNode`
variant also unifies some code paths.

## Details

* `mnkTemp` and `mnkAlias` use the same variant as `mnkLocal` and
  `mnkParam`
* the `TempId` type is removed
* allocating new temporaries now uses `addLocal` underneath, removing
  the `numTemps` tracking
* `Changeset` initialization is faster now, since the MIR tree doesn't
  need to be scanned for temporaries anymore
* since temporaries now share their namespace with locals, their names
  in pretty-printed MIR are different, which affects the tests using
  `--expandArc`
---
 compiler/backend/cgirgen.nim               |  38 +---
 compiler/mir/analysis.nim                  |   8 +-
 compiler/mir/injecthooks.nim               |   2 +-
 compiler/mir/mirchangesets.nim             |  10 -
 compiler/mir/mirconstr.nim                 |  18 +-
 compiler/mir/mirpasses.nim                 |  18 +-
 compiler/mir/mirtrees.nim                  |  22 +-
 compiler/mir/utils.nim                     |   7 +-
 compiler/sem/aliasanalysis.nim             |   4 +-
 compiler/sem/injectdestructors.nim         |  12 +-
 tests/arc/topt_cursor.nim                  |  30 +--
 tests/arc/topt_no_cursor.nim               | 234 ++++++++++-----------
 tests/arc/topt_refcursors.nim              |  44 ++--
 tests/arc/topt_wasmoved_destroy_pairs.nim  |  44 ++--
 tests/compiler/ttreechangesets.nim         |   6 +-
 tests/exception/truntime_check_panics.nim  |  18 +-
 tests/lang_objects/destructor/tv2_cast.nim |  56 ++---
 tests/misc/tdont_fold_procedure_cast.nim   |   8 +-
 18 files changed, 266 insertions(+), 313 deletions(-)

diff --git a/compiler/backend/cgirgen.nim b/compiler/backend/cgirgen.nim
index 871bf331bbe..36415619ac6 100644
--- a/compiler/backend/cgirgen.nim
+++ b/compiler/backend/cgirgen.nim
@@ -58,8 +58,6 @@ type
 
     owner: PSym
 
-    tempMap: SeqMap[TempId, LocalId]
-      ## maps a ``TempId`` to the ID of the local created for it
     blocks: seq[tuple[input, actual: LabelId]]
       ## the stack of enclosing blocks for the currently processed node
 
@@ -80,7 +78,8 @@ type
       ## unreachable code
 
     locals: Store[LocalId, Local]
-      ## the in-progress list of all locals in the translated body
+      ## the list of all locals in the body, taken from the ``MirBody``.
+      ## Only needed for updating the type for alias locals
 
     # a 'def' in the MIR means that the the local starts to exists and that it
     # is accessible in all connected basic blocks part of the enclosing
@@ -100,11 +99,6 @@ type
     pos: uint32 ## the index of the currently pointed to node
     origin {.cursor.}: PNode ## the source node
 
-template isFilled(x: LocalId): bool =
-  # '0' is a valid ID, but this procedure is only used for
-  # temporaries, which can never map to the result variable
-  x.int != 0
-
 func delete[T](s: var seq[T], a, b: int) =
   # XXX: this procedure is a workaround for ``sequtils.delete`` not handling
   #      empty slices properly (an IndexDefect is erroneously raised)
@@ -309,14 +303,12 @@ proc atomToIr(n: MirNode, cl: TranslateCl, info: TLineInfo): CgNode =
     CgNode(kind: cnkGlobal, info: info, typ: n.typ, global: n.global)
   of mnkConst:
     CgNode(kind: cnkConst, info: info, typ: n.typ, cnst: n.cnst)
-  of mnkLocal, mnkParam:
+  of mnkLocal, mnkParam, mnkTemp:
     newLocalRef(n.local, info, cl.locals[n.local].typ)
-  of mnkTemp:
-    newLocalRef(cl.tempMap[n.temp], info, n.typ)
   of mnkAlias:
     # the type of the node doesn't match the real one
     let
-      id = cl.tempMap[n.temp]
+      id = n.local
       typ = cl.locals[id].typ
     # the view is auto-dereferenced here for convenience
     newOp(cnkDerefView, info, typ.base, newLocalRef(id, info, typ))
@@ -328,7 +320,7 @@ proc atomToIr(n: MirNode, cl: TranslateCl, info: TLineInfo): CgNode =
     # type arguments do use `mnkNone` in some situtations, so keep
     # the type
     CgNode(kind: cnkEmpty, info: info, typ: n.typ)
-  else:
+  of AllNodeKinds - Atoms:
     unreachable("not an atom: " & $n.kind)
 
 proc atomToIr(tree: MirBody, cl: var TranslateCl,
@@ -504,7 +496,7 @@ proc defToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
   var def: CgNode
 
   case entity.kind
-  of mnkLocal:
+  of mnkLocal, mnkTemp:
     let id = entity.local
     def = newLocalRef(id, info, cl.locals[id].typ)
   of mnkParam:
@@ -513,16 +505,6 @@ proc defToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
   of mnkGlobal:
     def = CgNode(kind: cnkGlobal, info: info, typ: entity.typ,
                  global: entity.global)
-  of mnkTemp:
-    # MIR temporaries are like normal locals, with the difference that they
-    # are created ad-hoc and don't have any extra information attached
-    assert entity.typ != nil
-    let tmp = cl.locals.add Local(typ: entity.typ)
-
-    assert entity.temp notin cl.tempMap, "re-definition of temporary"
-    cl.tempMap[entity.temp] = tmp
-
-    def = newLocalRef(tmp, info, entity.typ)
   of mnkAlias:
     # MIR aliases are translated to var/lent views
     assert n.kind in {mnkBind, mnkBindMut}, "alias can only be defined by binds"
@@ -530,12 +512,10 @@ proc defToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
     let
       typ = makeVarType(cl.owner, entity.typ, cl.idgen,
                         if n.kind == mnkBind: tyLent else: tyVar)
-      tmp = cl.locals.add Local(typ: typ)
-
-    assert entity.temp notin cl.tempMap, "re-definition of temporary"
-    cl.tempMap[entity.temp] = tmp
+    # override the original type
+    cl.locals[entity.local].typ = typ
 
-    def = newLocalRef(tmp, info, typ)
+    def = newLocalRef(entity.local, info, typ)
   else:
     unreachable()
 
diff --git a/compiler/mir/analysis.nim b/compiler/mir/analysis.nim
index 01282bd7e21..977a07bd095 100644
--- a/compiler/mir/analysis.nim
+++ b/compiler/mir/analysis.nim
@@ -206,19 +206,17 @@ func isLastWrite*(tree: MirTree, cfg: DataFlowGraph, span: Subgraph, loc: Path,
 
   result = (true, state.exit, state.escapes)
 
-func computeAliveOp*[T: LocalId | GlobalId | TempId](
+func computeAliveOp*[T: LocalId | GlobalId](
   tree: MirTree, loc: T, op: Opcode, n: OpValue): AliveState =
   ## Computes the state of `loc` at the *end* of the given operation. The
   ## operands are expected to *not* alias with each other. The analysis
   ## result will be wrong if they do
 
   func isAnalysedLoc[T](n: MirNode, loc: T): bool =
-    when T is TempId:
-      n.kind == mnkTemp and n.temp == loc
-    elif T is GlobalId:
+    when T is GlobalId:
       n.kind == mnkGlobal and n.global == loc
     elif T is LocalId:
-      n.kind in {mnkLocal, mnkParam} and n.local == loc
+      n.kind in {mnkLocal, mnkParam, mnkTemp} and n.local == loc
     else:
       {.error.}
 
diff --git a/compiler/mir/injecthooks.nim b/compiler/mir/injecthooks.nim
index eefcc5f5178..e6e7f7f5255 100644
--- a/compiler/mir/injecthooks.nim
+++ b/compiler/mir/injecthooks.nim
@@ -97,7 +97,7 @@ proc isUsedForSink(tree: MirTree, stmt: NodePosition): bool =
     case tree[n].kind
     of mnkConsume:
       let x = tree.operand(n)
-      if tree[x].kind == mnkTemp and tree[x].temp == tree[def].temp:
+      if tree[x].kind == mnkTemp and tree[x].local == tree[def].local:
         # the temporary is used for sink parameter passing
         result = true
         break
diff --git a/compiler/mir/mirchangesets.nim b/compiler/mir/mirchangesets.nim
index e005a0fe48c..c157f49ad2c 100644
--- a/compiler/mir/mirchangesets.nim
+++ b/compiler/mir/mirchangesets.nim
@@ -20,9 +20,6 @@ type
     inner: TreeChangeset
     locals: PartialStore[LocalId, Local]
       ## new locals to be added on changeset application
-    numTemps: uint32
-      ## keeps track of the number of temporaries. Exchanged with
-      ## the created builder, where it's used for allocating new IDs
 
 # ----------------------------------------
 # proxy routines
@@ -52,24 +49,17 @@ func initChangeset*(body: MirBody): Changeset =
   ## Sets up a changeset for `body`. The changeset either needs to be
   ## discarded, or applied to the same ``MirBody`` instance it was created for.
   result = Changeset(locals: fork(body.locals))
-  # compute the next ID to use for new temporaries:
-  for i, n in body.code.pairs:
-    if n.kind in DefNodes and
-       (let ent = body.code[i, 0]; ent.kind in {mnkTemp, mnkAlias}):
-      result.numTemps = max(ent.temp.uint32 + 1, result.numTemps)
 
 func initBuilder(c: var Changeset, buffer: var MirNodeSeq,
                  info: SourceId): MirBuilder =
   ## Internal routine for setting up a builder. Must be paired with a
   ## ``finishBuilder`` call.
   result = initBuilder(info, move buffer)
-  swap(c.numTemps, result.numTemps)
   swap(c.locals, result.locals)
 
 func finishBuilder(c: var Changeset, buffer: var MirNodeSeq,
                    bu: sink MirBuilder) =
   # move the ID counter and buffer back into the changeset
-  swap(c.numTemps, bu.numTemps)
   (buffer, c.locals) = finish(bu)
 
 template insert*(c: var Changeset, tree: MirTree, at, source: NodePosition,
diff --git a/compiler/mir/mirconstr.nim b/compiler/mir/mirconstr.nim
index fb5747b8274..06d7d1f105d 100644
--- a/compiler/mir/mirconstr.nim
+++ b/compiler/mir/mirconstr.nim
@@ -55,9 +55,6 @@ type
 
     locals*: PartialStore[LocalId, Local]
       ## new locals created with the builder
-    numTemps*: uint32
-      ## tracks the number of existing temporaries. Used for allocating new
-      ## IDs.
 
     # XXX: the internal fields are currently exported for the integration
     #      with changesets to work, but future refactorings should focus
@@ -80,11 +77,11 @@ func typeLit*(t: PType): Value =
 func literal*(n: PNode): Value =
   Value(node: MirNode(kind: mnkLiteral, typ: n.typ, lit: n))
 
-func temp*(typ: PType, id: TempId): Value =
-  Value(node: MirNode(kind: mnkTemp, typ: typ, temp: id))
+func temp*(typ: PType, id: LocalId): Value =
+  Value(node: MirNode(kind: mnkTemp, typ: typ, local: id))
 
-func alias*(typ: PType, id: TempId): Value =
-  Value(node: MirNode(kind: mnkAlias, typ: typ, temp: id))
+func alias*(typ: PType, id: LocalId): Value =
+  Value(node: MirNode(kind: mnkAlias, typ: typ, local: id))
 
 func toValue*(id: ConstId, typ: PType): Value =
   Value(node: MirNode(kind: mnkConst, typ: typ, cnst: id))
@@ -297,18 +294,17 @@ template scope*(bu: var MirBuilder, body: untyped) =
   bu.subTree MirNode(kind: mnkScope):
     body
 
-func allocTemp(bu: MirBuilder, t: PType; id: TempId, alias: bool): Value =
+func allocTemp(bu: MirBuilder, t: PType; id: LocalId, alias: bool): Value =
   ## Allocates a new temporary or alias and returns it.
   let kind = if alias: mnkAlias
              else:     mnkTemp
   {.cast(uncheckedAssign).}:
-    result = Value(node: MirNode(kind: kind, typ: t, temp: id),
+    result = Value(node: MirNode(kind: kind, typ: t, local: id),
                    info: someOpt bu.currentSourceId)
 
 template allocTemp*(bu: var MirBuilder, t: PType, alias = false): Value =
   # XXX: the only purpose of this is to work around a ``strictFuncs`` bug
-  let id = TempId bu.numTemps
-  inc bu.numTemps
+  let id = bu.addLocal(Local(typ: t))
   allocTemp(bu, t, id, alias)
 
 func use*(bu: var MirBuilder, val: sink Value) {.inline.} =
diff --git a/compiler/mir/mirpasses.nim b/compiler/mir/mirpasses.nim
index 2ee8f47b147..18c053754e6 100644
--- a/compiler/mir/mirpasses.nim
+++ b/compiler/mir/mirpasses.nim
@@ -231,14 +231,14 @@ proc eliminateTemporaries(tree: MirTree, changes: var Changeset) =
         # definition of a temporary into which an lvalue is assigned. Elision
         # is disabled for projections of temporaries; the projected temporary
         # might be elided itself, which could lead to evaluation order issues
-        ct[tree[i, 0].temp.uint32] = 1
+        ct[tree[i, 0].local.uint32] = 1
 
       i = NodePosition e # skip to the source expression
     of mnkTemp:
       # treat as usage
       # XXX: this is brittle. Usages should be detected through DFA, not by
       #      looking for names
-      let id = tree[i].temp
+      let id = tree[i].local
       if hasKey(ct, id.uint32):
         if isDangerous(tree, i):
           ct.del(id.uint32)
@@ -252,13 +252,13 @@ proc eliminateTemporaries(tree: MirTree, changes: var Changeset) =
       # name lvalue expression, so if a temporary appears in a deref slot,
       # elision of said temporary is disabled
       if tree[i, 0].kind == mnkTemp:
-        ct.del(tree[i, 0].temp.uint32) # treat as not eligible
+        ct.del(tree[i, 0].local.uint32) # treat as not eligible
       i = tree.sibling(i) # skip the deref
     of mnkPathArray:
       # for array index slots, the above also applies
       let index = tree.child(i, 1)
       if tree[index].kind == mnkTemp:
-        ct.del(tree[index].temp.uint32)
+        ct.del(tree[index].local.uint32)
       inc i
     else:
       inc i
@@ -272,7 +272,7 @@ proc eliminateTemporaries(tree: MirTree, changes: var Changeset) =
     overlapsConservative(tree, a, computePath(tree, x), typ, tree[x].typ)
 
   proc findUse(tree: MirTree, dfg: DataFlowGraph, p: Path, typ: PType,
-               start: InstrPos, e: TempId): NodePosition {.nimcall.} =
+               start: InstrPos, e: LocalId): NodePosition {.nimcall.} =
     ## Conservative data-flow analysis that computes whether the `p` might be
     ## modified. If there are no modifications of `p` between `start`
     ## (inclusive) and the use of `e`, the the usage of `e` is returned --
@@ -287,12 +287,12 @@ proc eliminateTemporaries(tree: MirTree, changes: var Changeset) =
     for op, n in traverse(dfg, all, start, s):
       case op
       of opUse:
-        if tree[n].kind == mnkTemp and tree[n].temp == e:
+        if tree[n].kind == mnkTemp and tree[n].local == e:
           # the searched-for temporary is used and there was no mutation of
           # `p` so far -> not modified
           return NodePosition(n)
       of opConsume, opDef, opMutate, opKill, opInvalidate:
-        if (tree[n].kind == mnkTemp and tree[n].temp == e) or
+        if (tree[n].kind == mnkTemp and tree[n].local == e) or
            overlaps(p, typ, n):
           # either the searched-for temporary is mutated or consumed itself,
           # or the lvalue is mutated/consumed
@@ -311,7 +311,7 @@ proc eliminateTemporaries(tree: MirTree, changes: var Changeset) =
   let dfg = computeDfg(tree)
   for i, op, n in instructions(dfg):
     if op == opDef and tree[n].kind == mnkTemp and
-       ct.getOrDefault(tree[n].temp.uint32, 0) == 2:
+       ct.getOrDefault(tree[n].local.uint32, 0) == 2:
       # definition of a single-use temporary that might be elidable. Look for
       # potential mutations of the lvalue
       let
@@ -319,7 +319,7 @@ proc eliminateTemporaries(tree: MirTree, changes: var Changeset) =
         def = tree.parent(n)
         p   = computePath(tree, tree.child(def, 1))
         typ = tree[n].typ
-        pos = findUse(tree, dfg, p, typ, i + 1, tree[n].temp)
+        pos = findUse(tree, dfg, p, typ, i + 1, tree[n].local)
 
       if pos == NodePosition(-1):
         # the copy is necessary
diff --git a/compiler/mir/mirtrees.nim b/compiler/mir/mirtrees.nim
index 30cd6cfd523..99a38d267a3 100644
--- a/compiler/mir/mirtrees.nim
+++ b/compiler/mir/mirtrees.nim
@@ -41,13 +41,6 @@ type
 template indexLike*(_: typedesc[SourceId]) = discard
 
 type
-  ## Different to the ID types above, how and what the following ID types
-  ## represent is dictated by the MIR
-  TempId* = distinct uint32
-    ## ID of a temporary location. A temporary location is created and
-    ## inserted by the compiler. The only difference to other named locations
-    ## is that temporaries are allowed to be elided (by an optimization pass,
-    ## for example) if it's deemed to have no effect on the codes' semantics
   LabelId* = distinct uint32
     ## ID of a label, used to identify a block (``mnkBlock``).
 
@@ -63,8 +56,8 @@ type
     mnkGlobal ## global location
     mnkParam  ## parameter
     mnkLocal  ## local location
-    mnkTemp   ## temporary introduced during the MIR phase. Has the same
-              ## semantics as ``mnkLocal``
+    mnkTemp   ## like ``mnkLocal``, but the local was introduced by the
+              ## compiler during the MIR phase
     mnkAlias  ## local run-time handle. This is essentially a ``var T`` or
               ## ``lent T`` local
 
@@ -276,14 +269,12 @@ type
       global*: GlobalId
     of mnkConst:
       cnst*: ConstId
-    of mnkParam, mnkLocal:
+    of mnkParam, mnkLocal, mnkTemp, mnkAlias:
       local*: LocalId
     of mnkField, mnkPathNamed, mnkPathVariant:
       field*: PSym
     of mnkLiteral:
       lit*: PNode
-    of mnkTemp, mnkAlias:
-      temp*: TempId
     of mnkPathPos:
       position*: uint32 ## the 0-based position of the field
     of mnkCall, mnkCheckedCall:
@@ -376,7 +367,6 @@ const
 
 func `==`*(a, b: SourceId): bool {.borrow.}
 func `==`*(a, b: LocalId): bool {.borrow.}
-func `==`*(a, b: TempId): bool {.borrow.}
 func `==`*(a, b: LabelId): bool {.borrow.}
 func `==`*(a, b: ConstId): bool {.borrow.}
 func `==`*(a, b: GlobalId): bool {.borrow.}
@@ -608,7 +598,8 @@ iterator arguments*(tree: MirTree, n: NodePosition): (ArgKinds, OpValue) =
 func findDef*(tree: MirTree, n: NodePosition): NodePosition =
   ## Finds and returns the first definition for the name of the temporary
   ## at node `n`. No control-flow analysis is performed.
-  let expected = tree[n].temp
+  assert tree[n].kind in {mnkTemp, mnkAlias}
+  let expected = tree[n].local
   # first, unwind until the closest statement
   result = n
   while tree[result].kind notin StmtNodes:
@@ -618,7 +609,8 @@ func findDef*(tree: MirTree, n: NodePosition): NodePosition =
   while result > NodePosition 0:
     if tree[result].kind in DefNodes:
       let name = tree.operand(result, 0)
-      if tree[name].kind in {mnkTemp, mnkAlias} and tree[name].temp == expected:
+      if tree[name].kind in {mnkTemp, mnkAlias} and
+         tree[name].local == expected:
         return
 
     result = tree.previous(result)
diff --git a/compiler/mir/utils.nim b/compiler/mir/utils.nim
index 03fbd70b053..69a284ed439 100644
--- a/compiler/mir/utils.nim
+++ b/compiler/mir/utils.nim
@@ -32,7 +32,7 @@ func `$`(n: MirNode): string =
   of mnkGlobal:
     result.add " global: "
     result.addInt n.global.uint32
-  of mnkParam, mnkLocal:
+  of mnkParam, mnkLocal, mnkTemp, mnkAlias:
     result.add " local: "
     result.addInt n.local.uint32
   of mnkField, mnkPathNamed, mnkPathVariant:
@@ -42,9 +42,6 @@ func `$`(n: MirNode): string =
     result.add " lit: "
     {.cast(noSideEffect).}:
       result.add renderTree(n.lit)
-  of mnkTemp, mnkAlias:
-    result.add " temp: "
-    result.add $ord(n.temp)
   of mnkPathPos:
     result.add " position: "
     result.add $n.position
@@ -176,7 +173,7 @@ proc singleToStr(n: MirNode, result: var string, c: RenderCtx) =
   of mnkProc:
     result.addName(n.prc, "<P", c)
   of mnkTemp, mnkAlias:
-    result.add "_" & $n.temp.int
+    result.add "_" & $n.local.int
   of mnkNone:
     result.add "<none>"
   of mnkLiteral:
diff --git a/compiler/sem/aliasanalysis.nim b/compiler/sem/aliasanalysis.nim
index 698cec09b52..1fdd3dff165 100644
--- a/compiler/sem/aliasanalysis.nim
+++ b/compiler/sem/aliasanalysis.nim
@@ -70,7 +70,7 @@ func isSameRoot(an, bn: MirNode): bool =
     return false
 
   case an.kind
-  of mnkParam, mnkLocal:
+  of mnkParam, mnkLocal, mnkTemp:
     result = an.local == bn.local
   of mnkProc:
     result = an.prc == bn.prc
@@ -78,8 +78,6 @@ func isSameRoot(an, bn: MirNode): bool =
     result = an.cnst == bn.cnst
   of mnkGlobal:
     result = an.global == bn.global
-  of mnkTemp:
-    result = an.temp == bn.temp
   of mnkCall, mnkDeref, mnkDerefView:
     result = false
   of AllNodeKinds - Roots:
diff --git a/compiler/sem/injectdestructors.nim b/compiler/sem/injectdestructors.nim
index 7a5396a5094..42adeb66c3c 100644
--- a/compiler/sem/injectdestructors.nim
+++ b/compiler/sem/injectdestructors.nim
@@ -171,10 +171,12 @@ func toName(n: MirNode): EntityName =
   result.a[0] = n.kind.int
   result.a[1] =
     case n.kind
-    of mnkParam, mnkLocal: n.local.int
-    of mnkGlobal:  n.global.int
-    of mnkTemp:    n.temp.int
-    else:          unreachable(n.kind)
+    of mnkParam, mnkLocal, mnkTemp:
+      n.local.int
+    of mnkGlobal:
+      n.global.int
+    else:
+      unreachable(n.kind)
 
 func findScope(entities: EntityDict, name: EntityName, at: InstrPos,
                exists: var bool): EntityInfo =
@@ -351,7 +353,7 @@ func requiresDestruction(tree: MirTree, cfg: DataFlowGraph,
       # unpacked tuples don't need to be destroyed because all elements are
       # moved out of them
       if tree[def].kind != mnkDefUnpack:
-        computeAlive(entity.temp, computeAliveOp[TempId])
+        computeAlive(entity.local, computeAliveOp[LocalId])
       else:
         (alive: false, escapes: false)
     else:
diff --git a/tests/arc/topt_cursor.nim b/tests/arc/topt_cursor.nim
index 4f4cb9f59ff..c3ea4a8d054 100644
--- a/tests/arc/topt_cursor.nim
+++ b/tests/arc/topt_cursor.nim
@@ -14,19 +14,19 @@ scope:
             break L0
       scope:
         x = <D2>
-    def_cursor _0: (string, int) = x
-    def _1: string = $(arg _0) (raises)
-    echo(arg type(array[0..0, string]), arg _1) (raises)
+    def_cursor _3: (string, int) = x
+    def _4: string = $(arg _3) (raises)
+    echo(arg type(array[0..0, string]), arg _4) (raises)
   finally:
-    =destroy(name _1)
+    =destroy(name _4)
 -- end of expandArc ------------------------
 --expandArc: sio
 
 scope:
   scope:
     def_cursor filename: string = "debug.txt"
-    def_cursor _0: string = filename
-    def f: File = open(arg _0, arg fmRead, arg 8000) (raises)
+    def_cursor _3: string = filename
+    def f: File = open(arg _3, arg fmRead, arg 8000) (raises)
     try:
       scope:
         try:
@@ -35,25 +35,25 @@ scope:
             scope:
               while true:
                 scope:
-                  def_cursor _1: File = f
-                  def :tmp: bool = readLine(arg _1, name res) (raises)
+                  def_cursor _6: File = f
+                  def :tmp: bool = readLine(arg _6, name res) (raises)
                   scope:
-                    def_cursor _2: bool = :tmp
-                    def _3: bool = not(arg _2)
-                    if _3:
+                    def_cursor _7: bool = :tmp
+                    def _8: bool = not(arg _7)
+                    if _8:
                       scope:
                         break L0
                   scope:
                     scope:
                       def_cursor x: string = res
-                      def_cursor _4: string = x
-                      echo(arg type(array[0..0, string]), arg _4) (raises)
+                      def_cursor _10: string = x
+                      echo(arg type(array[0..0, string]), arg _10) (raises)
         finally:
           =destroy(name res)
     finally:
       scope:
-        def_cursor _5: File = f
-        close(arg _5) (raises)
+        def_cursor _11: File = f
+        close(arg _11) (raises)
 -- end of expandArc ------------------------'''
 """
 
diff --git a/tests/arc/topt_no_cursor.nim b/tests/arc/topt_no_cursor.nim
index 1dc6bcab5a4..d08a667d7c4 100644
--- a/tests/arc/topt_no_cursor.nim
+++ b/tests/arc/topt_no_cursor.nim
@@ -14,54 +14,54 @@ doing shady stuff...
 
 scope:
   def splat: tuple[dir: string, name: string, ext: string] = splitFile(arg path) (raises)
-  bind_mut _4: string = splat.0
-  def _0: string = move _4
-  wasMoved(name _4)
-  bind_mut _5: string = splat.1
-  def _1: string = move _5
-  wasMoved(name _5)
-  bind_mut _6: string = splat.2
-  def _2: string = move _6
-  wasMoved(name _6)
-  def _3: Target = construct (consume _0, consume _1, consume _2)
-  result := move _3
+  bind_mut _7: string = splat.0
+  def _3: string = move _7
+  wasMoved(name _7)
+  bind_mut _8: string = splat.1
+  def _4: string = move _8
+  wasMoved(name _8)
+  bind_mut _9: string = splat.2
+  def _5: string = move _9
+  wasMoved(name _9)
+  def _6: Target = construct (consume _3, consume _4, consume _5)
+  result := move _6
   =destroy(name splat)
 -- end of expandArc ------------------------
 --expandArc: delete
 
 scope:
-  def_cursor _0: Node = target[]
-  def_cursor _1: Node = _0[].parent
+  def_cursor _3: Node = target[]
+  def_cursor _4: Node = _3[].parent
   def sibling: Node
-  =copy(name sibling, arg _1[].left)
-  def_cursor _2: Node = sibling
+  =copy(name sibling, arg _4[].left)
+  def_cursor _6: Node = sibling
   def saved: Node
-  =copy(name saved, arg _2[].right)
-  def_cursor _3: Node = sibling
-  def_cursor _4: Node = saved
-  def_cursor _6: Node = _4[].left
-  =copy(name _3[].right, arg _6)
-  def_cursor _5: Node = sibling
-  =sink(name _5[].parent, arg saved)
+  =copy(name saved, arg _6[].right)
+  def_cursor _7: Node = sibling
+  def_cursor _8: Node = saved
+  def_cursor _10: Node = _8[].left
+  =copy(name _7[].right, arg _10)
+  def_cursor _9: Node = sibling
+  =sink(name _9[].parent, arg saved)
   =destroy(name sibling)
 -- end of expandArc ------------------------
 --expandArc: p1
 
 scope:
-  def _0: array[0..0, int] = construct (consume 123)
-  def lresult: seq[int] = arrToSeq(consume _0)
+  def _2: array[0..0, int] = construct (consume 123)
+  def lresult: seq[int] = arrToSeq(consume _2)
   def lvalue: seq[int]
   def lnext: string
-  def _1: seq[int] = move lresult
-  def _: (seq[int], string) = construct (consume _1, consume ";")
-  bind_mut _3: seq[int] = _.0
-  lvalue := move _3
-  wasMoved(name _3)
-  bind_mut _4: string = _.1
-  lnext := move _4
-  wasMoved(name _4)
-  def _2: seq[int] = move(name lvalue)
-  result.value := move _2
+  def _6: seq[int] = move lresult
+  def _: (seq[int], string) = construct (consume _6, consume ";")
+  bind_mut _8: seq[int] = _.0
+  lvalue := move _8
+  wasMoved(name _8)
+  bind_mut _9: string = _.1
+  lnext := move _9
+  wasMoved(name _9)
+  def _7: seq[int] = move(name lvalue)
+  result.value := move _7
   =destroy(name _)
   =destroy(name lnext)
   =destroy(name lvalue)
@@ -71,16 +71,16 @@ scope:
 scope:
   try:
     def_cursor it: KeyValue = x
-    def _0: seq[int]
-    =copy(name _0, arg it.0)
-    def _1: seq[int]
-    =copy(name _1, arg it.1)
-    def a: (seq[int], seq[int]) = construct (consume _0, consume _1)
-    def_cursor _2: (seq[int], seq[int]) = a
-    def _3: string = $(arg _2) (raises)
-    echo(arg type(array[0..0, string]), arg _3) (raises)
+    def _4: seq[int]
+    =copy(name _4, arg it.0)
+    def _5: seq[int]
+    =copy(name _5, arg it.1)
+    def a: (seq[int], seq[int]) = construct (consume _4, consume _5)
+    def_cursor _6: (seq[int], seq[int]) = a
+    def _7: string = $(arg _6) (raises)
+    echo(arg type(array[0..0, string]), arg _7) (raises)
   finally:
-    =destroy(name _3)
+    =destroy(name _7)
     =destroy(name a)
 -- end of expandArc ------------------------
 --expandArc: extractConfig
@@ -91,38 +91,38 @@ scope:
     scope:
       def_cursor a: seq[string] = txt
       def i: int = 0
-      def_cursor _0: seq[string] = a
-      def L: int = lengthSeq(arg _0)
+      def_cursor _5: seq[string] = a
+      def L: int = lengthSeq(arg _5)
       block L0:
         scope:
           while true:
             scope:
-              def_cursor _1: int = i
-              def :tmp: bool = ltI(arg _1, arg L)
+              def_cursor _7: int = i
+              def :tmp: bool = ltI(arg _7, arg L)
               scope:
-                def_cursor _2: bool = :tmp
-                def _3: bool = not(arg _2)
-                if _3:
+                def_cursor _8: bool = :tmp
+                def _9: bool = not(arg _8)
+                if _9:
                   scope:
                     break L0
               scope:
                 scope:
                   try:
-                    def_cursor _4: int = i
-                    def line: lent string = borrow a[_4]
-                    def_cursor _5: string = line[]
-                    def splitted: seq[string] = split(arg _5, arg " ", arg -1) (raises)
+                    def_cursor _11: int = i
+                    def line: lent string = borrow a[_11]
+                    def_cursor _13: string = line[]
+                    def splitted: seq[string] = split(arg _13, arg " ", arg -1) (raises)
                     scope:
-                      def_cursor _6: string = splitted[0]
-                      def _7: bool = eqStr(arg _6, arg "opt")
-                      if _7:
+                      def_cursor _14: string = splitted[0]
+                      def _15: bool = eqStr(arg _14, arg "opt")
+                      if _15:
                         scope:
-                          def_cursor _10: string = splitted[1]
-                          =copy(name lan_ip, arg _10)
-                    def_cursor _8: string = lan_ip
-                    echo(arg type(array[0..0, string]), arg _8) (raises)
-                    def_cursor _9: string = splitted[1]
-                    echo(arg type(array[0..0, string]), arg _9) (raises)
+                          def_cursor _18: string = splitted[1]
+                          =copy(name lan_ip, arg _18)
+                    def_cursor _16: string = lan_ip
+                    echo(arg type(array[0..0, string]), arg _16) (raises)
+                    def_cursor _17: string = splitted[1]
+                    echo(arg type(array[0..0, string]), arg _17) (raises)
                   finally:
                     =destroy(name splitted)
                 i = addI(arg i, arg 1) (raises)
@@ -136,30 +136,30 @@ scope:
     =copy(name shadowScope, arg c[].currentScope)
     rawCloseScope(arg c) (raises)
     scope:
-      def_cursor _0: Scope = shadowScope
-      def_cursor a: seq[Symbol] = _0[].symbols
+      def_cursor _4: Scope = shadowScope
+      def_cursor a: seq[Symbol] = _4[].symbols
       def i: int = 0
-      def_cursor _1: seq[Symbol] = a
-      def L: int = lengthSeq(arg _1)
+      def_cursor _7: seq[Symbol] = a
+      def L: int = lengthSeq(arg _7)
       block L0:
         scope:
           while true:
             scope:
-              def_cursor _2: int = i
-              def :tmp: bool = ltI(arg _2, arg L)
+              def_cursor _9: int = i
+              def :tmp: bool = ltI(arg _9, arg L)
               scope:
-                def_cursor _3: bool = :tmp
-                def _4: bool = not(arg _3)
-                if _4:
+                def_cursor _10: bool = :tmp
+                def _11: bool = not(arg _10)
+                if _11:
                   scope:
                     break L0
               scope:
                 scope:
-                  def_cursor _5: int = i
-                  def sym: lent Symbol = borrow a[_5]
-                  def _6: Symbol
-                  =copy(name _6, arg sym[])
-                  addInterfaceDecl(arg c, consume _6) (raises)
+                  def_cursor _13: int = i
+                  def sym: lent Symbol = borrow a[_13]
+                  def _14: Symbol
+                  =copy(name _14, arg sym[])
+                  addInterfaceDecl(arg c, consume _14) (raises)
                 i = addI(arg i, arg 1) (raises)
   finally:
     =destroy(name shadowScope)
@@ -170,20 +170,20 @@ scope:
   try:
     def x: sink string
     scope:
-      def_cursor _0: sink string = x
-      def _1: int = lengthStr(arg _0)
-      def _2: bool = eqI(arg _1, arg 2)
-      if _2:
+      def_cursor _2: sink string = x
+      def _3: int = lengthStr(arg _2)
+      def _4: bool = eqI(arg _3, arg 2)
+      if _4:
         scope:
           result := move x
           wasMoved(name x)
           return
-    def_cursor _3: sink string = x
-    def _4: int = lengthStr(arg _3)
-    def _5: string = $(arg _4) (raises)
-    echo(arg type(array[0..0, string]), arg _5) (raises)
+    def_cursor _5: sink string = x
+    def _6: int = lengthStr(arg _5)
+    def _7: string = $(arg _6) (raises)
+    echo(arg type(array[0..0, string]), arg _7) (raises)
   finally:
-    =destroy(name _5)
+    =destroy(name _7)
     =destroy(name x)
 
 -- end of expandArc ------------------------
@@ -191,49 +191,49 @@ scope:
 
 scope:
   try:
-    def_cursor _0: string = this[].value
-    this[].isValid = fileExists(arg _0) (raises)
-    def _1: tuple[dir: string, front: string]
+    def_cursor _2: string = this[].value
+    this[].isValid = fileExists(arg _2) (raises)
+    def _4: tuple[dir: string, front: string]
     block L0:
       scope:
-        def_cursor _2: string = this[].value
-        def _3: bool = dirExists(arg _2) (raises)
-        if _3:
+        def_cursor _5: string = this[].value
+        def _6: bool = dirExists(arg _5) (raises)
+        if _6:
           scope:
-            def _4: string
-            =copy(name _4, arg this[].value)
-            _1 := construct (consume _4, consume "")
+            def _7: string
+            =copy(name _7, arg this[].value)
+            _4 := construct (consume _7, consume "")
             break L0
       scope:
         try:
-          def_cursor _5: string = this[].value
-          def _6: string = parentDir(arg _5) (raises)
-          def _7: string
-          =copy(name _7, arg this[].value)
-          def _8: tuple[head: string, tail: string] = splitPath(consume _7) (raises)
-          bind_mut _16: string = _8.1
-          def _9: string = move _16
-          wasMoved(name _16)
-          _1 := construct (consume _6, consume _9)
-          wasMoved(name _6)
+          def_cursor _8: string = this[].value
+          def _9: string = parentDir(arg _8) (raises)
+          def _10: string
+          =copy(name _10, arg this[].value)
+          def _11: tuple[head: string, tail: string] = splitPath(consume _10) (raises)
+          bind_mut _19: string = _11.1
+          def _12: string = move _19
+          wasMoved(name _19)
+          _4 := construct (consume _9, consume _12)
+          wasMoved(name _9)
         finally:
-          =destroy(name _8)
-          =destroy(name _6)
-    def par: tuple[dir: string, front: string] = move _1
+          =destroy(name _11)
+          =destroy(name _9)
+    def par: tuple[dir: string, front: string] = move _4
     block L1:
       scope:
-        def_cursor _10: string = par.0
-        def _11: bool = dirExists(arg _10) (raises)
-        if _11:
+        def_cursor _13: string = par.0
+        def _14: bool = dirExists(arg _13) (raises)
+        if _14:
           scope:
-            def_cursor _12: string = par.0
-            def_cursor _13: string = par.1
-            def _14: seq[string] = getSubDirs(arg _12, arg _13) (raises)
-            =sink(name this[].matchDirs, arg _14)
+            def_cursor _15: string = par.0
+            def_cursor _16: string = par.1
+            def _17: seq[string] = getSubDirs(arg _15, arg _16) (raises)
+            =sink(name this[].matchDirs, arg _17)
             break L1
       scope:
-        def _15: seq[string] = construct ()
-        =sink(name this[].matchDirs, arg _15)
+        def _18: seq[string] = construct ()
+        =sink(name this[].matchDirs, arg _18)
   finally:
     =destroy(name par)
 -- end of expandArc ------------------------'''
diff --git a/tests/arc/topt_refcursors.nim b/tests/arc/topt_refcursors.nim
index e0d466b1f3e..6544c1ca6dc 100644
--- a/tests/arc/topt_refcursors.nim
+++ b/tests/arc/topt_refcursors.nim
@@ -9,41 +9,41 @@ scope:
     scope:
       while true:
         scope:
-          def_cursor _0: Node = it
-          def _1: bool = eqRef(arg _0, arg nil)
-          def :tmp: bool = not(arg _1)
+          def_cursor _4: Node = it
+          def _5: bool = eqRef(arg _4, arg nil)
+          def :tmp: bool = not(arg _5)
           scope:
-            def_cursor _2: bool = :tmp
-            def _3: bool = not(arg _2)
-            if _3:
+            def_cursor _6: bool = :tmp
+            def _7: bool = not(arg _6)
+            if _7:
               scope:
                 break L0
           scope:
-            def_cursor _4: Node = it
-            def_cursor _5: string = _4[].s
-            echo(arg type(array[0..0, string]), arg _5) (raises)
-            def_cursor _6: Node = it
-            it = _6[].ri
+            def_cursor _8: Node = it
+            def_cursor _9: string = _8[].s
+            echo(arg type(array[0..0, string]), arg _9) (raises)
+            def_cursor _10: Node = it
+            it = _10[].ri
   def_cursor jt: Node = root
   block L1:
     scope:
       while true:
         scope:
-          def_cursor _7: Node = jt
-          def _8: bool = eqRef(arg _7, arg nil)
-          def :tmp: bool = not(arg _8)
+          def_cursor _13: Node = jt
+          def _14: bool = eqRef(arg _13, arg nil)
+          def :tmp: bool = not(arg _14)
           scope:
-            def_cursor _9: bool = :tmp
-            def _10: bool = not(arg _9)
-            if _10:
+            def_cursor _15: bool = :tmp
+            def _16: bool = not(arg _15)
+            if _16:
               scope:
                 break L1
           scope:
-            def_cursor _11: Node = jt
-            def_cursor ri: Node = _11[].ri
-            def_cursor _12: Node = jt
-            def_cursor _13: string = _12[].s
-            echo(arg type(array[0..0, string]), arg _13) (raises)
+            def_cursor _18: Node = jt
+            def_cursor ri: Node = _18[].ri
+            def_cursor _19: Node = jt
+            def_cursor _20: string = _19[].s
+            echo(arg type(array[0..0, string]), arg _20) (raises)
             jt = ri
 -- end of expandArc ------------------------'''
 """
diff --git a/tests/arc/topt_wasmoved_destroy_pairs.nim b/tests/arc/topt_wasmoved_destroy_pairs.nim
index 2d21d939f5b..42587fe13a7 100644
--- a/tests/arc/topt_wasmoved_destroy_pairs.nim
+++ b/tests/arc/topt_wasmoved_destroy_pairs.nim
@@ -11,12 +11,12 @@ scope:
     scope:
       if cond:
         scope:
-          def _0: seq[int] = move x
-          add(name a, consume _0)
+          def _5: seq[int] = move x
+          add(name a, consume _5)
           break L0
     scope:
-      def _1: seq[int] = move x
-      add(name b, consume _1)
+      def _6: seq[int] = move x
+      add(name b, consume _6)
   =destroy(name b)
   =destroy(name a)
 -- end of expandArc ------------------------
@@ -35,38 +35,38 @@ scope:
         scope:
           while true:
             scope:
-              def_cursor _0: int = i
-              def :tmp: bool = ltI(arg _0, arg b)
+              def_cursor _9: int = i
+              def :tmp: bool = ltI(arg _9, arg b)
               scope:
-                def_cursor _1: bool = :tmp
-                def _2: bool = not(arg _1)
-                if _2:
+                def_cursor _10: bool = :tmp
+                def _11: bool = not(arg _10)
+                if _11:
                   scope:
                     break L0
               scope:
                 scope:
                   def_cursor i: int = i
                   scope:
-                    def _3: bool = eqI(arg i, arg 2)
-                    if _3:
+                    def _13: bool = eqI(arg i, arg 2)
+                    if _13:
                       scope:
                         return
-                  def _4: seq[int]
-                  =copy(name _4, arg x)
-                  add(name a, consume _4)
+                  def _14: seq[int]
+                  =copy(name _14, arg x)
+                  add(name a, consume _14)
                 i = addI(arg i, arg 1) (raises)
     block L1:
       scope:
         if cond:
           scope:
-            def _5: seq[int] = move x
+            def _15: seq[int] = move x
             wasMoved(name x)
-            add(name a, consume _5)
+            add(name a, consume _15)
             break L1
       scope:
-        def _6: seq[int] = move x
+        def _16: seq[int] = move x
         wasMoved(name x)
-        add(name b, consume _6)
+        add(name b, consume _16)
   finally:
     =destroy(name x)
     =destroy(name b)
@@ -81,11 +81,11 @@ scope:
       if cond:
         scope:
           return
-    def _0: string = boolToStr(arg cond)
-    str := move _0
+    def _4: string = boolToStr(arg cond)
+    str := move _4
     scope:
-      def _1: bool = not(arg cond)
-      if _1:
+      def _5: bool = not(arg cond)
+      if _5:
         scope:
           result := move str
           wasMoved(name str)
diff --git a/tests/compiler/ttreechangesets.nim b/tests/compiler/ttreechangesets.nim
index 8cab8415fe8..30043cbff9b 100644
--- a/tests/compiler/ttreechangesets.nim
+++ b/tests/compiler/ttreechangesets.nim
@@ -13,9 +13,9 @@ import
 type Changeset = TreeChangeset
 
 proc temp(x: int): MirNode =
-  MirNode(kind: mnkTemp, temp: x.TempId)
+  MirNode(kind: mnkTemp, local: x.LocalId)
 
-func `==`(a: TempId, b: int): bool =
+func `==`(a: LocalId, b: int): bool =
   a.int == b
 
 func insert(c: var Changeset, i: int, n: sink MirNode) =
@@ -29,7 +29,7 @@ func `==`(a, b: MirNode): bool =
   # only implements the comparisons needed by the tests
   case a.kind
   of mnkTemp:
-    result = a.temp == b.temp
+    result = a.local == b.local
   else:
     doAssert false
 
diff --git a/tests/exception/truntime_check_panics.nim b/tests/exception/truntime_check_panics.nim
index d770f2a4c5a..ee292e3d09c 100644
--- a/tests/exception/truntime_check_panics.nim
+++ b/tests/exception/truntime_check_panics.nim
@@ -13,19 +13,19 @@ scope:
   chckIndex(arg a, arg i)
   discard a[i]
   chckBounds(arg a, arg 0, arg i)
-  def _0: openArray[int] = toOpenArray a, 0, i
-  def _1: int = addI(arg i, arg i)
-  def _2: int = unaryMinusI(arg i)
-  def _3: range 0..1(int) = chckRange(arg i, arg 0, arg 1)
+  def _6: openArray[int] = toOpenArray a, 0, i
+  def _7: int = addI(arg i, arg i)
+  def _8: int = unaryMinusI(arg i)
+  def _9: range 0..1(int) = chckRange(arg i, arg 0, arg 1)
   chckField(arg <D0>, arg o.kind, arg false, arg "field \'x\' is not accessible for type \'Object\' using \'kind = ")
   discard o.kind.x
-  def _5: bool = isNil(arg r)
-  def _4: bool = not(arg _5)
-  if _4:
+  def _11: bool = isNil(arg r)
+  def _10: bool = not(arg _11)
+  if _10:
     chckObj(arg r, arg type(Sub:ObjectType))
   discard r.(Sub)
-  def _6: float = mulF64(arg f, arg f)
-  chckNaN(arg _6)
+  def _12: float = mulF64(arg f, arg f)
+  chckNaN(arg _12)
 
 -- end of expandArc ------------------------'''
 """
diff --git a/tests/lang_objects/destructor/tv2_cast.nim b/tests/lang_objects/destructor/tv2_cast.nim
index e0a0f43f00a..c54fdbad387 100644
--- a/tests/lang_objects/destructor/tv2_cast.nim
+++ b/tests/lang_objects/destructor/tv2_cast.nim
@@ -7,63 +7,63 @@ destroying O1'''
   nimout: '''--expandArc: main
 scope:
   try:
-    def _0: string = newString(arg 100)
-    def_cursor _1: seq[byte] = cast _0
-    def _2: openArray[byte] = toOpenArray _1
-    def _3: seq[byte] = encode(arg _2) (raises)
-    def_cursor _4: string = cast _3
+    def _2: string = newString(arg 100)
+    def_cursor _3: seq[byte] = cast _2
+    def _4: openArray[byte] = toOpenArray _3
+    def _5: seq[byte] = encode(arg _4) (raises)
+    def_cursor _6: string = cast _5
     def data: string
-    =copy(name data, arg _4)
+    =copy(name data, arg _6)
   finally:
     =destroy(name data)
-    =destroy(name _3)
-    =destroy(name _0)
+    =destroy(name _5)
+    =destroy(name _2)
 -- end of expandArc ------------------------
 --expandArc: main1
 scope:
   try:
     def s: string = newString(arg 100)
-    def_cursor _0: string = s
-    def _1: int = lengthStr(arg _0)
-    def _2: int = subI(arg _1, arg 1) (raises)
-    chckBounds(arg s, arg 0, arg _2) (raises)
-    def _3: openArray[byte] = toOpenArray s, 0, _2
-    def _4: seq[byte] = encode(arg _3) (raises)
-    def_cursor _5: string = cast _4
+    def_cursor _3: string = s
+    def _4: int = lengthStr(arg _3)
+    def _5: int = subI(arg _4, arg 1) (raises)
+    chckBounds(arg s, arg 0, arg _5) (raises)
+    def _6: openArray[byte] = toOpenArray s, 0, _5
+    def _7: seq[byte] = encode(arg _6) (raises)
+    def_cursor _8: string = cast _7
     def data: string
-    =copy(name data, arg _5)
+    =copy(name data, arg _8)
   finally:
     =destroy(name data)
-    =destroy(name _4)
+    =destroy(name _7)
     =destroy(name s)
 -- end of expandArc ------------------------
 --expandArc: main2
 scope:
   try:
     def s: seq[byte] = newSeq(arg 100) (raises)
-    def _0: openArray[byte] = toOpenArray s
-    def _1: seq[byte] = encode(arg _0) (raises)
-    def_cursor _2: string = cast _1
+    def _3: openArray[byte] = toOpenArray s
+    def _4: seq[byte] = encode(arg _3) (raises)
+    def_cursor _5: string = cast _4
     def data: string
-    =copy(name data, arg _2)
+    =copy(name data, arg _5)
   finally:
     =destroy(name data)
-    =destroy(name _1)
+    =destroy(name _4)
     =destroy(name s)
 -- end of expandArc ------------------------
 --expandArc: main3
 scope:
   try:
-    def _0: seq[byte] = newSeq(arg 100) (raises)
-    def _1: openArray[byte] = toOpenArray _0
-    def _2: seq[byte] = encode(arg _1) (raises)
-    def_cursor _3: string = cast _2
+    def _2: seq[byte] = newSeq(arg 100) (raises)
+    def _3: openArray[byte] = toOpenArray _2
+    def _4: seq[byte] = encode(arg _3) (raises)
+    def_cursor _5: string = cast _4
     def data: string
-    =copy(name data, arg _3)
+    =copy(name data, arg _5)
   finally:
     =destroy(name data)
+    =destroy(name _4)
     =destroy(name _2)
-    =destroy(name _0)
 -- end of expandArc ------------------------'''
 """
 
diff --git a/tests/misc/tdont_fold_procedure_cast.nim b/tests/misc/tdont_fold_procedure_cast.nim
index 81e6ce7d4c2..e34028e0ef0 100644
--- a/tests/misc/tdont_fold_procedure_cast.nim
+++ b/tests/misc/tdont_fold_procedure_cast.nim
@@ -8,10 +8,10 @@ discard """
   nimout: '''
 --expandArc: test
 scope:
-  def_cursor _0: proc (x: float){.nimcall.} = cast other
-  def p: proc (x: float){.nimcall.} = copy _0
-  def_cursor _1: proc (x: int){.nimcall.} = cast p
-  _1(arg 1) (raises)
+  def_cursor _2: proc (x: float){.nimcall.} = cast other
+  def p: proc (x: float){.nimcall.} = copy _2
+  def_cursor _3: proc (x: int){.nimcall.} = cast p
+  _3(arg 1) (raises)
 -- end of expandArc ------------------------
   '''
   output: "1"

From af3b15a35f083ff50f2d3bf5a25008a3a2f89bd2 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sat, 30 Mar 2024 20:44:26 +0100
Subject: [PATCH 050/169] fix(sem): wrong error reported for `raise` (#1261)

## Summary

Fix an error in the operand expression of a `raise` statement being
hidden behind an unrelated "only a 'ref object' can be raised" error;
the operand's own error is now reported instead.

Fixes https://github.com/nim-works/nimskull/issues/112

## Details

* make `semRaise` `nkError`-aware (proper error propagation)
* don't modify input AST in `semRaise`
* replace `localReport` in `semRaise` with `nkError`; the necessary
  diagnostics corresponding to the legacy reports are introduced
---
 compiler/ast/ast_types.nim        |  4 ++++
 compiler/front/cli_reporter.nim   |  7 +++++++
 compiler/front/msgs.nim           |  2 ++
 compiler/sem/semstmts.nim         | 32 ++++++++++++++++++-------------
 tests/errmsgs/terror_in_raise.nim |  6 ++++++
 5 files changed, 38 insertions(+), 13 deletions(-)
 create mode 100644 tests/errmsgs/terror_in_raise.nim

diff --git a/compiler/ast/ast_types.nim b/compiler/ast/ast_types.nim
index e4fc830088c..429afb3a4ba 100644
--- a/compiler/ast/ast_types.nim
+++ b/compiler/ast/ast_types.nim
@@ -1191,6 +1191,8 @@ type
     adSemDotOperatorsNotEnabled
     adSemCallOperatorsNotEnabled
     adSemUnexpectedPattern
+    adSemCannotBeRaised
+    adSemCannotRaiseNonException
     # types
     adSemTypeKindMismatch
     # semexprs
@@ -1349,6 +1351,8 @@ type
         adSemDotOperatorsNotEnabled,
         adSemCallOperatorsNotEnabled,
         adSemUnexpectedPattern,
+        adSemCannotBeRaised,
+        adSemCannotRaiseNonException,
         adSemIsOperatorTakes2Args,
         adSemNoTupleTypeForConstructor,
         adSemInvalidOrderInArrayConstructor,
diff --git a/compiler/front/cli_reporter.nim b/compiler/front/cli_reporter.nim
index de634c0cc33..647658542f9 100644
--- a/compiler/front/cli_reporter.nim
+++ b/compiler/front/cli_reporter.nim
@@ -3831,6 +3831,13 @@ func astDiagToLegacyReport(conf: ConfigRef, diag: PAstDiag): Report {.inline.} =
       ast: diag.wrongNode,
       str: diag.compilerOpt.getStr,
       compilerOptArg: diag.compilerOptArg.getStr)
+  of adSemCannotBeRaised, adSemCannotRaiseNonException:
+    semRep = SemReport(
+      location: some diag.location,
+      reportInst: diag.instLoc.toReportLineInfo,
+      kind: kind,
+      ast: diag.wrongNode,
+      typ: diag.wrongNode[0].typ)
   of adVmError:
     let
       kind = diag.vmErr.kind.astDiagVmToLegacyReportKind()
diff --git a/compiler/front/msgs.nim b/compiler/front/msgs.nim
index 37dd2a33572..735abc46a94 100644
--- a/compiler/front/msgs.nim
+++ b/compiler/front/msgs.nim
@@ -531,6 +531,8 @@ func astDiagToLegacyReportKind*(
   of adSemDotOperatorsNotEnabled: rsemEnableDotOperatorsExperimental
   of adSemCallOperatorsNotEnabled: rsemEnableCallOperatorExperimental
   of adSemUnexpectedPattern: rsemUnexpectedPattern
+  of adSemCannotBeRaised: rsemCannotBeRaised
+  of adSemCannotRaiseNonException: rsemCannotRaiseNonException
   of adSemConstantOfTypeHasNoValue: rsemConstantOfTypeHasNoValue
   of adSemTypeConversionArgumentMismatch: rsemTypeConversionArgumentMismatch
   of adSemUnexpectedEqInObjectConstructor: rsemUnexpectedEqInObjectConstructor
diff --git a/compiler/sem/semstmts.nim b/compiler/sem/semstmts.nim
index ed49396a823..f027b528573 100644
--- a/compiler/sem/semstmts.nim
+++ b/compiler/sem/semstmts.nim
@@ -1730,20 +1730,26 @@ proc semCase(c: PContext, n: PNode; flags: TExprFlags): PNode =
     result.typ = typ
 
 proc semRaise(c: PContext, n: PNode): PNode =
-  result = n
   checkSonsLen(n, 1, c.config)
-  if n[0].kind != nkEmpty:
-    n[0] = semExprWithType(c, n[0])
-    var typ = n[0].typ
-    if not isImportedException(typ, c.config):
-      typ = typ.skipTypes({tyAlias, tyGenericInst})
-      if typ.kind != tyRef:
-        localReport(c.config, n.info, reportTyp(
-          rsemCannotBeRaised, typ))
-
-      if typ.len > 0 and not isException(typ.lastSon):
-        localReport(c.config, n.info, reportTyp(
-          rsemCannotRaiseNonException, typ))
+  result = shallowCopy(n)
+  case n[0].kind
+  of nkEmpty:
+    # make sure to copy, the nfSem flag needs to be included
+    result[0] = copyNode(n[0])
+    result[0].flags.incl nfSem
+  else:
+    result[0] = semExprWithType(c, n[0])
+    let typ = result[0].typ
+    if result[0].kind == nkError:
+      result = c.config.wrapError(result)
+    elif not isImportedException(typ, c.config):
+      let refTyp = typ.skipTypes({tyAlias, tyGenericInst})
+      if refTyp.kind != tyRef:
+        result = c.config.newError(result,
+          PAstDiag(kind: adSemCannotBeRaised))
+      elif not isException(refTyp.lastSon):
+        result = c.config.newError(result,
+          PAstDiag(kind: adSemCannotRaiseNonException))
 
 proc addGenericParamListToScope(c: PContext, n: PNode) =
   if n.kind != nkGenericParams:
diff --git a/tests/errmsgs/terror_in_raise.nim b/tests/errmsgs/terror_in_raise.nim
new file mode 100644
index 00000000000..360586e60ae
--- /dev/null
+++ b/tests/errmsgs/terror_in_raise.nim
@@ -0,0 +1,6 @@
+discard """
+  errormsg: "undeclared identifier: 'doesntExist'"
+  line: 6
+"""
+
+raise doesntExist

From d7426b7f62ca1ad04bdfa146976299fbf64be8df Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sat, 30 Mar 2024 20:56:33 +0100
Subject: [PATCH 051/169] vmjit: remove expression-related workaround (#1262)

## Summary

Make the MIR tree produced for standalone expressions (e.g.,
initializer of a `const`) syntactically well-formed. Previously, these
trees contained a trailing MIR expression, which required various
workarounds in other places (all of which are now removed).

## Details

* add the `exprToMir` procedure to `mirgen`; it produces a proper MIR
  body for standalone expressions by assigning the expression to the
  result variable
  * the body is wrapped in a scope (`mnkScope`), which means passes can
    now rely on the presence of an outermost scope block
* use `exprToMir` in `vmjit` for producing the MIR body for standalone
  expressions
* remove the dedicated code generation for standalone expressions from
  `vmgen` (`genExpr`)
* unify the expression/statement handling in `vmjit`
* remove the workarounds for trailing expressions from `cgirgen` and
  `mirpasses`

To replicate the previous behaviour, where no copy of the value was
introduced for lvalue expressions, `vmjit` wraps standalone lvalue
expressions in an `nkHiddenAddr`, prior to passing the AST to
`exprToMir`.
---
 compiler/backend/cgirgen.nim | 17 +++------
 compiler/mir/mirgen.nim      | 40 +++++++++++++++------
 compiler/mir/mirpasses.nim   | 15 +-------
 compiler/vm/vmgen.nim        | 37 +++-----------------
 compiler/vm/vmjit.nim        | 68 ++++++++++++------------------------
 5 files changed, 62 insertions(+), 115 deletions(-)

diff --git a/compiler/backend/cgirgen.nim b/compiler/backend/cgirgen.nim
index 36415619ac6..75ad42ce1e2 100644
--- a/compiler/backend/cgirgen.nim
+++ b/compiler/backend/cgirgen.nim
@@ -272,7 +272,7 @@ func disable(cl: var TranslateCl) {.inline.} =
 proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
               cr: var TreeCursor, stmts: var seq[CgNode])
 proc scopeToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
-               cr: var TreeCursor, stmts: var seq[CgNode], allowExpr=false)
+               cr: var TreeCursor, stmts: var seq[CgNode])
 
 proc handleSpecialConv(c: ConfigRef, n: CgNode, info: TLineInfo,
                        dest: PType): CgNode =
@@ -1050,12 +1050,8 @@ proc genDefFor(sym: sink CgNode): CgNode =
     unreachable()
 
 proc scopeToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
-               cr: var TreeCursor, stmts: var seq[CgNode],
-               allowExpr = false) =
+               cr: var TreeCursor, stmts: var seq[CgNode]) =
   let
-    ends =
-      if allowExpr: {mnkEnd} + Atoms
-      else:         {mnkEnd}
     prev = cl.defs.len
     prevInUnscoped = cl.inUnscoped
     start = stmts.len
@@ -1064,7 +1060,7 @@ proc scopeToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
   cl.inUnscoped = false
 
   # translate all statements:
-  while cr.hasNext(tree) and tree[cr].kind notin ends:
+  while cr.hasNext(tree) and tree[cr].kind != mnkEnd:
     stmtToIr(tree, env, cl, cr, stmts)
 
   if cr.hasNext(tree) and tree[cr].kind == mnkEnd:
@@ -1085,7 +1081,7 @@ proc tb(tree: MirBody, env: MirEnv, cl: var TranslateCl,
   ## Translate `tree` to the corresponding ``CgNode`` representation.
   var cr = TreeCursor(pos: start.uint32)
   var stmts: seq[CgNode]
-  scopeToIr(tree, env, cl, cr, stmts, allowExpr=true)
+  scopeToIr(tree, env, cl, cr, stmts)
   if cl.raiseExits.len > 0:
     # there's unhandled exceptional control-flow
     patchResume(cl.raiseExits, 0)
@@ -1094,11 +1090,6 @@ proc tb(tree: MirBody, env: MirEnv, cl: var TranslateCl,
   if cl.returnLabel.isSome:
     join unknownLineInfo, cl.returnLabel.get()
 
-  if cr.hasNext(tree):
-    # the tree must be an expression; the last node is required to be an atom
-    let x = atomToIr(tree, cl, cr)
-    stmts.add x
-
   # XXX: the list of statements is still wrapped in a node for now, but
   #      this needs to change once all code generators use the new CGIR
   result = newStmt(cnkStmtList, unknownLineInfo)
diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index a5f497da1d6..d9d2a0f11e8 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -2050,16 +2050,6 @@ proc generateCode*(graph: ModuleGraph, env: var MirEnv,
   if n.typ.isEmptyType:
     withFront c.builder:
       gen(c, n)
-  elif n.typ.kind == tyTypeDesc:
-    # FIXME: this shouldn't happen, but type expressions are sometimes
-    #        evaluated with the VM, such as a ``typeof(T.x)`` appearing as
-    #        a field type within a generic object definition. While it makes
-    #        sense to allow evaluating type expression with the VM, in simple
-    #        situtations like the example above, it's simpler, faster, and more
-    #        intuitive to either evaluate them directly when analying the type
-    #        expression or during ``semfold``
-    c.builder.useSource(c.sp, n)
-    c.use genTypeExpr(c, n)
   else:
     c.builder.useSource(c.sp, n)
     # XXX: restructure the ``mirgen`` API to use a dedicated procedure for
@@ -2166,6 +2156,36 @@ proc generateCode*(graph: ModuleGraph, env: var MirEnv, owner: PSym,
   let (code, locals) = finish(move c.builder, default(Store[LocalId, Local]))
   MirBody(locals: locals, source: move c.sp.map, code: code)
 
+proc exprToMir*(graph: ModuleGraph, env: var MirEnv,
+                config: TranslationConfig, e: PNode): MirBody =
+  ## Only meant to be used by `vmjit <#vmjit>`_. Produces a MIR body for a
+  ## standalone expression. The result of the expression is assigned to the
+  ## special local with ID 0.
+  var c = TCtx(context: skUnknown, graph: graph, config: config)
+  c.sp.active = (e, c.sp.map.add(e))
+  swap(c.env, env)
+
+  let res = c.addLocal(Local(typ: e.typ)) # the result variable
+  c.scope:
+    c.buildStmt mnkDef:
+      c.use toValue(mnkLocal, res, e.typ)
+      if e.typ.kind == tyTypeDesc:
+        # FIXME: this shouldn't happen, but type expressions are sometimes
+        #        evaluated with the VM, such as a ``typeof(T.x)`` appearing as
+        #        a field type within a generic object definition. While it
+        #        makes sense to allow evaluating type expressions with the VM,
+        #        in simple situations like the example above, it's simpler,
+        #        faster, and more intuitive to either evaluate them directly
+        #        when analyzing the type expression, or during ``semfold``
+        c.use genTypeExpr(c, e)
+      else:
+        c.genAsgnSource(e, {dfOwns, dfEmpty})
+
+  swap(c.env, env)
+
+  let (code, locals) = finish(move c.builder, default(Store[LocalId, Local]))
+  MirBody(locals: locals, source: move c.sp.map, code: code)
+
 proc constDataToMir*(env: var MirEnv, n: PNode): MirTree =
   ## Translates the construction expression AST `n` representing some
   ## constant data to its corresponding MIR representation.
diff --git a/compiler/mir/mirpasses.nim b/compiler/mir/mirpasses.nim
index 18c053754e6..e682726946d 100644
--- a/compiler/mir/mirpasses.nim
+++ b/compiler/mir/mirpasses.nim
@@ -208,16 +208,6 @@ proc eliminateTemporaries(tree: MirTree, changes: var Changeset) =
   ##   call(arg a.b.c)
   var ct = initCountTable[uint32]()
 
-  proc isDangerous(tree: MirTree, n: NodePosition): bool =
-    # HACK: this is a tremendous hack to detect whether `n` is part of a
-    #       loose expression, which are currently required by expression
-    #       support for ``vmjit``. Remove as soon as no longer needed
-    var i = int n
-    while i < tree.len and tree[i].kind notin StmtNodes:
-      inc i
-
-    result = i >= tree.len
-
   # first pass: gather all single-use temporaries that are created from
   # lvalues and are eligible for elimination.
   var i = NodePosition 0
@@ -240,10 +230,7 @@ proc eliminateTemporaries(tree: MirTree, changes: var Changeset) =
       #      looking for names
       let id = tree[i].local
       if hasKey(ct, id.uint32):
-        if isDangerous(tree, i):
-          ct.del(id.uint32)
-        else:
-          ct.inc(id.uint32)
+        ct.inc(id.uint32)
 
       inc i
     of mnkDeref, mnkDerefView:
diff --git a/compiler/vm/vmgen.nim b/compiler/vm/vmgen.nim
index 31ccf2a6f19..6100ed15980 100644
--- a/compiler/vm/vmgen.nim
+++ b/compiler/vm/vmgen.nim
@@ -3198,45 +3198,16 @@ proc genStmt*(c: var TCtx; body: sink Body): Result[int, VmGenDiag] =
   c.prc = initProc(c, nil, body)
   let n = c.prc.body.code
 
-  var d: TDest = -1
   try:
     let eh = genSetEh(c, n.info)
-    c.gen(n, d)
+    c.gen(n)
     c.patchSetEh(eh)
   except VmGenError as e:
     return typeof(result).err(move e.diag)
 
-  c.config.internalAssert(d < 0, n.info, "VM problem: dest register is set")
-  result = typeof(result).ok(c.prc.regInfo.len)
-
-proc genExpr*(c: var TCtx; body: sink Body): Result[int, VmGenDiag] =
-  ## Generates and emits the code for a standalone expression.
-  c.prc = initProc(c, nil, body)
-  let n = c.prc.body.code
-
-  var d: TDest = -1
-  try:
-    let eh = genSetEh(c, n.info)
-    if n.kind == cnkStmtList:
-      # special case the expression here so that ``gen`` doesn't have to
-      for i in 0..<n.len-1:
-        c.gen(n[i])
-
-      c.gen(n[^1], d)
-    else:
-      c.gen(n, d)
-
-    c.patchSetEh(eh)
-  except VmGenError as e:
-    return typeof(result).err(move e.diag)
-
-  # the destination register not being set likely indicate that `n` is not an
-  # expression
-  c.config.internalAssert(d != noDest, n.info):
-    "VM problem: dest register is not set"
-  # standalone expressions are treated as nullary procedures that
-  # directly return the value
-  c.gABC(n, opcRet, d)
+  if not isEmptyType(c.prc.body[resultId].typ):
+    # the body has a result, emit a return
+    c.gABC(n, opcRet, c.prc[resultId].reg)
 
   result = typeof(result).ok(c.prc.regInfo.len)
 
diff --git a/compiler/vm/vmjit.nim b/compiler/vm/vmjit.nim
index dbd2f972444..e195db205c2 100644
--- a/compiler/vm/vmjit.nim
+++ b/compiler/vm/vmjit.nim
@@ -32,7 +32,6 @@ import
     datatables,
     mirbodies,
     mirbridge,
-    mirconstr,
     mirenv,
     mirgen,
     mirpasses,
@@ -44,9 +43,6 @@ import
   compiler/sem/[
     transf
   ],
-  compiler/utils/[
-    containers
-  ],
   compiler/vm/[
     identpatterns,
     vmaux,
@@ -61,6 +57,11 @@ import
     results
   ]
 
+# XXX: temporary imports for expression support
+from compiler/ast/ast import newTreeIT
+from compiler/sem/semdata import makeVarType
+from compiler/sem/parampatterns import isAssignable, TAssignableResult
+
 export VmGenResult
 
 type
@@ -148,17 +149,19 @@ proc generateMirCode(c: var TCtx, env: var MirEnv, n: PNode;
                      isStmt = false): MirBody =
   ## Generates the initial MIR code for a standalone statement/expression.
   if isStmt:
-    # we want statements wrapped in a scope, hence generating a proper
-    # fragment
     result = generateCode(c.graph, env, c.module, selectOptions(c), n)
   else:
-    var bu: MirBuilder
-     # add an empty local so that the result slot is occupied:
-    discard bu.addLocal(Local())
-    # XXX: ^^ this is a hack, and yet another reason to remove expression
-    #      support from the JIT
-    generateCode(c.graph, env, selectOptions(c), n, bu, result.source)
-    (result.code, result.locals) = finish(bu, default(Store[LocalId, Local]))
+    var n = n
+    # optimization: wrap the expression in a hidden address if it's an lvalue
+    # expression. This eliminates the unnecessary copy that would be created
+    # otherwise
+    if isAssignable(nil, n, isUnsafeAddr=true) in {arLocalLValue, arLValue,
+                                                   arLentValue}:
+      n = newTreeIT(nkHiddenAddr, n.info,
+                    makeVarType(c.module, n.typ, c.idgen, tyLent),
+                    n)
+
+    result = exprToMir(c.graph, env, selectOptions(c), n)
 
 proc generateIR(c: var TCtx, env: MirEnv, body: sink MirBody): Body =
   backends.generateIR(c.graph, c.idgen, env, c.module, body)
@@ -194,15 +197,14 @@ proc applyPasses(c: var TCtx, env: var MirEnv, prc: PSym, body: var MirBody) =
   if restore:
     prc.options.incl optProfiler
 
-proc genStmt*(jit: var JitState, c: var TCtx; n: PNode): VmGenResult =
-  ## Generates and emits code for the standalone top-level statement `n`.
+proc gen(jit: var JitState, c: var TCtx, n: PNode, isStmt: bool): VmGenResult =
   preCheck(jit.gen.env, n)
   c.removeLastEof()
 
   let cp = checkpoint(jit.gen.env)
 
   # `n` is expected to have been put through ``transf`` already
-  var mirBody = generateMirCode(c, jit.gen.env, n, isStmt = true)
+  var mirBody = generateMirCode(c, jit.gen.env, n, isStmt)
   applyPasses(c, jit.gen.env, c.module, mirBody)
   for _ in discover(jit.gen.env, cp):
     discard "nothing to register"
@@ -222,37 +224,13 @@ proc genStmt*(jit: var JitState, c: var TCtx; n: PNode): VmGenResult =
 
   result = VmGenResult.ok: (start: start, regCount: r.get)
 
+proc genStmt*(jit: var JitState, c: var TCtx, n: PNode): VmGenResult =
+  ## Generates and emits code for the standalone top-level statement `n`.
+  gen(jit, c, n, isStmt = true)
+
 proc genExpr*(jit: var JitState, c: var TCtx, n: PNode): VmGenResult =
   ## Generates and emits code for the standalone expression `n`
-  preCheck(jit.gen.env, n)
-  c.removeLastEof()
-
-  # XXX: the way standalone expressions are currently handled is going to
-  #      be a problem as soon as proper MIR passes need to be run (which
-  #      all expect statements). Ideally, dedicated support for
-  #      expressions would be removed from the JIT.
-
-  let cp = checkpoint(jit.gen.env)
-
-  var mirBody = generateMirCode(c, jit.gen.env, n)
-  applyPasses(c, jit.gen.env, c.module, mirBody)
-  for _ in discover(jit.gen.env, cp):
-    discard "nothing to register"
-
-  let
-    body = generateIR(c, jit.gen.env, mirBody)
-    start = c.code.len
-
-  # generate the bytecode:
-  let r = runCodeGen(c, jit.gen, body): genExpr(jit.gen, body)
-
-  if unlikely(r.isErr):
-    rewind(jit.gen.env, cp)
-    return VmGenResult.err(r.takeErr)
-
-  updateEnvironment(c, jit.gen.env, cp)
-
-  result = VmGenResult.ok: (start: start, regCount: r.get)
+  gen(jit, c, n, isStmt = false)
 
 proc genProc(jit: var JitState, c: var TCtx, s: PSym): VmGenResult =
   let body =

From b65406e2ed67604a6741fb6aba1a4c0876befc4e Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sun, 31 Mar 2024 23:51:07 +0200
Subject: [PATCH 052/169] refactor: remove `aliasanalysis.isCursor` (#1263)

## Summary

The procedure and its usage are obsolete, as `mirgen` already takes
care of cursor location handling.

## Details

With commit

https://github.com/nim-works/nimskull/commit/94837f4ca9c6b01c12ba4ae57986390b95fe887d
([PR](https://github.com/nim-works/nimskull/pull/1195)),
no `sink` operations (i.e., the only assignment modifier for which
ownership computation is required) are inserted for cursor
locations, meaning that the `isCursor` call in `computeOwnership`
always returned false.
---
 compiler/sem/aliasanalysis.nim     | 10 ----------
 compiler/sem/injectdestructors.nim |  3 +--
 2 files changed, 1 insertion(+), 12 deletions(-)

diff --git a/compiler/sem/aliasanalysis.nim b/compiler/sem/aliasanalysis.nim
index 1fdd3dff165..d5a35935e7b 100644
--- a/compiler/sem/aliasanalysis.nim
+++ b/compiler/sem/aliasanalysis.nim
@@ -114,16 +114,6 @@ proc getRoot*(tree: MirTree, n: OpValue): OpValue =
   else:
     result = pos
 
-func isCursor*(tree: MirTree, path: Path): bool =
-  ## Returns whether the path `n` denotes a cursor location.
-  # XXX: this is an intermediate solution. ``mirgen`` is going to handle
-  #      all cursor-related behaviour in the future, which will make this
-  #      procedure obsolete
-  for i in 0..<path.len:
-    if path[i].kind == pikNamed and sfCursor in tree[path[i].node].field.flags:
-      result = true
-      break
-
 proc computePath*(tree: MirTree, at: NodePosition): Path =
   ## Computes the ``Path`` for the given expression. The expression not being
   ## a path expression is allowed too.
diff --git a/compiler/sem/injectdestructors.nim b/compiler/sem/injectdestructors.nim
index 42adeb66c3c..41e2b30792c 100644
--- a/compiler/sem/injectdestructors.nim
+++ b/compiler/sem/injectdestructors.nim
@@ -294,8 +294,7 @@ func computeOwnership(tree: MirTree, cfg: DataFlowGraph, entities: EntityDict,
     #       visit it first
     var exists = false
     let info = entities.findScope(toName(tree[lval.root]), start, exists)
-    exists and not isCursor(tree, lval) and
-      isLastRead(tree, cfg, info.scope, lval, start)
+    exists and isLastRead(tree, cfg, info.scope, lval, start)
   else:
     unreachable()
 

From df9b988385b47798765805b1375e086ef6eb5f94 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Tue, 2 Apr 2024 17:39:12 +0200
Subject: [PATCH 053/169] mir: improve set construction syntax (#1264)

## Summary

Introduce a dedicated node representation for set constructions in the
MIR, making their data layout more terse and fixing a set construction
like `{a .. b}` crashing the compiler when `a` or `b` are non-constant
expressions.

## Details

* add the `mnkSetConstr` and `mnkRange` node kinds
  * since `set`s are *not* aggregate types, wrapping the operands of
    the construction in argument nodes is unnecessary
  * `mnkSetConstr` is pretty-printed as `{...}` instead of the generic
    `construct (...)`
* don't treat `nkRange` as literal data
* translate `nkRange` to `mnkRange` for both branch labels and in set
  constructions
  * dynamic ranges are now properly considered by `mirgen`
* hashing/comparison for `DataTable`, constant expression
  serialization, and data-flow graph creation are adjusted to the new
  tree shapes
* translate `mnkSetConstr` and `mnkRange` to `cnkSetConstr` and
  `cnkRange` in `cgirgen`
  * both set construction elements and branch labels use
    `setElementToIr`, even though this doesn't reject incorrect syntax
    for branch labels

In addition to fixing the aforementioned compiler crash, the dedicated
`mnkSetConstr` and `mnkRange` node kinds:
* remove a difference between the MIR and CGIR
* encode set construction semantics directly in the MIR, removing one
  reason for having to dispatch over a node's type
---
 compiler/backend/cgirgen.nim      | 24 ++++++++++++++----
 compiler/backend/compat.nim       |  8 ++++--
 compiler/mir/datatables.nim       |  8 ++----
 compiler/mir/mirgen.nim           | 42 +++++++++++++++++++++++--------
 compiler/mir/mirpasses.nim        |  2 +-
 compiler/mir/mirtrees.nim         | 12 ++++++---
 compiler/mir/proto_mir.nim        |  2 +-
 compiler/mir/utils.nim            | 10 ++++++++
 compiler/sem/mirexec.nim          |  8 ++++++
 compiler/vm/packed_env.nim        | 17 ++++++-------
 compiler/vm/vmserialize.nim       | 23 +++++++++--------
 doc/mir.rst                       | 11 ++++++--
 tests/stdlib/types/sets/tsets.nim |  9 +++++++
 13 files changed, 125 insertions(+), 51 deletions(-)

diff --git a/compiler/backend/cgirgen.nim b/compiler/backend/cgirgen.nim
index 75ad42ce1e2..0f4e4be7597 100644
--- a/compiler/backend/cgirgen.nim
+++ b/compiler/backend/cgirgen.nim
@@ -221,8 +221,6 @@ proc translateLit*(val: PNode): CgNode =
     newNode(cnkNilLit, val.info, val.typ)
   of nkNimNodeLit:
     node(cnkAstLit, astLit, val[0])
-  of nkRange:
-    node(cnkRange, kids, @[translateLit(val[0]), translateLit(val[1])])
   of nkSym:
     # special case for raw symbols used with emit and asm statements
     assert val.sym.kind == skField
@@ -912,6 +910,21 @@ proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
   of AllNodeKinds - StmtNodes:
     unreachable(n.kind)
 
+proc setElementToIr(tree: MirBody, cl: var TranslateCl,
+                    cr: var TreeCursor): CgNode =
+  ## Translates a sub-tree appearing as a branch label or in a set
+  ## construction to the CGIR.
+  case tree[cr].kind
+  of LvalueExprKinds, mnkLiteral:
+    result = valueToIr(tree, cl, cr)
+  of mnkRange:
+    discard enter(tree, cr)
+    result = newTree(cnkRange, unknownLineInfo,
+                     [valueToIr(tree, cl, cr), valueToIr(tree, cl, cr)])
+    leave(tree, cr)
+  else:
+    unreachable()
+
 proc caseToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl, n: MirNode,
               cr: var TreeCursor, stmts: var seq[CgNode]) =
   assert n.kind == mnkCase
@@ -927,8 +940,7 @@ proc caseToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl, n: MirNode,
 
     result.add newTree(cnkBranch, cr.info)
     for x in 0..<br.len:
-      assert tree[cr].kind in {mnkConst, mnkLiteral}
-      result[^1].add atomToIr(tree, cl, cr)
+      result[^1].add setElementToIr(tree, cl, cr)
 
     let label = newLabel(cl)
     result[^1].add node(label)
@@ -994,6 +1006,9 @@ proc exprToIr(tree: MirBody, cl: var TranslateCl,
     op cnkHiddenAddr, lvalueToIr(tree, cl, cr)
   of mnkDerefView:
     op cnkDerefView, atomToIr(tree, cl, cr)
+  of mnkSetConstr:
+    treeOp cnkSetConstr:
+      res.add setElementToIr(tree, cl, cr)
   of mnkObjConstr:
     assert n.typ.skipTypes(abstractVarRange).kind in {tyObject, tyRef}
     treeOp cnkObjConstr:
@@ -1004,7 +1019,6 @@ proc exprToIr(tree: MirBody, cl: var TranslateCl,
 
     let kind =
       case typ.kind
-      of tySet:               cnkSetConstr
       of tyArray, tySequence: cnkArrayConstr
       of tyTuple:             cnkTupleConstr
       of tyProc:
diff --git a/compiler/backend/compat.nim b/compiler/backend/compat.nim
index b46e62634e4..5d261776d69 100644
--- a/compiler/backend/compat.nim
+++ b/compiler/backend/compat.nim
@@ -171,8 +171,6 @@ proc translate*(t: MirTree): CgNode =
           cnkArrayConstr
         of tyTuple:
           cnkTupleConstr
-        of tySet:
-          cnkSetConstr
         of tyProc:
           cnkClosureConstr
         else:
@@ -180,6 +178,12 @@ proc translate*(t: MirTree): CgNode =
 
       tree kind:
         translateAux(t, i)
+    of mnkSetConstr:
+      tree cnkSetConstr:
+        translateAux(t, i)
+    of mnkRange:
+      tree cnkRange:
+        translateAux(t, i)
     of mnkArg:
       let x = translateAux(t, i)
       inc i # skip the end node
diff --git a/compiler/mir/datatables.nim b/compiler/mir/datatables.nim
index cefb94ba452..2650f896a86 100644
--- a/compiler/mir/datatables.nim
+++ b/compiler/mir/datatables.nim
@@ -47,15 +47,13 @@ func hashTree(tree: ConstrTree): Hash =
           hash(n.intVal)
         of nkNilLit:
           Hash(0)
-        of nkRange:
-          hashLit(n[0]) !& hashLit(n[1])
         else:
           unreachable(n.kind)
 
       result = result !& hashLit(n.lit)
     of mnkProc:
       result = result !& hash(n.prc.ord)
-    of mnkObjConstr, mnkConstr:
+    of mnkConstr, mnkSetConstr, mnkRange, mnkObjConstr:
       result = result !& hash(n.len)
     of mnkField:
       result = result !& hash(n.field.id)
@@ -88,8 +86,6 @@ func cmp(a, b: PNode): bool =
     a.strVal == b.strVal
   of nkNilLit:
     true
-  of nkRange:
-    cmp(a[0], b[0]) and cmp(a[1], b[1])
   else:
     unreachable(a.kind)
 
@@ -104,7 +100,7 @@ proc cmp(a, b: ConstrTree): bool =
       cmp(a.lit, b.lit)
     of mnkProc:
       a.prc == b.prc
-    of mnkConstr, mnkObjConstr:
+    of mnkConstr, mnkSetConstr, mnkRange, mnkObjConstr:
       a.len == b.len
     of mnkField:
       a.field.id == b.field.id
diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index d9d2a0f11e8..1fc6f8d5679 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -762,6 +762,8 @@ proc genMacroCallArgs(c: var TCtx, n: PNode, kind: TSymKind, fntyp: PType) =
     else:
       unreachable()
 
+proc genSetConstr(c: var TCtx, n: PNode)
+
 proc genInSetOp(c: var TCtx, n: PNode) =
   ## Generates and emits the IR for the ``mInSet`` magic call `n`. If
   ## the element operand is a range check, it is integrated into the
@@ -808,9 +810,7 @@ proc genInSetOp(c: var TCtx, n: PNode) =
               sv = c.allocTemp(se.typ)
               c.subTree mnkDef:
                 c.use sv
-                c.subTree MirNode(kind: mnkConstr, typ: se.typ):
-                  for it in se.items:
-                    c.emitOperandTree it, false
+                genSetConstr(c, se)
             else:
               sv = genRd(c, se)
 
@@ -1091,9 +1091,15 @@ proc genCallOrMagic(c: var TCtx, n: PNode) =
     genCall(c, n)
 
 proc genSetConstr(c: var TCtx, n: PNode) =
-  c.buildTree mnkConstr, n.typ:
+  c.buildTree mnkSetConstr, n.typ:
     for it in n.items:
-      c.emitOperandTree it, false
+      if it.kind == nkRange:
+        # watch out! the operands don't have to be literal values
+        c.subTree mnkRange:
+          c.genArgExpression(it[0], sink=false)
+          c.genArgExpression(it[1], sink=false)
+      else:
+        c.genArgExpression(it, sink=false)
 
 proc genArrayConstr(c: var TCtx, n: PNode, isConsume: bool) =
   c.buildTree mnkConstr, n.typ:
@@ -1546,8 +1552,15 @@ proc genCase(c: var TCtx, n: PNode, dest: Destination) =
       discard
     of nkOfBranch:
       # emit the lables:
-      for (_, lit) in branchLabels(branch):
-        c.add MirNode(kind: mnkLiteral, lit: lit, typ: lit.typ)
+      for (_, label) in branchLabels(branch):
+        template add(n: PNode) =
+          c.add MirNode(kind: mnkLiteral, lit: n, typ: n.typ)
+        if label.kind == nkRange:
+          c.subTree mnkRange:
+            add(label[0])
+            add(label[1])
+        else:
+          add(label)
     else:
       unreachable(branch.kind)
 
@@ -2200,8 +2213,13 @@ proc constDataToMir*(env: var MirEnv, n: PNode): MirTree =
           bu.add MirNode(kind: mnkField, field: n[i][0].sym)
           bu.subTree mnkArg:
             constToMirAux(bu, env, n[i][1])
-
-    of nkBracket, nkCurly, nkTupleConstr, nkClosure:
+    of nkCurly:
+      # similar to object construction, no normalization means that ``{1, 2}``
+      # and ``{2, 1}`` result in two data table entries
+      bu.subTree MirNode(kind: mnkSetConstr, typ: n.typ, len: n.len):
+        for it in n.items:
+          constToMirAux(bu, env, it)
+    of nkBracket, nkTupleConstr, nkClosure:
       bu.subTree MirNode(kind: mnkConstr, typ: n.typ, len: n.len):
         for it in n.items:
           bu.subTree mnkArg:
@@ -2216,7 +2234,11 @@ proc constDataToMir*(env: var MirEnv, n: PNode): MirTree =
         bu.use toValue(env.constants.add(n.sym), n.sym.typ)
       else:
         unreachable()
-    of nkLiterals, nkRange:
+    of nkRange:
+      bu.subTree MirNode(kind: mnkRange, len: 2):
+        constToMirAux(bu, env, n[0])
+        constToMirAux(bu, env, n[1])
+    of nkLiterals:
       bu.use literal(n)
     of nkHiddenStdConv, nkHiddenSubConv:
       # doesn't translate to a MIR node itself, but the type overrides
diff --git a/compiler/mir/mirpasses.nim b/compiler/mir/mirpasses.nim
index e682726946d..8b285c00e4b 100644
--- a/compiler/mir/mirpasses.nim
+++ b/compiler/mir/mirpasses.nim
@@ -321,7 +321,7 @@ proc eliminateTemporaries(tree: MirTree, changes: var Changeset) =
       of LvalueExprKinds:
         # usage in an lvalue expression -> the temporary can be elided
         elide = true
-      of RvalueExprKinds:
+      of RvalueExprKinds, mnkSetConstr:
         elide = true
       of mnkConstr, mnkObjConstr:
         # if the lvalue doesn't overlap with the assignment destination, the
diff --git a/compiler/mir/mirtrees.nim b/compiler/mir/mirtrees.nim
index 99a38d267a3..e148c0bd5b3 100644
--- a/compiler/mir/mirtrees.nim
+++ b/compiler/mir/mirtrees.nim
@@ -171,6 +171,9 @@ type
     mnkConstr     ## constructs a either new aggregate value or set value made
                   ## up of the input values. Whether the resulting value is
                   ## owned depends on whether one the context it's used in
+    mnkSetConstr  ## constructor for set values
+    mnkRange      ## range constructor. May only appear in set constructions
+                  ## and as a branch label
     mnkObjConstr  ## either allocate a new managed heap cell and returns a
                   ## ``ref`` to it, or or constructs a new aggregate value
                   ## with named fields
@@ -335,8 +338,8 @@ const
     ## Assignment modifiers. Nodes that can only appear directly in the source
     ## slot of assignments.
 
-  ConstrTreeNodes* = {mnkConstr, mnkObjConstr, mnkLiteral, mnkProc,
-                      mnkArg, mnkField, mnkEnd}
+  ConstrTreeNodes* = {mnkConstr, mnkSetConstr, mnkRange, mnkObjConstr,
+                      mnkLiteral, mnkProc, mnkArg, mnkField, mnkEnd}
     ## Nodes that can appear in the MIR subset used for constant expressions.
 
   # --- semantics-focused sets:
@@ -360,8 +363,9 @@ const
   RvalueExprKinds* = {mnkLiteral, mnkType, mnkProc, mnkConv, mnkStdConv,
                       mnkCast, mnkAddr, mnkView, mnkToSlice} + UnaryOps +
                      BinaryOps
-  ExprKinds* =       {mnkCall, mnkCheckedCall, mnkConstr, mnkObjConstr} +
-                     LvalueExprKinds + RvalueExprKinds + ModifierNodes
+  ExprKinds* =       {mnkCall, mnkCheckedCall, mnkConstr, mnkSetConstr,
+                      mnkObjConstr} + LvalueExprKinds + RvalueExprKinds +
+                     ModifierNodes
 
   CallKinds* = {mnkCall, mnkCheckedCall}
 
diff --git a/compiler/mir/proto_mir.nim b/compiler/mir/proto_mir.nim
index 0f4721ede8c..78e212800ae 100644
--- a/compiler/mir/proto_mir.nim
+++ b/compiler/mir/proto_mir.nim
@@ -594,7 +594,7 @@ proc exprToPmir(c: TranslateCtx, result: var seq[ProtoItem], n: PNode, sink: boo
     result.add ProtoItem(orig: n, typ: n.typ, kind: k, field: val)
 
   case n.kind
-  of nkLiterals, nkRange, nkNimNodeLit:
+  of nkLiterals, nkNimNodeLit:
     node pirLiteral
   of nkLambdaKinds:
     node pirProc, sym, n[namePos].sym
diff --git a/compiler/mir/utils.nim b/compiler/mir/utils.nim
index 69a284ed439..fb2895a2a8c 100644
--- a/compiler/mir/utils.nim
+++ b/compiler/mir/utils.nim
@@ -309,6 +309,16 @@ proc exprToStr(nodes: MirTree, i: var int, result: var string, c: RenderCtx) =
       commaSeparated:
         argToStr()
       result.add ")"
+  of mnkSetConstr:
+    tree "{":
+      commaSeparated:
+        exprToStr(nodes, i, result, c)
+      result.add "}"
+  of mnkRange:
+    tree "":
+      valueToStr()
+      result.add " .. "
+      valueToStr()
   of mnkObjConstr:
     tree "(":
       commaSeparated:
diff --git a/compiler/sem/mirexec.nim b/compiler/sem/mirexec.nim
index a1b82a55203..f50cc2ae4e0 100644
--- a/compiler/sem/mirexec.nim
+++ b/compiler/sem/mirexec.nim
@@ -238,6 +238,14 @@ func emitForExpr(env: var ClosureEnv, tree: MirTree, at, source: NodePosition) =
   case tree[source].kind
   of mnkCall, mnkCheckedCall, mnkConstr, mnkObjConstr:
     emitForArgs(env, tree, at, source)
+  of mnkSetConstr:
+    for it in subNodes(tree, source):
+      case tree[it].kind
+      of mnkRange:
+        emitLvalueOp(env, opUse, tree, at, tree.operand(it, 0))
+        emitLvalueOp(env, opUse, tree, at, tree.operand(it, 1))
+      else:
+        emitLvalueOp(env, opUse, tree, at, OpValue it)
   of mnkConv, mnkStdConv, mnkCast:
     # a read is performed on the source operand (if it's an lvalue)
     emitLvalueOp(env, opUse, tree, at, tree.operand(source))
diff --git a/compiler/vm/packed_env.nim b/compiler/vm/packed_env.nim
index a4776b0eb9b..d939acedeec 100644
--- a/compiler/vm/packed_env.nim
+++ b/compiler/vm/packed_env.nim
@@ -352,20 +352,19 @@ proc storeSetData(enc: var DataEncoder, e: var PackedEnv,
   enc.put e, PackedDataNode(kind: pdkSet, pos: count.uint32 * 2)
   e.nodes.growBy(count * 2) # make space for the content
 
-  proc adjusted(enc: DataEncoder, n: PNode, typ: PType): uint32 =
+  proc adjusted(enc: DataEncoder, n: MirNode, typ: PType): uint32 =
     # make the range start at zero
-    toUInt32(getInt(n) - firstOrd(enc.config, typ))
+    toUInt32(getInt(n.lit) - firstOrd(enc.config, typ))
 
   var n = n + 1
   # bitsets only store values in the range 0..high(uint16), so the values can
   # be stored directly
   for _ in 0..<count:
-    let x = t[n+1].lit
-    if x.kind == nkRange:
-      enc.put e, PackedDataNode(kind: pdkIntLit, pos: adjusted(enc, x[0], typ))
-      enc.put e, PackedDataNode(kind: pdkIntLit, pos: adjusted(enc, x[1], typ))
+    if t[n].kind == mnkRange:
+      enc.put e, PackedDataNode(kind: pdkIntLit, pos: adjusted(enc, t[n + 1], typ))
+      enc.put e, PackedDataNode(kind: pdkIntLit, pos: adjusted(enc, t[n + 2], typ))
     else:
-      let d = PackedDataNode(kind: pdkIntLit, pos: adjusted(enc, x, typ))
+      let d = PackedDataNode(kind: pdkIntLit, pos: adjusted(enc, t[n], typ))
       enc.put e, d
       enc.put e, d
 
@@ -409,10 +408,10 @@ func storeDataNode(enc: var DataEncoder, e: var PackedEnv,
       enc.storeArrayData(e, t, n)
     of tyTuple, tyProc:
       enc.storeTupleData(e, t, n)
-    of tySet:
-      enc.storeSetData(e, t, n)
     else:
       unreachable(t[n].kind)
+  of mnkSetConstr:
+    enc.storeSetData(e, t, n)
   of mnkObjConstr:
     enc.storeFieldsData(e, t, n)
   else:
diff --git a/compiler/vm/vmserialize.nim b/compiler/vm/vmserialize.nim
index 019f312ef66..0a1116dc01e 100644
--- a/compiler/vm/vmserialize.nim
+++ b/compiler/vm/vmserialize.nim
@@ -85,16 +85,9 @@ proc initFromExpr(dest: LocHandle, tree: MirTree, n: var int,
       recurse(c.heap.unsafeDeref(slot))
       deref(dest).refVal = slot
   of akSet:
-    proc put(dest: LocHandle, lit: PNode, first: Int128) {.inline.} =
-      proc adjusted(n: PNode, first: Int128): BiggestInt =
-        # subtract the first element's value to make all values zero-based
-        toInt(getInt(n) - first)
-
-      if lit.kind == nkRange:
-        bitSetInclRange(mbitSet(dest),
-          adjusted(lit[0], first)..adjusted(lit[1], first))
-      else:
-        bitSetIncl(mbitSet(dest), adjusted(lit, first))
+    proc adjusted(n: PNode, first: Int128): BiggestInt {.inline.} =
+      # subtract the first element's value to make all values zero-based
+      toInt(getInt(n) - first)
 
     let first =
       if tree[n].len > 0: firstOrd(c.config, tree[n].typ)
@@ -102,7 +95,15 @@ proc initFromExpr(dest: LocHandle, tree: MirTree, n: var int,
     # XXX: ^^ ``set[empty]``-typed literals reach here, but they shouldn't. The
     #      len guard works around the issue
     iterTree(j):
-      arg put(dest, next().lit, first)
+      let node = next()
+      if node.kind == mnkRange:
+        let
+          a = adjusted(next().lit, first)
+          b = adjusted(next().lit, first)
+        bitSetInclRange(mbitSet(dest), a .. b)
+        inc n # skip the end node
+      else:
+        bitSetIncl(mbitSet(dest), adjusted(node.lit, first))
   of akPNode:
     deref(dest).nodeVal = next().lit[0]
   of akCallable:
diff --git a/doc/mir.rst b/doc/mir.rst
index df09c8c6b9d..601612196de 100644
--- a/doc/mir.rst
+++ b/doc/mir.rst
@@ -98,15 +98,17 @@ Semantics
                     | CheckedCall LVALUE CALL_ARG ...  EX_TARGET
                     | CheckedCall <Magic> CALL_ARG ... EX_TARGET
 
+  SET_CONSTR_ARG = VALUE
+                 | Range VALUE VALUE     # range construction
 
   RVALUE = UNARY_OP
          | BINARY_OP
          | CALL_EXPR
          | CHECKED_CALL_EXPR
-         | Constr   CONSTR_ARG ...       # construct a tuple, closure, set, or
+         | Constr   CONSTR_ARG ...       # construct a tuple, closure, or array
+         | SetConstr SET_CONSTR_ARG ...
          | ObjConstr (<Field> CONSTR_ARG) ... # construct an `object` or
                                          # `ref object`
-                                         # array
          | StdConv  VALUE                # number conversion or conversion
                                          # between cstring and string
          | Conv     VALUE                # same as `StdConv`. Only duplicate
@@ -211,6 +213,7 @@ Semantics
 
   BRANCH_LABEL = <Literal>
                | <Const>
+               | Range <Literal> <Literal>
   BRANCH_LIST = (Branch BRANCH_LABEL ... STATEMENT) ... # a list of branches
               | (Branch BRANCH_LABEL ... TARGET) ...
 
@@ -385,5 +388,9 @@ ones).
 
   ARG = Arg VALUE
 
+  SET_CONSTR_ARG = <Literal>
+                 | Range <Literal> <Literal>
+
   COMPLEX = Constr ARG...
+          | SetConstr SET_CONSTR_ARG...
           | ObjConstr (<Field> ARG)...
diff --git a/tests/stdlib/types/sets/tsets.nim b/tests/stdlib/types/sets/tsets.nim
index 71f914aaa63..8eebed66046 100644
--- a/tests/stdlib/types/sets/tsets.nim
+++ b/tests/stdlib/types/sets/tsets.nim
@@ -92,3 +92,12 @@ block:
 
   doAssert k99 notin s1
   doAssert k99 notin s2
+
+block set_construction_with_dynamic_range:
+  # constructing a set value using dynamic ranges crashed the compiler
+  var
+    a = 1'u8
+    b = 4'u8
+  let se = {a..b}
+  doAssert 3'u8 in se
+  doAssert 5'u8 notin se

From c544f9811f3701cc6c34cca42079e616a044f53b Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Thu, 4 Apr 2024 01:10:08 +0200
Subject: [PATCH 054/169] mir: store string data separately from nodes (#1266)

## Summary

Instead of storing string values via `PNode`s in `MirNode`, the
`string` data is stored in a separate table, indexed by `StringId`.
This removes a `PNode` dependency from the MIR and eliminates the
string copy at the MIR/CGIR edge.

## Details

### MIR

* the `mnkStrLit` node kind and variant are introduced. The variant
  stores a `StringId`
* the actual string data is stored in a `BiTable[string]` in `MirEnv`
* internally, `StringId` is a `LitId`, which is used for `BiTable`
  lookup
* `mnkLiteral` no longer covers string literals
* the `LiteralDataNodes` set is introduced, currently covering
  `mnkLiteral` and `mnkStrLit`
* `mirgen` translates string literals to `mnkStrLit` nodes, adding the
  string values to the environment in the process

### CGIR

* `CgNode` also uses the indirection via a `StringId` instead of
  storing the raw string directly

### Code generation

* `cgen` and `jsgen` use the `getString` routine added to both code
  generators, for querying a node's string value from the
  environment
* as an interim solution, for generating the C constant for a raw
  string value, a new `genStringLiteral` overload is added to
  `ccgliterals`
* `compat.newStrNode` is obsolete and thus removed

### VM back-end

* `vmserialize.initFromExpr` needs access to a `MirEnv` to look up the
  string data
* `vmjit` provides read-only access to a `JitState`'s `MirEnv` through
  the new public `env` accessor (the `compilerbridge` module needs it
  for the `initFromExpr` calls)
* the `MirEnv`'s string table is re-used for the created `PackedEnv`

### Other

* `DataTable` lookup becomes slightly faster, since only the ID for
  strings needs to be compared and hashed
* the `extractStringLiterals` MIR pass can search for string literals
  (`mnkStrLit`) without an extra conditional
---
 compiler/backend/backends.nim    |  7 ++++---
 compiler/backend/ccgexprs.nim    | 18 ++++++++++--------
 compiler/backend/ccgliterals.nim | 30 ++++++++++++++++++++----------
 compiler/backend/ccgstmts.nim    | 10 +++++-----
 compiler/backend/cgen.nim        |  3 +++
 compiler/backend/cgendata.nim    | 18 +++---------------
 compiler/backend/cgir.nim        |  2 +-
 compiler/backend/cgirgen.nim     | 12 ++++++------
 compiler/backend/cgirutils.nim   |  2 +-
 compiler/backend/compat.nim      |  6 +++---
 compiler/backend/jsgen.nim       | 15 +++++++++------
 compiler/mir/datatables.nim      |  6 ++++--
 compiler/mir/mirconstr.nim       |  5 +++++
 compiler/mir/mirenv.nim          | 13 +++++++++++++
 compiler/mir/mirgen.nim          | 29 ++++++++++++++++++-----------
 compiler/mir/mirpasses.nim       | 13 ++++++-------
 compiler/mir/mirtrees.nim        | 17 +++++++++++++----
 compiler/mir/utils.nim           | 10 ++++++++++
 compiler/sem/mirexec.nim         |  2 +-
 compiler/vm/compilerbridge.nim   |  4 ++--
 compiler/vm/packed_env.nim       |  4 +++-
 compiler/vm/vmbackend.nim        |  2 +-
 compiler/vm/vmjit.nim            |  6 +++++-
 compiler/vm/vmserialize.nim      | 12 +++++++-----
 24 files changed, 153 insertions(+), 93 deletions(-)

diff --git a/compiler/backend/backends.nim b/compiler/backend/backends.nim
index c0ad7ff81a2..a61fba16fee 100644
--- a/compiler/backend/backends.nim
+++ b/compiler/backend/backends.nim
@@ -467,7 +467,8 @@ proc genLibSetup(graph: ModuleGraph, env: var MirEnv, conf: BackendConfig,
       bu.add MirNode(kind: mnkStmtList) # manual, for less visual nesting
       for candidate in candidates.items:
         var tmp = genLoadLib(bu, graph, env, val):
-          literal(newStrNode(candidate, graph.getSysType(path.info, tyString)))
+          literal(env.getOrIncl(candidate),
+                  graph.getSysType(path.info, tyString))
 
         tmp = bu.wrapTemp(graph.getSysType(path.info, tyBool)):
           bu.buildMagicCall mNot, graph.getSysType(path.info, tyBool):
@@ -480,7 +481,7 @@ proc genLibSetup(graph: ModuleGraph, env: var MirEnv, conf: BackendConfig,
       # if none of the candidates worked, a run-time error is reported:
       bu.subTree mnkVoid:
         bu.buildCall env.procedures.add(errorProc), errorProc.typ, voidTyp:
-          bu.emitByVal literal(path)
+          bu.emitByVal literal(env.getOrIncl(path.strVal), path.typ)
       bu.add endNode(mnkStmtList)
   else:
     # the name of the dynamic library to load the procedure from is only known
@@ -559,7 +560,7 @@ proc produceLoader(graph: ModuleGraph, m: Module, data: var DiscoveryData,
     let tmp = bu.wrapTemp(loadProc.typ[0]):
       bu.buildCall env.procedures.add(loadProc), loadProc.typ, loadProc.typ[0]:
         bu.emitByVal toValue(libVar, lib.name.typ)
-        bu.emitByVal literal(extname)
+        bu.emitByVal literal(env.getOrIncl(extname.strVal), extname.typ)
 
     bu.subTree mnkVoid:
       bu.buildMagicCall mAsgnDynlibVar, voidTyp:
diff --git a/compiler/backend/ccgexprs.nim b/compiler/backend/ccgexprs.nim
index 5a70078b869..69d1d66f913 100644
--- a/compiler/backend/ccgexprs.nim
+++ b/compiler/backend/ccgexprs.nim
@@ -79,7 +79,7 @@ proc genLiteral(p: BProc, n: CgNode, ty: PType): Rope =
       # save tons of allocations:
       result = genStringLiteral(p.module, n)
     else:
-      result = makeCString(n.strVal)
+      result = makeCString(getString(p, n))
   of cnkFloatLit:
     if ty.kind == tyFloat32:
       result = rope(n.floatVal.float32.toStrMaxPrecision)
@@ -586,8 +586,10 @@ proc genFieldCheck(p: BProc, e: CgNode) =
       # by encoding the file names separately from `file(line:col)`, essentially
       # passing around `TLineInfo` + the set of files in the project.
       msg.add toFileLineCol(p.config, e.info) & " "
-    msg.add e[4].strVal
-    let strLit = genStringLiteral(p.module, newStrNode(msg))
+    msg.add getString(p, e[4])
+    # don't commit the string to the string table, as it's likely to be
+    # unique and never used again
+    let strLit = genStringLiteral(p.module, msg)
 
     ## discriminant check
     template fun(code) = linefmt(p, cpsStmts, code, [rdLoc(test)])
@@ -813,7 +815,7 @@ proc genStrConcat(p: BProc, e: CgNode, d: var TLoc) =
       appends.add(ropecg(p.module, "#appendChar($1, $2);$n", [strLoc(p, tmp), rdLoc(a)]))
     else:
       if e[i + 1].kind == cnkStrLit:
-        inc(L, e[i + 1].strVal.len)
+        inc(L, getString(p, e[i + 1]).len)
       else:
         lens.add(lenExpr(p, a))
         lens.add(" + ")
@@ -852,7 +854,7 @@ proc genStrAppend(p: BProc, e: CgNode, d: var TLoc) =
                         [strLoc(p, dest), rdLoc(a)]))
     else:
       if e[i + 2].kind == cnkStrLit:
-        inc(L, e[i + 2].strVal.len)
+        inc(L, getString(p, e[i + 2]).len)
       else:
         lens.add(lenExpr(p, a))
         lens.add(" + ")
@@ -1547,11 +1549,11 @@ proc genStrEquals(p: BProc, e: CgNode, d: var TLoc) =
   var x: TLoc
   var a = e[1]
   var b = e[2]
-  if a.kind == cnkStrLit and a.strVal == "":
+  if a.kind == cnkStrLit and getString(p, a) == "":
     initLocExpr(p, e[2], x)
     putIntoDest(p, d, e,
       ropecg(p.module, "($1 == 0)", [lenExpr(p, x)]))
-  elif b.kind == cnkStrLit and b.strVal == "":
+  elif b.kind == cnkStrLit and getString(p, b) == "":
     initLocExpr(p, e[1], x)
     putIntoDest(p, d, e,
       ropecg(p.module, "($1 == 0)", [lenExpr(p, x)]))
@@ -2379,7 +2381,7 @@ proc genBracedInit(p: BProc, n: CgNode; optionalType: PType): Rope =
       result = genConstObjConstr(p, n)
     of tyString, tyCstring:
       if n.kind != cnkNilLit and ty == tyString:
-        result = genStringLiteralV2Const(p.module, n, true)
+        result = genStringLiteralV2Const(p.module, n.strVal, true)
       else:
         var d: TLoc
         initLocExpr(p, n, d)
diff --git a/compiler/backend/ccgliterals.nim b/compiler/backend/ccgliterals.nim
index 0d74f6019ca..016e372e672 100644
--- a/compiler/backend/ccgliterals.nim
+++ b/compiler/backend/ccgliterals.nim
@@ -24,35 +24,45 @@ proc genStringLiteralDataOnlyV2(m: BModule, s: string; result: Rope; isConst: bo
        [result, rope(s.len), makeCString(s),
        rope(if isConst: "const" else: "")])
 
-proc genStringLiteralV2(m: BModule; n: CgNode; isConst: bool): Rope =
-  let id = getOrPut(m.strCache, n, m.labels)
+proc genStringLiteralV2(m: BModule; str: StringId; isConst: bool): Rope =
+  let id = m.strCache.mgetOrPut(str, m.labels)
+  let len = m.g.env[str].len
   if id == m.labels:
     let pureLit = getTempName(m)
-    genStringLiteralDataOnlyV2(m, n.strVal, pureLit, isConst)
+    genStringLiteralDataOnlyV2(m, m.g.env[str], pureLit, isConst)
     result = getTempName(m)
     discard cgsym(m, "NimStrPayload")
     discard cgsym(m, "NimStringV2")
     # string literal not found in the cache:
     m.s[cfsData].addf("static $4 NimStringV2 $1 = {$2, (NimStrPayload*)&$3};$n",
-          [result, rope(n.strVal.len), pureLit, rope(if isConst: "const" else: "")])
+          [result, rope(len), pureLit, rope(if isConst: "const" else: "")])
   else:
     result = getTempName(m)
     m.s[cfsData].addf("static $4 NimStringV2 $1 = {$2, (NimStrPayload*)&$3};$n",
-          [result, rope(n.strVal.len), m.tmpBase & rope(id),
+          [result, rope(len), m.tmpBase & rope(id),
           rope(if isConst: "const" else: "")])
 
-proc genStringLiteralV2Const(m: BModule; n: CgNode; isConst: bool): Rope =
-  let id = getOrPut(m.strCache, n, m.labels)
+proc genStringLiteralV2Const(m: BModule; str: StringId; isConst: bool): Rope =
+  let id = m.strCache.mgetOrPut(str, m.labels)
   var pureLit: Rope
   if id == m.labels:
     pureLit = getTempName(m)
     discard cgsym(m, "NimStrPayload")
     discard cgsym(m, "NimStringV2")
     # string literal not found in the cache:
-    genStringLiteralDataOnlyV2(m, n.strVal, pureLit, isConst)
+    genStringLiteralDataOnlyV2(m, m.g.env[str], pureLit, isConst)
   else:
     pureLit = m.tmpBase & rope(id)
-  result = "{$1, (NimStrPayload*)&$2}" % [rope(n.strVal.len), pureLit]
+  result = "{$1, (NimStrPayload*)&$2}" % [rope(m.g.env[str].len), pureLit]
+
+proc genStringLiteral(m: BModule, str: string): Rope =
+  ## Spawns and emits a new global C constant storing a NimString with content
+  ## `str` -- no caching is performed.
+  let content = getTempName(m)
+  genStringLiteralDataOnlyV2(m, str, content, true)
+  result = getTempName(m)
+  m.s[cfsData].addf("static const NimStringV2 $1 = {$2, (NimStrPayload*)&$3};$n",
+                    [result, rope(str.len), content])
 
 # ------ Version selector ---------------------------------------------------
 
@@ -60,4 +70,4 @@ proc genNilStringLiteral(m: BModule; info: TLineInfo): Rope =
   result = ropecg(m, "((#NimStringDesc*) NIM_NIL)", [])
 
 proc genStringLiteral(m: BModule; n: CgNode): Rope =
-  result = genStringLiteralV2(m, n, isConst = true)
\ No newline at end of file
+  result = genStringLiteralV2(m, n.strVal, isConst = true)
\ No newline at end of file
diff --git a/compiler/backend/ccgstmts.nim b/compiler/backend/ccgstmts.nim
index feb064bd623..bf7220ecd3e 100644
--- a/compiler/backend/ccgstmts.nim
+++ b/compiler/backend/ccgstmts.nim
@@ -226,7 +226,7 @@ proc genCaseStringBranch(p: BProc, b: CgNode, e: TLoc, labl: BlockId,
     assert(b[i].kind != cnkRange)
     initLocExpr(p, b[i], x)
     assert(b[i].kind == cnkStrLit)
-    var j = int(hashString(p.config, b[i].strVal) and high(branches))
+    var j = int(hashString(p.config, getString(p, b[i])) and high(branches))
     appcg(p.module, branches[j], "if (#eqStrings($1, $2)) goto $3;$n",
          [rdLoc(e), rdLoc(x), labl])
 
@@ -397,7 +397,7 @@ proc genAsmOrEmitStmt(p: BProc, t: CgNode, isAsmStmt=false): Rope =
   for it in t.items:
     case it.kind
     of cnkStrLit:
-      res.add(it.strVal)
+      res.add(getString(p, it))
     of cnkField:
         let sym = it.field
         # special support for raw field symbols
@@ -448,10 +448,10 @@ proc genAsmStmt(p: BProc, t: CgNode) =
   else:
     p.s(cpsStmts).add indentLine(p, runtimeFormat(CC[p.config.cCompiler].asmStmtFrmt, [s]))
 
-proc determineSection(n: CgNode): TCFileSection =
+proc determineSection(env: MirEnv, n: CgNode): TCFileSection =
   result = cfsProcHeaders
   if n.len >= 1 and n[0].kind == cnkStrLit:
-    let sec = n[0].strVal
+    let sec = env[n[0].strVal]
     if sec.startsWith("/*TYPESECTION*/"): result = cfsTypes
     elif sec.startsWith("/*VARSECTION*/"): result = cfsVars
     elif sec.startsWith("/*INCLUDESECTION*/"): result = cfsHeaders
@@ -460,7 +460,7 @@ proc genEmit(p: BProc, t: CgNode) =
   var s = genAsmOrEmitStmt(p, t)
   if sfTopLevel in p.prc.flags:
     # top level emit pragma?
-    let section = determineSection(t)
+    let section = determineSection(p.env, t)
     genCLineDir(p.module.s[section], t.info, p.config)
     p.module.s[section].add(s)
   else:
diff --git a/compiler/backend/cgen.nim b/compiler/backend/cgen.nim
index 0dbcd114bc3..5281810949e 100644
--- a/compiler/backend/cgen.nim
+++ b/compiler/backend/cgen.nim
@@ -101,6 +101,9 @@ const
     ## the procedure contains top-level code, which currently affects how
     ## emit, asm, and error handling works
 
+template getString(p: BProc, n: CgNode): string =
+  p.env[n.strVal]
+
 proc findPendingModule(m: BModule, s: PSym): BModule =
   let ms = s.itemId.module  #getModule(s)
   result = m.g.modules[ms]
diff --git a/compiler/backend/cgendata.nim b/compiler/backend/cgendata.nim
index 4ebb9262597..7fd0b6ace29 100644
--- a/compiler/backend/cgendata.nim
+++ b/compiler/backend/cgendata.nim
@@ -11,7 +11,6 @@
 
 import
   std/[
-    hashes,
     intsets,
     tables,
     sets
@@ -96,8 +95,6 @@ type
                               ## code
     params*: seq[TLoc]        ## the locs of the parameters
 
-  StrNode* = distinct CgNode
-
   TLabel* = Rope              ## for the C generator a label is just a rope
   TCFileSection* = enum       ## the sections a generated C file consists of
     cfsMergeInfo,             ## section containing merge information
@@ -249,9 +246,9 @@ type
     defaultCache*: Table[SigHash, int]
       ## maps a type hash to the name of a C constant storing the type's
       ## default value
-    strCache*: Table[StrNode, int]
-      ## associates a string node with the label of a C constant generated for
-      ## it
+    strCache*: Table[StringId, int]
+      ## associates a string with the label of the C constant generated
+      ## for it
       ## TODO: strings should be turned into data-only constants (``DataId``)
       ##       during the MIR phase
     dataNames*: Table[DataId, int]
@@ -350,15 +347,6 @@ iterator items*[T](m: SymbolMap[T]): lent T =
   for it in m.store.items:
     yield it
 
-proc `==`(a, b: StrNode): bool =
-  a.CgNode.strVal == b.CgNode.strVal
-
-proc hash(x: StrNode): Hash =
-  hash(x.CgNode.strVal)
-
-proc getOrPut*(t: var Table[StrNode, int], n: CgNode, label: int): int =
-  mgetOrPut(t, StrNode(n), label)
-
 func isFilled*(x: TLoc): bool {.inline.} =
   x.k != locNone
 
diff --git a/compiler/backend/cgir.nim b/compiler/backend/cgir.nim
index 23bfa39e1e0..e2f52b5cf0a 100644
--- a/compiler/backend/cgir.nim
+++ b/compiler/backend/cgir.nim
@@ -179,7 +179,7 @@ type
       # future direction: use a ``BiggestUint`` for uint values
       intVal*: BiggestInt
     of cnkFloatLit:   floatVal*: BiggestFloat
-    of cnkStrLit:     strVal*: string
+    of cnkStrLit:     strVal*: StringId
     of cnkAstLit:     astLit*: PNode
     of cnkField:      field*: PSym
     of cnkProc:       prc*: ProcedureId
diff --git a/compiler/backend/cgirgen.nim b/compiler/backend/cgirgen.nim
index 0f4e4be7597..3b5ce3b8e4c 100644
--- a/compiler/backend/cgirgen.nim
+++ b/compiler/backend/cgirgen.nim
@@ -215,8 +215,6 @@ proc translateLit*(val: PNode): CgNode =
       node(cnkFloatLit, floatVal, val.floatVal.float32.float64)
     else:
       unreachable()
-  of nkStrKinds:
-    node(cnkStrLit, strVal, val.strVal)
   of nkNilLit:
     newNode(cnkNilLit, val.info, val.typ)
   of nkNimNodeLit:
@@ -312,6 +310,8 @@ proc atomToIr(n: MirNode, cl: TranslateCl, info: TLineInfo): CgNode =
     newOp(cnkDerefView, info, typ.base, newLocalRef(id, info, typ))
   of mnkLiteral:
     translateLit(n.lit)
+  of mnkStrLit:
+    CgNode(kind: cnkStrLit, info: info, typ: n.typ, strVal: n.strVal)
   of mnkType:
     newTypeNode(info, n.typ)
   of mnkNone:
@@ -369,7 +369,7 @@ proc lvalueToIr(tree: MirBody, cl: var TranslateCl, n: MirNode,
     # XXX: this needs to be removed once there is a dedicated run-time-
     #      sequence access operator
     let arg =
-      if tree[cr].kind == mnkLiteral:
+      if tree[cr].kind in LiteralDataNodes:
         atomToIr(tree, cl, cr)
       else:
         recurse()
@@ -395,7 +395,7 @@ proc valueToIr(tree: MirBody, cl: var TranslateCl,
                cr: var TreeCursor): CgNode =
   case tree[cr].kind
   of mnkProc, mnkConst, mnkGlobal, mnkParam, mnkLocal, mnkTemp, mnkAlias,
-     mnkLiteral, mnkType:
+     mnkType, LiteralDataNodes:
     atomToIr(tree, cl, cr)
   of mnkPathPos, mnkPathNamed, mnkPathArray, mnkPathConv, mnkPathVariant,
      mnkDeref, mnkDerefView:
@@ -417,7 +417,7 @@ proc argToIr(tree: MirBody, cl: var TranslateCl,
     # it is one, the expression must be an lvalue
     result = (true, lvalueToIr(tree, cl, cr))
     leave(tree, cr)
-  of mnkLiteral, mnkType, mnkProc, mnkNone:
+  of LiteralDataNodes, mnkType, mnkProc, mnkNone:
     # not a tag but an atom
     result = (false, atomToIr(n, cl, cr.info))
   of LvalueExprKinds:
@@ -915,7 +915,7 @@ proc setElementToIr(tree: MirBody, cl: var TranslateCl,
   ## Translates a sub-tree appearing as a branch label or in a set
   ## construction to the CGIR.
   case tree[cr].kind
-  of LvalueExprKinds, mnkLiteral:
+  of LvalueExprKinds, LiteralDataNodes:
     result = valueToIr(tree, cl, cr)
   of mnkRange:
     discard enter(tree, cr)
diff --git a/compiler/backend/cgirutils.nim b/compiler/backend/cgirutils.nim
index f5e0813ffea..12cca001f6a 100644
--- a/compiler/backend/cgirutils.nim
+++ b/compiler/backend/cgirutils.nim
@@ -34,7 +34,7 @@ proc treeRepr*(n: CgNode): string =
       result.add $n.floatVal
     of cnkStrLit:
       result.add "strVal: \""
-      result.add n.strVal
+      result.addInt n.strVal.uint32
       result.add "\""
     of cnkField:
       result.add "field: "
diff --git a/compiler/backend/compat.nim b/compiler/backend/compat.nim
index 5d261776d69..d669b70ef0d 100644
--- a/compiler/backend/compat.nim
+++ b/compiler/backend/compat.nim
@@ -137,9 +137,6 @@ proc newSymNode*(env: MirEnv, s: PSym): CgNode {.inline.} =
   else:
     unreachable(s.kind)
 
-proc newStrNode*(str: sink string): CgNode {.inline.} =
-  CgNode(kind: cnkStrLit, info: unknownLineInfo, strVal: str)
-
 proc translate*(t: MirTree): CgNode =
   ## Compatibility routine for translating a MIR constant-expression (`t`) to
   ## a ``CgNode`` tree. Obsolete once the code generators use the MIR
@@ -190,6 +187,9 @@ proc translate*(t: MirTree): CgNode =
       x
     of mnkLiteral:
       translateLit(n.lit)
+    of mnkStrLit:
+      CgNode(kind: cnkStrLit, info: unknownLineInfo, typ: n.typ,
+             strVal: n.strVal)
     of mnkField:
       CgNode(kind: cnkField, info: unknownLineInfo, field: n.field)
     of mnkProc:
diff --git a/compiler/backend/jsgen.nim b/compiler/backend/jsgen.nim
index cf91e59e97f..2fbe90dd04a 100644
--- a/compiler/backend/jsgen.nim
+++ b/compiler/backend/jsgen.nim
@@ -234,6 +234,9 @@ func analyseIfAddressTaken(n: CgNode, addrTaken: var PackedSet[LocalId]) =
 template config*(p: PProc): ConfigRef = p.module.config
 template env*(p: PProc): untyped = p.g.env
 
+template getString(p: PProc, n: CgNode): string =
+  p.g.env[n.strVal]
+
 proc indentLine(p: PProc, r: Rope): Rope =
   for i in 0..<p.extraIndent:
     result.add "  "
@@ -873,7 +876,7 @@ proc genCaseJS(p: PProc, desc: StructDesc, stmts: openArray[CgNode], n: CgNode)
           if stringSwitch:
             case e.kind
             of cnkStrLit: lineF(p, "case $1:$n",
-                [makeJSString(e.strVal, false)])
+                [makeJSString(getString(p, e), false)])
             else: internalError(p.config, e.info, "jsgen.genCaseStmt: 2")
           else:
             gen(p, e, cond)
@@ -902,7 +905,7 @@ proc genAsmOrEmitStmt(p: PProc, n: CgNode) =
     let it = n[i]
     case it.kind
     of cnkStrLit:
-      p.body.add(it.strVal)
+      p.body.add(getString(p, it))
     of cnkProc, cnkConst, cnkGlobal, cnkLocal:
       # for backwards compatibility we don't deref syms here :-(
       if false:
@@ -1081,7 +1084,7 @@ proc genFieldCheck(p: PProc, e: CgNode) =
   useMagic(p, "reprDiscriminant") # no need to offset by firstOrd unlike for cgen
   lineF(p, "if ($1[$2]$3undefined) { raiseFieldError2(makeNimstrLit($4), reprDiscriminant($2, $5)); }$n",
     setx.res, val.rdLoc, if invert: ~"!==" else: ~"===",
-    makeJSString(e[4].strVal), genTypeInfo(p, e[2].typ))
+    makeJSString(getString(p, e[4])), genTypeInfo(p, e[2].typ))
 
 proc genArrayAddr(p: PProc, n: CgNode, r: var TCompRes) =
   var
@@ -2527,13 +2530,13 @@ proc gen(p: PProc, n: CgNode, r: var TCompRes) =
       r.kind = resExpr
   of cnkStrLit:
     if skipTypes(n.typ, abstractVarRange).kind == tyString:
-      if n.strVal.len != 0:
+      if getString(p, n).len != 0:
         useMagic(p, "makeNimstrLit")
-        r.res = "makeNimstrLit($1)" % [makeJSString(n.strVal)]
+        r.res = "makeNimstrLit($1)" % [makeJSString(getString(p, n))]
       else:
         r.res = rope"[]"
     else:
-      r.res = makeJSString(n.strVal, false)
+      r.res = makeJSString(getString(p, n), false)
     r.kind = resExpr
   of cnkFloatLit:
     let f = n.floatVal
diff --git a/compiler/mir/datatables.nim b/compiler/mir/datatables.nim
index 2650f896a86..6ba0c8816af 100644
--- a/compiler/mir/datatables.nim
+++ b/compiler/mir/datatables.nim
@@ -41,8 +41,6 @@ func hashTree(tree: ConstrTree): Hash =
           # make sure to hash the bit representation, so that NaNs are
           # accounted for
           hash(cast[BiggestInt](n.floatVal))
-        of nkStrKinds:
-          hash(n.strVal)
         of nkIntKinds:
           hash(n.intVal)
         of nkNilLit:
@@ -51,6 +49,8 @@ func hashTree(tree: ConstrTree): Hash =
           unreachable(n.kind)
 
       result = result !& hashLit(n.lit)
+    of mnkStrLit:
+      result = result !& hash(n.strVal)
     of mnkProc:
       result = result !& hash(n.prc.ord)
     of mnkConstr, mnkSetConstr, mnkRange, mnkObjConstr:
@@ -98,6 +98,8 @@ proc cmp(a, b: ConstrTree): bool =
     case a.kind
     of mnkLiteral:
       cmp(a.lit, b.lit)
+    of mnkStrLit:
+      a.strVal == b.strVal
     of mnkProc:
       a.prc == b.prc
     of mnkConstr, mnkSetConstr, mnkRange, mnkObjConstr:
diff --git a/compiler/mir/mirconstr.nim b/compiler/mir/mirconstr.nim
index 06d7d1f105d..17db7ff3cd2 100644
--- a/compiler/mir/mirconstr.nim
+++ b/compiler/mir/mirconstr.nim
@@ -2,6 +2,7 @@
 
 import
   compiler/ast/[
+    ast_query,
     ast_types
   ],
   compiler/mir/[
@@ -75,8 +76,12 @@ func typeLit*(t: PType): Value =
   Value(node: MirNode(kind: mnkType, typ: t))
 
 func literal*(n: PNode): Value =
+  assert n.kind notin nkStrKinds
   Value(node: MirNode(kind: mnkLiteral, typ: n.typ, lit: n))
 
+func literal*(str: StringId, typ: PType): Value =
+  Value(node: MirNode(kind: mnkStrLit, typ: typ, strVal: str))
+
 func temp*(typ: PType, id: LocalId): Value =
   Value(node: MirNode(kind: mnkTemp, typ: typ, local: id))
 
diff --git a/compiler/mir/mirenv.nim b/compiler/mir/mirenv.nim
index e125203b47c..67b3b966049 100644
--- a/compiler/mir/mirenv.nim
+++ b/compiler/mir/mirenv.nim
@@ -14,6 +14,9 @@ import
     datatables,
     mirtrees
   ],
+  compiler/ic/[
+    bitabs
+  ],
   compiler/utils/[
     containers
   ]
@@ -40,6 +43,9 @@ type
       ## includes both normal globals and threadvars
     procedures*: SymbolTable[ProcedureId, PSym]
 
+    strings*: BiTable[string]
+      ## all string data referenced by the MIR
+
     bodies*: OrdinalSeq[ConstId, DataId]
       ## associates each user-defined constant with its content
       ## ## TODO: this needs to be merged into `constants`
@@ -103,6 +109,13 @@ func `[]`*(env: MirEnv, id: ProcedureId): lent PSym {.inline.} =
 func `[]`*(env: MirEnv, id: DataId): lent ConstrTree {.inline.} =
   env.data[id]
 
+func `[]`*(env: MirEnv, id: StringId): lent string {.inline.} =
+  env.strings[LitId id]
+
+func getOrIncl*(env: var MirEnv, str: string): StringId {.inline.} =
+  ## If not registered already, adds `str` to the environment.
+  StringId env.strings.getOrIncl(str)
+
 func setData*(env: var MirEnv, id: ConstId, data: DataId) =
   ## Sets the body for the constant identified by `id`.
   synchronize(env.bodies, env.constants.data)
diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index 1fc6f8d5679..92ea86de011 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -319,6 +319,9 @@ proc empty(c: var TCtx, n: PNode): MirNode =
 func intLiteral(val: Int128, typ: PType): Value =
   literal(newIntTypeNode(val, typ))
 
+func strLiteral(env: var MirEnv, str: string, typ: PType): Value =
+  literal(env.getOrIncl(str), typ)
+
 func nameNode(c: var TCtx, s: PSym): MirNode =
   case s.kind
   of skTemp:
@@ -547,8 +550,8 @@ proc genFieldCheck(c: var TCtx, access: Value, call: PNode, inverted: bool,
       # inverted flag:
       c.emitByVal literal(newIntTypeNode(ord(inverted), call.typ))
       # error message operand:
-      c.emitByVal literal(newStrNode(genFieldDefect(conf, field, discr),
-                                     c.graph.getSysType(call.info, tyString)))
+      c.emitByVal strLiteral(c.env, genFieldDefect(conf, field, discr),
+                             c.graph.getSysType(call.info, tyString))
 
 proc genCheckedVariantAccess(c: var TCtx, variant: Value, name: PIdent,
                              check: PNode): PSym =
@@ -1167,8 +1170,8 @@ proc genRaise(c: var TCtx, n: PNode) =
           # lvalue conversion to the base ``Exception`` type:
           c.buildTree mnkPathConv, cp.typ[1]:
             c.use tmp
-        c.emitByVal literal(newStrNode(typ.sym.name.s,
-                                       c.graph.getSysType(n.info, tyCstring)))
+        c.emitByVal strLiteral(c.env, typ.sym.name.s,
+                               c.graph.getSysType(n.info, tyCstring))
 
     # emit the raise statement:
     c.buildStmt mnkRaise:
@@ -1553,14 +1556,12 @@ proc genCase(c: var TCtx, n: PNode, dest: Destination) =
     of nkOfBranch:
       # emit the lables:
       for (_, label) in branchLabels(branch):
-        template add(n: PNode) =
-          c.add MirNode(kind: mnkLiteral, lit: n, typ: n.typ)
         if label.kind == nkRange:
           c.subTree mnkRange:
-            add(label[0])
-            add(label[1])
+            genx(c, label[0])
+            genx(c, label[1])
         else:
-          add(label)
+          genx(c, label)
     else:
       unreachable(branch.kind)
 
@@ -1682,7 +1683,11 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
   of pirProc:
     c.use toValue(c.env.procedures.add(n.sym), n.sym.typ)
   of pirLiteral:
-    c.use literal(n.orig)
+    case n.orig.kind
+    of nkStrLiterals:
+      c.use strLiteral(c.env, n.orig.strVal, n.typ)
+    else:
+      c.use literal(n.orig)
   of pirLocal, pirGlobal, pirParam, pirConst:
     c.add nameNode(c, n.sym)
   of pirDeref:
@@ -2238,8 +2243,10 @@ proc constDataToMir*(env: var MirEnv, n: PNode): MirTree =
       bu.subTree MirNode(kind: mnkRange, len: 2):
         constToMirAux(bu, env, n[0])
         constToMirAux(bu, env, n[1])
-    of nkLiterals:
+    of nkIntLiterals, nkFloatLiterals, nkNilLit:
       bu.use literal(n)
+    of nkStrLiterals:
+      bu.use strLiteral(env, n.strVal, n.typ)
     of nkHiddenStdConv, nkHiddenSubConv:
       # doesn't translate to a MIR node itself, but the type overrides
       # that of the sub-expression
diff --git a/compiler/mir/mirpasses.nim b/compiler/mir/mirpasses.nim
index 8b285c00e4b..4cd6c0d0194 100644
--- a/compiler/mir/mirpasses.nim
+++ b/compiler/mir/mirpasses.nim
@@ -358,14 +358,13 @@ proc extractStringLiterals(tree: MirTree, env: var MirEnv,
   ## Extracts all string literals and promotes them to anonymous constants,
   ## replacing the string literals with a usage of the constants they were
   ## promoted to.
-  for i in search(tree, {mnkLiteral}):
+  for i in search(tree, {mnkStrLit}):
     # note: both normal string *and* cstring literals are currently included
-    if tree[i].lit.kind in nkStrLiterals:
-      # create an anonymous constant from the literal:
-      let c = toConstId env.data.getOrPut(@[tree[i]])
-      # replace the usage of the literal with the anonymous constant:
-      changes.replaceMulti(tree, i, bu):
-        bu.use toValue(c, tree[i].typ)
+    # create an anonymous constant from the literal:
+    let c = toConstId env.data.getOrPut(@[tree[i]])
+    # replace the usage of the literal with the anonymous constant:
+    changes.replaceMulti(tree, i, bu):
+      bu.use toValue(c, tree[i].typ)
 
 proc injectResultInit(tree: MirTree, resultTyp: PType, changes: var Changeset) =
   ## Injects a default-initialization for the result variable, if deemed
diff --git a/compiler/mir/mirtrees.nim b/compiler/mir/mirtrees.nim
index e148c0bd5b3..4a686dce6f8 100644
--- a/compiler/mir/mirtrees.nim
+++ b/compiler/mir/mirtrees.nim
@@ -26,6 +26,9 @@ type
     ## Identifies a procedure
   LiteralId {.used.} = distinct uint32
     ## Identifies a literal
+  StringId* = distinct uint32
+    ## Uniquely identifies a string value. Two strings sharing the same
+    ## content map to the same ID
   DataId* = distinct uint32
     ## Identifies a complete constant expression
 
@@ -66,6 +69,7 @@ type
     mnkLiteral ## literal data. Currently represented via a ``PNode``
     # future direction: split into IntLit, FloatLit, and StrLit and store the
     # values in a separate table (so that MirNode gets smaller)
+    mnkStrLit  ## reference to a literal string
     mnkType    ## a type literal
 
     # future direction:
@@ -278,6 +282,8 @@ type
       field*: PSym
     of mnkLiteral:
       lit*: PNode
+    of mnkStrLit:
+      strVal*: StringId
     of mnkPathPos:
       position*: uint32 ## the 0-based position of the field
     of mnkCall, mnkCheckedCall:
@@ -338,8 +344,10 @@ const
     ## Assignment modifiers. Nodes that can only appear directly in the source
     ## slot of assignments.
 
+  LiteralDataNodes* = {mnkLiteral, mnkStrLit}
+
   ConstrTreeNodes* = {mnkConstr, mnkSetConstr, mnkRange, mnkObjConstr,
-                      mnkLiteral, mnkProc, mnkArg, mnkField, mnkEnd}
+                      mnkProc, mnkArg, mnkField, mnkEnd} + LiteralDataNodes
     ## Nodes that can appear in the MIR subset used for constant expressions.
 
   # --- semantics-focused sets:
@@ -360,9 +368,9 @@ const
   LvalueExprKinds* = {mnkPathPos, mnkPathNamed, mnkPathArray, mnkPathVariant,
                       mnkPathConv, mnkDeref, mnkDerefView, mnkTemp, mnkAlias,
                       mnkLocal, mnkParam, mnkConst, mnkGlobal}
-  RvalueExprKinds* = {mnkLiteral, mnkType, mnkProc, mnkConv, mnkStdConv,
-                      mnkCast, mnkAddr, mnkView, mnkToSlice} + UnaryOps +
-                     BinaryOps
+  RvalueExprKinds* = {mnkType, mnkProc, mnkConv, mnkStdConv, mnkCast, mnkAddr,
+                      mnkView, mnkToSlice} + UnaryOps + BinaryOps +
+                     LiteralDataNodes
   ExprKinds* =       {mnkCall, mnkCheckedCall, mnkConstr, mnkSetConstr,
                       mnkObjConstr} + LvalueExprKinds + RvalueExprKinds +
                      ModifierNodes
@@ -376,6 +384,7 @@ func `==`*(a, b: ConstId): bool {.borrow.}
 func `==`*(a, b: GlobalId): bool {.borrow.}
 func `==`*(a, b: ProcedureId): bool {.borrow.}
 func `==`*(a, b: DataId): bool {.borrow.}
+func `==`*(a, b: StringId): bool {.borrow.}
 
 func isAnon*(id: ConstId): bool =
   ## Returns whether `id` represents an anonymous constant.
diff --git a/compiler/mir/utils.nim b/compiler/mir/utils.nim
index fb2895a2a8c..6c9750a368f 100644
--- a/compiler/mir/utils.nim
+++ b/compiler/mir/utils.nim
@@ -42,6 +42,9 @@ func `$`(n: MirNode): string =
     result.add " lit: "
     {.cast(noSideEffect).}:
       result.add renderTree(n.lit)
+  of mnkStrLit:
+    result.add " strVal: "
+    result.addInt n.strVal.uint32
   of mnkPathPos:
     result.add " position: "
     result.add $n.position
@@ -178,6 +181,13 @@ proc singleToStr(n: MirNode, result: var string, c: RenderCtx) =
     result.add "<none>"
   of mnkLiteral:
     result.add $n.lit
+  of mnkStrLit:
+    if c.env.isNil:
+      result.add "<Str: "
+      result.addInt n.strVal.uint32
+      result.add ">"
+    else:
+      result.addQuoted c.env[][n.strVal]
   of mnkType:
     result.add "type("
     result.add $n.typ
diff --git a/compiler/sem/mirexec.nim b/compiler/sem/mirexec.nim
index f50cc2ae4e0..25b77c249e3 100644
--- a/compiler/sem/mirexec.nim
+++ b/compiler/sem/mirexec.nim
@@ -290,7 +290,7 @@ func emitForExpr(env: var ClosureEnv, tree: MirTree, at, source: NodePosition) =
   of LvalueExprKinds:
     # raw usage of an lvalue
     emitLvalueOp(env, opUse, tree, at, OpValue source)
-  of mnkNone, mnkLiteral, mnkProc:
+  of mnkNone, LiteralDataNodes, mnkProc:
     discard "okay, ignore"
   of AllNodeKinds - ExprKinds - {mnkNone} + {mnkType}:
     unreachable(tree[source].kind)
diff --git a/compiler/vm/compilerbridge.nim b/compiler/vm/compilerbridge.nim
index 27ee3988b7a..ccfa37e0c82 100644
--- a/compiler/vm/compilerbridge.nim
+++ b/compiler/vm/compilerbridge.nim
@@ -139,7 +139,7 @@ proc putIntoReg(dest: var TFullReg; jit: var JitState, c: var TCtx, n: PNode,
     dest.nimNode = data[0].lit
   else:
     dest.initLocReg(typ, c.memory)
-    initFromExpr(dest.handle, data, c)
+    initFromExpr(dest.handle, data, jit.env, c)
 
 proc unpackResult(res: sink ExecutionResult; config: ConfigRef, node: PNode): PNode =
   ## Unpacks the execution result. If the result represents a failure, returns
@@ -680,7 +680,7 @@ proc setGlobalValue*(c: var EvalContext; s: PSym, val: PNode) =
     slot = c.vm.heap.slots[slotIdx]
     data = constDataToMir(c.vm, c.jit, val)
 
-  initFromExpr(slot.handle, data, c.vm)
+  initFromExpr(slot.handle, data, c.jit.env, c.vm)
 
 ## what follows is an implementation of the ``passes`` interface that evaluates
 ## the code directly inside the VM. It is used for NimScript execution and by
diff --git a/compiler/vm/packed_env.nim b/compiler/vm/packed_env.nim
index d939acedeec..7d6e33a9d52 100644
--- a/compiler/vm/packed_env.nim
+++ b/compiler/vm/packed_env.nim
@@ -378,7 +378,6 @@ func storeLiteral(enc: var DataEncoder, e: var PackedEnv, n: PNode) =
     of EmbeddedInts:  (pdkIntLit, cast[uint32](n.intVal))
     of ExternalInts:  (pdkInt,    e.getLitId(n.intVal).uint32)
     of nkFloatKinds:  (pdkFloat,  e.getLitId(n.floatVal).uint32)
-    of nkStrKinds:    (pdkString, e.getLitId(n.strVal).uint32)
     of nkNilLit:
       if n.typ.skipTypes(abstractInst).callConv == ccClosure:
         # XXX: some unexpanded `nil` closure literals reach here, so we have
@@ -399,6 +398,9 @@ func storeDataNode(enc: var DataEncoder, e: var PackedEnv,
   case t[n].kind
   of mnkLiteral:
     storeLiteral(enc, e, t[n].lit)
+  of mnkStrLit:
+    # the ID indexes into the string BiTable, it can be packed directly
+    enc.put e, PackedDataNode(kind: pdkString, pos: t[n].strVal.uint32)
   of mnkProc:
     # the ID is stable, it can be packed directly
     enc.put e, PackedDataNode(kind: pdkIntLit, pos: t[n].prc.uint32)
diff --git a/compiler/vm/vmbackend.nim b/compiler/vm/vmbackend.nim
index 4084bce8c8a..8351982f907 100644
--- a/compiler/vm/vmbackend.nim
+++ b/compiler/vm/vmbackend.nim
@@ -308,7 +308,7 @@ proc generateCode*(g: ModuleGraph, mlist: sink ModuleList) =
   # pack the data and write it to the ouput file:
   var
     enc: PackedEncoder
-    penv: PackedEnv
+    penv = PackedEnv(strings: move c.gen.env.strings)
 
   enc.init(env.types)
   storeEnv(enc, penv, env)
diff --git a/compiler/vm/vmjit.nim b/compiler/vm/vmjit.nim
index e195db205c2..5878ea57d67 100644
--- a/compiler/vm/vmjit.nim
+++ b/compiler/vm/vmjit.nim
@@ -70,6 +70,10 @@ type
     gen: CodeGenCtx
       ## code generator state
 
+func env*(jit: JitState): lent MirEnv {.inline.} =
+  ## The JIT code generator's MIR environment.
+  jit.gen.env
+
 func selectOptions(c: TCtx): TranslationConfig =
   result = TranslationConfig(options: {goIsNimvm}, magicsToKeep: MagicsToKeep)
   # include additional options based on the JIT's configuration
@@ -125,7 +129,7 @@ proc updateEnvironment(c: var TCtx, env: var MirEnv, cp: EnvCheckpoint) =
       typ = c.getOrCreate(data[0].typ)
       handle = c.allocator.allocConstantLocation(typ)
 
-    initFromExpr(handle, data, c)
+    initFromExpr(handle, data, env, c)
 
     c.complexConsts.add handle
 
diff --git a/compiler/vm/vmserialize.nim b/compiler/vm/vmserialize.nim
index 0a1116dc01e..f803bd48777 100644
--- a/compiler/vm/vmserialize.nim
+++ b/compiler/vm/vmserialize.nim
@@ -11,6 +11,7 @@ import
     options
   ],
   compiler/mir/[
+    mirenv,
     mirtrees
   ],
   compiler/vm/[
@@ -27,12 +28,12 @@ import
     int128
   ]
 
-proc initFromExpr(dest: LocHandle, tree: MirTree, n: var int,
+proc initFromExpr(dest: LocHandle, tree: MirTree, n: var int, env: MirEnv,
                   c: var TCtx) =
   ## Loads the value represented by `tree` at `n` into `dest`. On exit, `n`
   ## points to the next sub-tree.
   template recurse(dest: LocHandle) =
-    initFromExpr(dest, tree, n, c)
+    initFromExpr(dest, tree, n, env, c)
 
   template next(): lent MirNode =
     let i = n
@@ -62,7 +63,7 @@ proc initFromExpr(dest: LocHandle, tree: MirTree, n: var int,
     else:
       writeFloat64(dest, float64(next().lit.floatVal))
   of akString:
-    deref(dest).strVal.newVmString(next().lit.strVal, c.allocator)
+    deref(dest).strVal.newVmString(env[next().strVal], c.allocator)
   of akSeq:
     # allocate the sequence first:
     newVmSeq(deref(dest).seqVal, dest.typ, tree[n].len, c.memory)
@@ -144,9 +145,10 @@ proc initFromExpr(dest: LocHandle, tree: MirTree, n: var int,
     iterTree(i):
       arg recurse(slice[i])
 
-proc initFromExpr*(dest: LocHandle, tree: MirTree, c: var TCtx) {.inline.} =
+proc initFromExpr*(dest: LocHandle, tree: MirTree, env: MirEnv,
+                   c: var TCtx) {.inline.} =
   ## Intializes the memory location `dest` with the value represented by the
   ## MIR contant expression `tree`. The location is expected to be in its
   ## zero'ed state.
   var i = 0
-  initFromExpr(dest, tree, i, c)
+  initFromExpr(dest, tree, i, env, c)

From ae543125c222693c915e3cfaa3cc3edb0110c569 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Thu, 4 Apr 2024 05:08:40 +0200
Subject: [PATCH 055/169] js: support variant destructors (#1267)

## Summary

Fix destructors not being properly executed for fields within case
objects when changing the active branch while using the JS backend.

## Details

The destructor produced by `produceDestructorForDiscriminator` took a
reference to the *discriminant field* and used pointer arithmetic to
compute the address of the enclosing object. Not only is this
unnecessarily complex, it also doesn't work with the JS backend.

Instead, the destructor now takes a mutable reference to the
discriminant field's enclosing object type -- the MIR emitted for the
call is adjusted accordingly.

Since the destructor definitely modifies the object, `ekMutate` is used
instead of `ekInvalidate` for the parameter passing. This results in a
small move analyzer regression:
```nim
var x = Object()
var y = x.fieldOutsideOfVariant # not automatically moved anymore
x.kind = ... # potential branch switch that requires destruction
```

Finally, a test is added for ensuring proper destruction when changing
the active branch.
---
 compiler/sem/injectdestructors.nim            | 11 +++--
 compiler/sem/liftdestructors.nim              | 40 +++----------------
 .../destructor/tcaseobj_transition_2.nim      | 39 ++++++++++++++++++
 3 files changed, 52 insertions(+), 38 deletions(-)
 create mode 100644 tests/lang_objects/destructor/tcaseobj_transition_2.nim

diff --git a/compiler/sem/injectdestructors.nim b/compiler/sem/injectdestructors.nim
index 41e2b30792c..5320861c77e 100644
--- a/compiler/sem/injectdestructors.nim
+++ b/compiler/sem/injectdestructors.nim
@@ -813,14 +813,19 @@ proc lowerBranchSwitch(bu: var MirBuilder, body: MirTree, graph: ModuleGraph,
       bu.buildMagicCall mNot, boolTyp:
          bu.emitByVal val
 
+    var src = body.child(NodePosition target, 0)
+    # skip all ``mnkPathVariant`` nodes:
+    while body[src].kind == mnkPathVariant:
+      src = body.child(src, 0)
+
     bu.subTree mnkIf:
       bu.use val
       # ``=destroy`` call:
       bu.buildVoidCall(env, branchDestructor):
-        # pass the original variant access to the destroy call
+        # pass the object access expression to the destroy call
         bu.subTree mnkName:
-          bu.subTree MirNode(kind: mnkTag, effect: ekInvalidate):
-            bu.emitFrom(body, NodePosition target)
+          bu.subTree MirNode(kind: mnkTag, effect: ekMutate):
+            bu.emitFrom(body, src)
 
   else:
     # the object doesn't need destruction, which means that neither does one
diff --git a/compiler/sem/liftdestructors.nim b/compiler/sem/liftdestructors.nim
index 5712b14c2b9..289412b5d6d 100644
--- a/compiler/sem/liftdestructors.nim
+++ b/compiler/sem/liftdestructors.nim
@@ -125,29 +125,6 @@ proc genWhileLoop(c: var TLiftCtx; i, dest: PNode): PNode =
 proc genIf(c: var TLiftCtx; cond, action: PNode): PNode =
   result = newTree(nkIfStmt, newTree(nkElifBranch, cond, action))
 
-proc genContainerOf(c: var TLiftCtx; objType: PType, field, x: PSym): PNode =
-  # generate: cast[ptr ObjType](cast[int](addr(x)) - offsetOf(objType.field))
-  let intType = getSysType(c.g, unknownLineInfo, tyInt)
-
-  let addrOf = newTreeIT(nkAddr, c.info, makePtrType(x.owner, x.typ, c.idgen)):
-    newDeref(newSymNode(x))
-  let castExpr1 = newTreeIT(nkCast, c.info, intType):
-    [newNodeIT(nkType, c.info, intType), addrOf]
-
-  let dotExpr = newTreeIT(nkDotExpr, c.info, x.typ):
-    [newNodeIT(nkType, c.info, objType), newSymNode(field)]
-
-  let offsetOf = genBuiltin(c, mOffsetOf, "offsetof", dotExpr)
-  offsetOf.typ = intType
-
-  let minusExpr = genBuiltin(c, mSubI, "-", castExpr1)
-  minusExpr.typ = intType
-  minusExpr.add foldOffsetOf(c.g.config, offsetOf, offsetOf)
-
-  let objPtr = makePtrType(objType.owner, objType, c.idgen)
-  result = newTreeIT(nkCast, c.info, objPtr):
-    [newNodeIT(nkType, c.info, objPtr), minusExpr]
-
 proc destructorCall(c: var TLiftCtx; op: PSym; x: PNode): PNode =
   var destroy = newTreeIT(nkCall, x.info, op.typ[0]):
     [newSymNode(op), genAddr(c, x)]
@@ -948,23 +925,16 @@ proc produceSym(g: ModuleGraph; c: PContext; typ: PType; kind: TTypeAttachedOp;
 proc produceDestructorForDiscriminator*(g: ModuleGraph; typ: PType; field: PSym,
                                         info: TLineInfo; idgen: IdGenerator): PSym =
   assert(typ.skipTypes({tyAlias, tyGenericInst}).kind == tyObject)
-  result = symPrototype(g, field.typ, typ.owner, attachedDestructor, info, idgen)
+  result = symPrototype(g, typ, typ.owner, attachedDestructor, info, idgen)
   var a = TLiftCtx(info: info, g: g, kind: attachedDestructor, asgnForType: typ, idgen: idgen,
                    fn: result)
   a.asgnForType = typ
   a.filterDiscriminator = field
   a.addMemReset = true
-  let discrimantDest = result.typ.n[1].sym
-
-  let dst = newSym(skVar, getIdent(g.cache, "dest"), nextSymId(idgen), result, info)
-  dst.typ = makePtrType(typ.owner, typ, idgen)
-  let dstSym = newSymNode(dst)
-  let d = newDeref(dstSym)
-  let v = newTreeI(nkVarSection, info):
-    newIdentDefs(dstSym, genContainerOf(a, typ, field, discrimantDest))
-  result.ast[bodyPos].add v
-  let placeHolder = newNodeIT(nkSym, info, getSysType(g, info, tyPointer))
-  fillBody(a, typ, result.ast[bodyPos], d, placeHolder)
+  let
+    d = newDeref(newSymNode(result.typ.n[1].sym))
+    placeholder = newNodeIT(nkSym, info, getSysType(g, info, tyPointer))
+  fillBody(a, typ, result.ast[bodyPos], d, placeholder)
   incl result.flags, sfNeverRaises
 
 
diff --git a/tests/lang_objects/destructor/tcaseobj_transition_2.nim b/tests/lang_objects/destructor/tcaseobj_transition_2.nim
new file mode 100644
index 00000000000..ceae2a9f357
--- /dev/null
+++ b/tests/lang_objects/destructor/tcaseobj_transition_2.nim
@@ -0,0 +1,39 @@
+discard """
+  description: '''
+    Ensure that the destructor of a field within a case obj is triggered when
+    changing the active case object branch
+  '''
+  targets: "c js vm"
+  knownIssue.vm: '''
+    Lowering branch switch statements is disabled for the VM backend
+  '''
+"""
+
+type
+  Object = object
+    name: int
+
+var steps: seq[int]
+
+proc `=destroy`(x: var Object) =
+  steps.add x.name
+
+type
+  WithVariant = object
+    outer: Object
+      ## field not within the case object; unaffected by branch changing
+    case kind: bool
+    of false:
+      a: Object
+    of true:
+      b: Object
+
+proc test() =
+  var o = WithVariant(outer: Object(name: 1), kind: false, a: Object(name: 2))
+  o.kind = true # change branch; `a` is destroyed
+  doAssert o.b.name == 0 # uninitialized
+  o.b.name = 3
+  # on destruction, both `b` and `outer` must be destroyed
+
+test()
+doAssert steps == [2, 1, 3], $steps
\ No newline at end of file

From dad0f6b977a8de58d91b6ab4c8d67efc8ba778dd Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Fri, 5 Apr 2024 19:14:38 +0200
Subject: [PATCH 056/169] mir: split up `mnkConstr` (#1269)

## Summary

The `mnkConstr` node kind is removed and replaced with dedicated node
kinds for each construction (`array`, `seq`, `tuple`, and closure).
This is a step towards replacing type queries with syntax-only queries
as much as possible.

## Details

* `mnkConstr` is split into `mnkArrayConstr`, `mnkSeqConstr`,
  `mnkTupleConstr`, and `mnkClosureConstr`
* the proto-MIR covers `seq` construction now (`pirSeqConstr`)
* `mirgen` translates `pirSeqConstr` to `mnkSeqConstr`
* which node kind replaces an `mnkConstr` usage depends on the context
* the pretty-printer uses a textual representation for the new node
  kinds that matches their high-level one (e.g.:
  `mnkArrayConstr` is rendered as `[...]`)
* the `topt_no_cursor.nim` test is updated to account for the pretty-
  printer changes

It's now possible to search for, e.g., `seq` constructions
(`mnkSeqConstr`) without having to perform type queries on MIR nodes.
---
 compiler/backend/cgirgen.nim   | 24 +++++++++---------------
 compiler/backend/compat.nim    | 21 ++++++++-------------
 compiler/mir/datatables.nim    |  6 ++++--
 compiler/mir/mirgen.nim        | 23 +++++++++++++++++++----
 compiler/mir/mirpasses.nim     |  3 ++-
 compiler/mir/mirtrees.nim      | 13 ++++++++-----
 compiler/mir/proto_mir.nim     | 17 +++++++++++------
 compiler/mir/utils.nim         | 19 +++++++++++++++++--
 compiler/sem/mirexec.nim       |  3 ++-
 compiler/vm/packed_env.nim     | 12 ++++--------
 compiler/vm/vmserialize.nim    |  2 +-
 doc/mir.rst                    | 12 +++++++++---
 tests/arc/topt_no_cursor.nim   | 14 +++++++-------
 tests/compiler/tdatatables.nim |  8 ++++----
 14 files changed, 105 insertions(+), 72 deletions(-)

diff --git a/compiler/backend/cgirgen.nim b/compiler/backend/cgirgen.nim
index 3b5ce3b8e4c..b5a16a2ea78 100644
--- a/compiler/backend/cgirgen.nim
+++ b/compiler/backend/cgirgen.nim
@@ -1009,26 +1009,20 @@ proc exprToIr(tree: MirBody, cl: var TranslateCl,
   of mnkSetConstr:
     treeOp cnkSetConstr:
       res.add setElementToIr(tree, cl, cr)
+  of mnkArrayConstr, mnkSeqConstr:
+    treeOp cnkArrayConstr:
+      res.add argToIr(tree, cl, cr)[1]
+  of mnkTupleConstr:
+    treeOp cnkTupleConstr:
+      res.add argToIr(tree, cl, cr)[1]
+  of mnkClosureConstr:
+    treeOp cnkClosureConstr:
+      res.add argToIr(tree, cl, cr)[1]
   of mnkObjConstr:
     assert n.typ.skipTypes(abstractVarRange).kind in {tyObject, tyRef}
     treeOp cnkObjConstr:
       let f = newFieldNode(get(tree, cr).field)
       res.add newTree(cnkBinding, cr.info, [f, argToIr(tree, cl, cr)[1]])
-  of mnkConstr:
-    let typ = n.typ.skipTypes(abstractVarRange)
-
-    let kind =
-      case typ.kind
-      of tyArray, tySequence: cnkArrayConstr
-      of tyTuple:             cnkTupleConstr
-      of tyProc:
-        assert typ.callConv == ccClosure
-        cnkClosureConstr
-      else:
-        unreachable(typ.kind)
-
-    treeOp kind:
-      res.add argToIr(tree, cl, cr)[1]
   of mnkCall:
     callToIr(tree, cl, n, cr)
   of mnkCheckedCall:
diff --git a/compiler/backend/compat.nim b/compiler/backend/compat.nim
index d669b70ef0d..bc40143ec3d 100644
--- a/compiler/backend/compat.nim
+++ b/compiler/backend/compat.nim
@@ -161,19 +161,14 @@ proc translate*(t: MirTree): CgNode =
         let field = translateAux(t, i)
         CgNode(kind: cnkBinding, info: unknownLineInfo,
                kids: @[field, translateAux(t, i)])
-    of mnkConstr:
-      let kind =
-        case n.typ.skipTypes(abstractVarRange).kind
-        of tyArray, tySequence, tyOpenArray:
-          cnkArrayConstr
-        of tyTuple:
-          cnkTupleConstr
-        of tyProc:
-          cnkClosureConstr
-        else:
-          unreachable()
-
-      tree kind:
+    of mnkArrayConstr, mnkSeqConstr:
+      tree cnkArrayConstr:
+        translateAux(t, i)
+    of mnkTupleConstr:
+      tree cnkTupleConstr:
+        translateAux(t, i)
+    of mnkClosureConstr:
+      tree cnkClosureConstr:
         translateAux(t, i)
     of mnkSetConstr:
       tree cnkSetConstr:
diff --git a/compiler/mir/datatables.nim b/compiler/mir/datatables.nim
index 6ba0c8816af..2e3e2bfcd3a 100644
--- a/compiler/mir/datatables.nim
+++ b/compiler/mir/datatables.nim
@@ -53,7 +53,8 @@ func hashTree(tree: ConstrTree): Hash =
       result = result !& hash(n.strVal)
     of mnkProc:
       result = result !& hash(n.prc.ord)
-    of mnkConstr, mnkSetConstr, mnkRange, mnkObjConstr:
+    of mnkSetConstr, mnkRange, mnkArrayConstr, mnkSeqConstr, mnkTupleConstr,
+       mnkClosureConstr, mnkObjConstr:
       result = result !& hash(n.len)
     of mnkField:
       result = result !& hash(n.field.id)
@@ -102,7 +103,8 @@ proc cmp(a, b: ConstrTree): bool =
       a.strVal == b.strVal
     of mnkProc:
       a.prc == b.prc
-    of mnkConstr, mnkSetConstr, mnkRange, mnkObjConstr:
+    of mnkSetConstr, mnkRange, mnkArrayConstr, mnkSeqConstr, mnkTupleConstr,
+       mnkClosureConstr, mnkObjConstr:
       a.len == b.len
     of mnkField:
       a.field.id == b.field.id
diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index 92ea86de011..30bd4c6ef2b 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -1105,18 +1105,23 @@ proc genSetConstr(c: var TCtx, n: PNode) =
         c.genArgExpression(it, sink=false)
 
 proc genArrayConstr(c: var TCtx, n: PNode, isConsume: bool) =
-  c.buildTree mnkConstr, n.typ:
+  c.buildTree mnkArrayConstr, n.typ:
     for it in n.items:
       c.emitOperandTree it, isConsume
 
+proc genSeqConstr(c: var TCtx, n: PNode) =
+  c.buildTree mnkSeqConstr, n.typ:
+    for it in n.items:
+      c.emitOperandTree it, true
+
 proc genTupleConstr(c: var TCtx, n: PNode, isConsume: bool) =
   assert n.typ.skipTypes(abstractVarRange-{tyTypeDesc}).kind == tyTuple
-  c.buildTree mnkConstr, n.typ:
+  c.buildTree mnkTupleConstr, n.typ:
     for it in n.items:
       c.emitOperandTree skipColon(it), isConsume
 
 proc genClosureConstr(c: var TCtx, n: PNode, isConsume: bool) =
-  c.buildTree mnkConstr, n.typ:
+  c.buildTree mnkClosureConstr, n.typ:
     c.emitOperandTree n[0].skipConv, false # the procedural value
     # transf wraps the procedure operand in a conversion that we don't
     # need
@@ -1813,6 +1818,8 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
       c.emitOperandTree n.orig[0], false
   of pirArrayConstr:
     genArrayConstr(c, n.orig, n.owning)
+  of pirSeqConstr:
+    genSeqConstr(c, n.orig)
   of pirSetConstr:
     genSetConstr(c, n.orig)
   of pirRefConstr:
@@ -2225,7 +2232,15 @@ proc constDataToMir*(env: var MirEnv, n: PNode): MirTree =
         for it in n.items:
           constToMirAux(bu, env, it)
     of nkBracket, nkTupleConstr, nkClosure:
-      bu.subTree MirNode(kind: mnkConstr, typ: n.typ, len: n.len):
+      let kind: range[mnkArrayConstr..mnkClosureConstr] =
+        case n.typ.skipTypes(abstractInst).kind
+        of tyArray:                 mnkArrayConstr
+        of tyOpenArray, tySequence: mnkSeqConstr
+        of tyTuple:                 mnkTupleConstr
+        of tyProc:                  mnkClosureConstr
+        else:                       unreachable()
+
+      bu.subTree MirNode(kind: kind, typ: n.typ, len: n.len):
         for it in n.items:
           bu.subTree mnkArg:
             constToMirAux(bu, env, it.skipColon)
diff --git a/compiler/mir/mirpasses.nim b/compiler/mir/mirpasses.nim
index 4cd6c0d0194..05ec8772114 100644
--- a/compiler/mir/mirpasses.nim
+++ b/compiler/mir/mirpasses.nim
@@ -323,7 +323,8 @@ proc eliminateTemporaries(tree: MirTree, changes: var Changeset) =
         elide = true
       of RvalueExprKinds, mnkSetConstr:
         elide = true
-      of mnkConstr, mnkObjConstr:
+      of mnkArrayConstr, mnkSeqConstr, mnkTupleConstr, mnkClosureConstr,
+         mnkObjConstr:
         # if the lvalue doesn't overlap with the assignment destination, the
         # temporary can be elided
         let stmt = tree.parent(expr)
diff --git a/compiler/mir/mirtrees.nim b/compiler/mir/mirtrees.nim
index 4a686dce6f8..f600ce5ab68 100644
--- a/compiler/mir/mirtrees.nim
+++ b/compiler/mir/mirtrees.nim
@@ -172,12 +172,13 @@ type
               ## tree. Describes what kind of mutation is applied to the
               ## lvalue within the called procedure
 
-    mnkConstr     ## constructs a either new aggregate value or set value made
-                  ## up of the input values. Whether the resulting value is
-                  ## owned depends on whether one the context it's used in
     mnkSetConstr  ## constructor for set values
     mnkRange      ## range constructor. May only appear in set constructions
                   ## and as a branch label
+    mnkArrayConstr## constructor for array values
+    mnkSeqConstr  ## constructor for seq values
+    mnkTupleConstr## constructor for tuple values
+    mnkClosureConstr## constructor for closure values
     mnkObjConstr  ## either allocate a new managed heap cell and returns a
                   ## ``ref`` to it, or or constructs a new aggregate value
                   ## with named fields
@@ -346,7 +347,8 @@ const
 
   LiteralDataNodes* = {mnkLiteral, mnkStrLit}
 
-  ConstrTreeNodes* = {mnkConstr, mnkSetConstr, mnkRange, mnkObjConstr,
+  ConstrTreeNodes* = {mnkSetConstr, mnkRange, mnkArrayConstr, mnkSeqConstr,
+                      mnkTupleConstr, mnkClosureConstr, mnkObjConstr,
                       mnkProc, mnkArg, mnkField, mnkEnd} + LiteralDataNodes
     ## Nodes that can appear in the MIR subset used for constant expressions.
 
@@ -371,7 +373,8 @@ const
   RvalueExprKinds* = {mnkType, mnkProc, mnkConv, mnkStdConv, mnkCast, mnkAddr,
                       mnkView, mnkToSlice} + UnaryOps + BinaryOps +
                      LiteralDataNodes
-  ExprKinds* =       {mnkCall, mnkCheckedCall, mnkConstr, mnkSetConstr,
+  ExprKinds* =       {mnkCall, mnkCheckedCall, mnkSetConstr, mnkArrayConstr,
+                      mnkSeqConstr, mnkTupleConstr, mnkClosureConstr,
                       mnkObjConstr} + LvalueExprKinds + RvalueExprKinds +
                      ModifierNodes
 
diff --git a/compiler/mir/proto_mir.nim b/compiler/mir/proto_mir.nim
index 78e212800ae..8586d296461 100644
--- a/compiler/mir/proto_mir.nim
+++ b/compiler/mir/proto_mir.nim
@@ -85,6 +85,7 @@ type
     pirRefConstr
     pirTupleConstr
     pirArrayConstr
+    pirSeqConstr
 
     pirConstExpr ## an expression that needs to be turned into an anonymous
                  ## constant
@@ -204,7 +205,7 @@ func classify*(e: seq[ProtoItem], i: int): ExprKind =
       OwnedRvalue
     else:
       Rvalue
-  of pirRefConstr:
+  of pirRefConstr, pirSeqConstr:
     OwnedRvalue
   of pirCast:
     Rvalue
@@ -255,7 +256,7 @@ func isPure(e: seq[ProtoItem], n: int): bool =
   of pirDeref, pirViewDeref:
     # the pointer destination could change (unless it's an immutable view)
     false
-  of pirSetConstr, pirObjConstr, pirTupleConstr, pirArrayConstr,
+  of pirSetConstr, pirObjConstr, pirTupleConstr, pirArrayConstr, pirSeqConstr,
      pirClosureConstr, pirRefConstr, pirStringToCString, pirCStringToString,
      pirToSubSlice, pirChckRange, pirCall, pirComplex:
     # not analyzable
@@ -457,7 +458,7 @@ func handleConstExpr(result: var seq[ProtoItem], n: PNode, kind: ProtoItemKind,
   if lift and n.len > ord(n.kind == nkObjConstr) and
      isDeepConstExpr(n):
     result.add ProtoItem(orig: n, typ: n.typ, kind: pirConstExpr)
-  elif kind == pirSetConstr:
+  elif kind in {pirSetConstr, pirSeqConstr}:
     result.add ProtoItem(orig: n, typ: n.typ, kind: kind)
   else:
     result.add ProtoItem(orig: n, typ: n.typ, kind: kind)
@@ -770,9 +771,13 @@ proc exprToPmir(c: TranslateCtx, result: var seq[ProtoItem], n: PNode, sink: boo
   of nkBracket:
     # if the construction is of seq type, then it's a constant seq value,
     # which we prefer to lift into a constant (again), even in sink contexts
-    let lift =
-      n.typ.skipTypes(IrrelevantTypes).kind == tySequence or not(sink)
-    handleConstExpr(result, n, pirArrayConstr, sink, lift)
+    let kind =
+      if n.typ.skipTypes(IrrelevantTypes).kind == tySequence:
+        pirSeqConstr
+      else:
+        pirArrayConstr
+    handleConstExpr(result, n, kind, sink,
+                    lift = (kind == pirSeqConstr) or not(sink))
   of nkCurly:
     # always attempt to turn set constructions into constants, regardless of
     # whether they're used in a sink context
diff --git a/compiler/mir/utils.nim b/compiler/mir/utils.nim
index 6c9750a368f..fd252b96fe5 100644
--- a/compiler/mir/utils.nim
+++ b/compiler/mir/utils.nim
@@ -314,8 +314,23 @@ proc exprToStr(nodes: MirTree, i: var int, result: var string, c: RenderCtx) =
   of mnkStdConv:
     tree "stdConv ":
       valueToStr()
-  of mnkConstr:
-    tree "construct (":
+  of mnkArrayConstr:
+    tree "[":
+      commaSeparated:
+        argToStr()
+      result.add "]"
+  of mnkSeqConstr:
+    tree "@[":
+      commaSeparated:
+        argToStr()
+      result.add "]"
+  of mnkTupleConstr:
+    tree "(":
+      commaSeparated:
+        argToStr()
+      result.add ")"
+  of mnkClosureConstr:
+    tree "closure (":
       commaSeparated:
         argToStr()
       result.add ")"
diff --git a/compiler/sem/mirexec.nim b/compiler/sem/mirexec.nim
index 25b77c249e3..07695603289 100644
--- a/compiler/sem/mirexec.nim
+++ b/compiler/sem/mirexec.nim
@@ -236,7 +236,8 @@ func emitForExpr(env: var ClosureEnv, tree: MirTree, at, source: NodePosition) =
     env.dfaOp(o, tree, at, v)
 
   case tree[source].kind
-  of mnkCall, mnkCheckedCall, mnkConstr, mnkObjConstr:
+  of mnkCall, mnkCheckedCall, mnkArrayConstr, mnkSeqConstr, mnkTupleConstr,
+     mnkClosureConstr, mnkObjConstr:
     emitForArgs(env, tree, at, source)
   of mnkSetConstr:
     for it in subNodes(tree, source):
diff --git a/compiler/vm/packed_env.nim b/compiler/vm/packed_env.nim
index 7d6e33a9d52..c3778c04ec6 100644
--- a/compiler/vm/packed_env.nim
+++ b/compiler/vm/packed_env.nim
@@ -404,14 +404,10 @@ func storeDataNode(enc: var DataEncoder, e: var PackedEnv,
   of mnkProc:
     # the ID is stable, it can be packed directly
     enc.put e, PackedDataNode(kind: pdkIntLit, pos: t[n].prc.uint32)
-  of mnkConstr:
-    case t[n].typ.skipTypes(abstractInst).kind
-    of tySequence, tyArray, tyOpenArray:
-      enc.storeArrayData(e, t, n)
-    of tyTuple, tyProc:
-      enc.storeTupleData(e, t, n)
-    else:
-      unreachable(t[n].kind)
+  of mnkArrayConstr, mnkSeqConstr:
+    enc.storeArrayData(e, t, n)
+  of mnkTupleConstr, mnkClosureConstr:
+    enc.storeTupleData(e, t, n)
   of mnkSetConstr:
     enc.storeSetData(e, t, n)
   of mnkObjConstr:
diff --git a/compiler/vm/vmserialize.nim b/compiler/vm/vmserialize.nim
index f803bd48777..6887d8853ff 100644
--- a/compiler/vm/vmserialize.nim
+++ b/compiler/vm/vmserialize.nim
@@ -117,7 +117,7 @@ proc initFromExpr(dest: LocHandle, tree: MirTree, n: var int, env: MirEnv,
       assert tree[n].lit.kind == nkNilLit
       # only skip the node, don't initialize anything
       discard next()
-    of mnkConstr:
+    of mnkTupleConstr, mnkClosureConstr:
       iterTree(j):
         arg recurse(dest.getFieldHandle(j.FieldPosition))
     of mnkObjConstr:
diff --git a/doc/mir.rst b/doc/mir.rst
index 601612196de..a7f171dea9a 100644
--- a/doc/mir.rst
+++ b/doc/mir.rst
@@ -105,8 +105,11 @@ Semantics
          | BINARY_OP
          | CALL_EXPR
          | CHECKED_CALL_EXPR
-         | Constr   CONSTR_ARG ...       # construct a tuple, closure, or array
          | SetConstr SET_CONSTR_ARG ...
+         | ArrayConstr CONSTR_ARG...
+         | SeqConstr CONSTR_ARG...
+         | TupleConstr CONSTR_ARG...
+         | ClosureConstr CONSTR_ARG...
          | ObjConstr (<Field> CONSTR_ARG) ... # construct an `object` or
                                          # `ref object`
          | StdConv  VALUE                # number conversion or conversion
@@ -391,6 +394,9 @@ ones).
   SET_CONSTR_ARG = <Literal>
                  | Range <Literal> <Literal>
 
-  COMPLEX = Constr ARG...
-          | SetConstr SET_CONSTR_ARG...
+  COMPLEX = SetConstr SET_CONSTR_ARG...
+          | ArrayConstr ARG...
+          | SeqConstr ARG...
+          | TupleConstr ARG...
+          | ClosureConstr ARG...
           | ObjConstr (<Field> ARG)...
diff --git a/tests/arc/topt_no_cursor.nim b/tests/arc/topt_no_cursor.nim
index d08a667d7c4..3bc9582764c 100644
--- a/tests/arc/topt_no_cursor.nim
+++ b/tests/arc/topt_no_cursor.nim
@@ -23,7 +23,7 @@ scope:
   bind_mut _9: string = splat.2
   def _5: string = move _9
   wasMoved(name _9)
-  def _6: Target = construct (consume _3, consume _4, consume _5)
+  def _6: Target = (consume _3, consume _4, consume _5)
   result := move _6
   =destroy(name splat)
 -- end of expandArc ------------------------
@@ -48,12 +48,12 @@ scope:
 --expandArc: p1
 
 scope:
-  def _2: array[0..0, int] = construct (consume 123)
+  def _2: array[0..0, int] = [consume 123]
   def lresult: seq[int] = arrToSeq(consume _2)
   def lvalue: seq[int]
   def lnext: string
   def _6: seq[int] = move lresult
-  def _: (seq[int], string) = construct (consume _6, consume ";")
+  def _: (seq[int], string) = (consume _6, consume ";")
   bind_mut _8: seq[int] = _.0
   lvalue := move _8
   wasMoved(name _8)
@@ -75,7 +75,7 @@ scope:
     =copy(name _4, arg it.0)
     def _5: seq[int]
     =copy(name _5, arg it.1)
-    def a: (seq[int], seq[int]) = construct (consume _4, consume _5)
+    def a: (seq[int], seq[int]) = (consume _4, consume _5)
     def_cursor _6: (seq[int], seq[int]) = a
     def _7: string = $(arg _6) (raises)
     echo(arg type(array[0..0, string]), arg _7) (raises)
@@ -202,7 +202,7 @@ scope:
           scope:
             def _7: string
             =copy(name _7, arg this[].value)
-            _4 := construct (consume _7, consume "")
+            _4 := (consume _7, consume "")
             break L0
       scope:
         try:
@@ -214,7 +214,7 @@ scope:
           bind_mut _19: string = _11.1
           def _12: string = move _19
           wasMoved(name _19)
-          _4 := construct (consume _9, consume _12)
+          _4 := (consume _9, consume _12)
           wasMoved(name _9)
         finally:
           =destroy(name _11)
@@ -232,7 +232,7 @@ scope:
             =sink(name this[].matchDirs, arg _17)
             break L1
       scope:
-        def _18: seq[string] = construct ()
+        def _18: seq[string] = @[]
         =sink(name this[].matchDirs, arg _18)
   finally:
     =destroy(name par)
diff --git a/tests/compiler/tdatatables.nim b/tests/compiler/tdatatables.nim
index 9485607bdb8..ef81b9b66c9 100644
--- a/tests/compiler/tdatatables.nim
+++ b/tests/compiler/tdatatables.nim
@@ -40,12 +40,12 @@ block tree_equality:
     @[node(mnkLiteral, t1, lit, newFloatNode(nkFloatLit, -0.0))],
 
     # --- ordered aggregates
-    @[node(mnkConstr, t1, len, 0), node(mnkEnd)],
-    @[node(mnkConstr, t2, len, 0), node(mnkEnd)],
-    @[node(mnkConstr, t1, len, 1),
+    @[node(mnkTupleConstr, t1, len, 0), node(mnkEnd)],
+    @[node(mnkTupleConstr, t2, len, 0), node(mnkEnd)],
+    @[node(mnkTupleConstr, t1, len, 1),
         node(mnkArg), literal(newIntNode(nkIntLit, 0)),
       node(mnkEnd)],
-    @[node(mnkConstr, t1, len, 2),
+    @[node(mnkTupleConstr, t1, len, 2),
         node(mnkArg), literal(newIntNode(nkIntLit, 0)), node(mnkEnd),
         node(mnkArg), literal(newIntNode(nkIntLit, 0)), node(mnkEnd),
       node(mnkEnd)],

From a0874a46207a9f48e224570d5687aeb36a964e03 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sat, 6 Apr 2024 01:46:56 +0200
Subject: [PATCH 057/169] mir: reference fields by their position (#1268)

## Summary

Rather than storing a field's `PSym` in `MirNode`, the field's
position is now stored. This is progress towards:
* making `MirNode` a plain data-type
* decoupling the MIR from `sem`'s data types

## Details

* `mnkField` stores the field position as an `int32`, intended to allow
  for negative field positions in the future
* a field position uniquely identifies a field within a record
  hierarchy, allowing for unambiguous symbol lookup
* the new `types.lookupInType` overload accepting an `int` parameter is
  used for looking up a field's symbol
* `types.lookupInType` uses `astalgo.lookupInRecord` internally, which
  is based on `vmcompilerserdes.findField`
* `findField` is removed and its usage replaced by `lookupInRecord`
* to ease the transition, the CGIR still references fields via their
  `PSym` directly
* the `tdatatables` test is adjusted to the `MirNode` change
---
 compiler/ast/astalgo.nim           | 26 ++++++++++++++++++++++++++
 compiler/ast/types.nim             | 13 +++++++++++++
 compiler/backend/cgirgen.nim       | 12 ++++++++----
 compiler/backend/compat.nim        | 10 +++++-----
 compiler/mir/datatables.nim        |  4 ++--
 compiler/mir/mirgen.nim            | 17 ++++++++++-------
 compiler/mir/mirtrees.nim          |  3 ++-
 compiler/mir/utils.nim             | 10 +++++++---
 compiler/sem/injectdestructors.nim |  5 +++--
 compiler/vm/packed_env.nim         |  6 ++++--
 compiler/vm/vmcompilerserdes.nim   | 30 +++---------------------------
 compiler/vm/vmserialize.nim        |  2 +-
 tests/compiler/tdatatables.nim     | 14 ++++++--------
 13 files changed, 90 insertions(+), 62 deletions(-)

diff --git a/compiler/ast/astalgo.nim b/compiler/ast/astalgo.nim
index 7c28ef0f070..4d50c463972 100644
--- a/compiler/ast/astalgo.nim
+++ b/compiler/ast/astalgo.nim
@@ -17,6 +17,9 @@ import
     idents,
     renderer
   ],
+  compiler/utils/[
+    idioms
+  ],
   std/[
     hashes,
     intsets,
@@ -128,6 +131,29 @@ proc lookupInRecord(n: PNode, field: PIdent): PSym =
     if n.sym.name.id == field.id: result = n.sym
   else: return nil
 
+func lookupInRecord*(n: PNode, pos: int): PSym =
+  ## Searches record AST `n` for a symbol with position `pos`, returning
+  ## the symbol if one is found.
+  case n.kind
+  of nkSym:
+    if n.sym.position == pos:
+      return n.sym
+  of nkRecList:
+    for it in n.items:
+      result = lookupInRecord(it, pos)
+      if result != nil:
+        return
+  of nkRecCase:
+    if n[0].sym.position == pos:
+      return n[0].sym
+
+    for i in 1..<n.len:
+      result = lookupInRecord(n[i][^1], pos)
+      if result != nil:
+        return
+  else:
+    unreachable(n.kind)
+
 proc getModule*(s: PSym): PSym =
   ## if it's a module returns itself, otherwise looks through `s`' owners, may
   ## return nil if none are found.
diff --git a/compiler/ast/types.nim b/compiler/ast/types.nim
index 92e7b05be53..e2b137e0d19 100644
--- a/compiler/ast/types.nim
+++ b/compiler/ast/types.nim
@@ -1346,6 +1346,19 @@ proc lookupFieldAgain*(ty: PType; field: PSym): PSym =
     ty = ty[0]
   if result == nil: result = field
 
+proc lookupInType*(ty: PType, position: int): PSym =
+  ## Looks up and returns the field with the given `position` in `ty`. Returns
+  ## nil if there's no such field. `ty` is expected to be a fully resolved
+  ## ``object`` or ``ref object``/``ptr object`` type.
+  var ty = ty.skipTypes(skipPtrs + tyUserTypeClasses + tyDistinct)
+  while ty != nil:
+    ty = ty.skipTypes(skipPtrs)
+    assert ty.kind in {tyTuple, tyObject}
+    result = lookupInRecord(ty.n, position)
+    if result != nil:
+      break
+    ty = ty[0]
+
 proc isCharArrayPtr*(t: PType; allowPointerToChar: bool): bool =
   let t = t.skipTypes(abstractInst)
   if t.kind == tyPtr:
diff --git a/compiler/backend/cgirgen.nim b/compiler/backend/cgirgen.nim
index b5a16a2ea78..e5a362711b1 100644
--- a/compiler/backend/cgirgen.nim
+++ b/compiler/backend/cgirgen.nim
@@ -351,12 +351,16 @@ proc lvalueToIr(tree: MirBody, cl: var TranslateCl, n: MirNode,
   of mnkLocal, mnkGlobal, mnkParam, mnkTemp, mnkAlias, mnkConst, mnkProc:
     return atomToIr(n, cl, info)
   of mnkPathNamed:
+    let obj = recurse()
     result = newExpr(cnkFieldAccess, info, n.typ,
-                     [recurse(), newFieldNode(n.field)])
+                     [obj, newFieldNode(lookupInType(obj.typ, n.field.int))])
   of mnkPathVariant:
     if preferField:
-      result = newExpr(cnkFieldAccess, cr.info, n.field.typ,
-                      [recurse(), newFieldNode(n.field)])
+      let
+        obj = recurse()
+        field = lookupInType(obj.typ, n.field.int)
+      result = newExpr(cnkFieldAccess, info, field.typ,
+                      [obj, newFieldNode(field)])
     else:
       # variant access itself has no ``CgNode`` counterpart at the moment
       result = recurse()
@@ -1021,7 +1025,7 @@ proc exprToIr(tree: MirBody, cl: var TranslateCl,
   of mnkObjConstr:
     assert n.typ.skipTypes(abstractVarRange).kind in {tyObject, tyRef}
     treeOp cnkObjConstr:
-      let f = newFieldNode(get(tree, cr).field)
+      let f = newFieldNode(lookupInType(n.typ, get(tree, cr).field))
       res.add newTree(cnkBinding, cr.info, [f, argToIr(tree, cl, cr)[1]])
   of mnkCall:
     callToIr(tree, cl, n, cr)
diff --git a/compiler/backend/compat.nim b/compiler/backend/compat.nim
index bc40143ec3d..3e9c452187d 100644
--- a/compiler/backend/compat.nim
+++ b/compiler/backend/compat.nim
@@ -158,9 +158,11 @@ proc translate*(t: MirTree): CgNode =
     case n.kind
     of mnkObjConstr:
       tree cnkObjConstr:
-        let field = translateAux(t, i)
+        let field = lookupInType(n.typ, t[i].field.int)
+        inc i # advance to the arg node
         CgNode(kind: cnkBinding, info: unknownLineInfo,
-               kids: @[field, translateAux(t, i)])
+               kids: @[CgNode(kind: cnkField, field: field),
+                       translateAux(t, i)])
     of mnkArrayConstr, mnkSeqConstr:
       tree cnkArrayConstr:
         translateAux(t, i)
@@ -185,11 +187,9 @@ proc translate*(t: MirTree): CgNode =
     of mnkStrLit:
       CgNode(kind: cnkStrLit, info: unknownLineInfo, typ: n.typ,
              strVal: n.strVal)
-    of mnkField:
-      CgNode(kind: cnkField, info: unknownLineInfo, field: n.field)
     of mnkProc:
       CgNode(kind: cnkProc, info: unknownLineInfo, prc: n.prc, typ: n.typ)
-    of AllNodeKinds - ConstrTreeNodes + {mnkEnd}:
+    of AllNodeKinds - ConstrTreeNodes + {mnkEnd, mnkField}:
       # 'end' nodes are skipped manually
       unreachable(n.kind)
 
diff --git a/compiler/mir/datatables.nim b/compiler/mir/datatables.nim
index 2e3e2bfcd3a..69378d5554c 100644
--- a/compiler/mir/datatables.nim
+++ b/compiler/mir/datatables.nim
@@ -57,7 +57,7 @@ func hashTree(tree: ConstrTree): Hash =
        mnkClosureConstr, mnkObjConstr:
       result = result !& hash(n.len)
     of mnkField:
-      result = result !& hash(n.field.id)
+      result = result !& hash(n.field)
     of mnkArg, mnkEnd:
       discard
     of AllNodeKinds - ConstrTreeNodes:
@@ -107,7 +107,7 @@ proc cmp(a, b: ConstrTree): bool =
        mnkClosureConstr, mnkObjConstr:
       a.len == b.len
     of mnkField:
-      a.field.id == b.field.id
+      a.field == b.field
     of mnkArg, mnkEnd:
       true # same node kind -> equal nodes
     of AllNodeKinds - ConstrTreeNodes:
diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index 30bd4c6ef2b..17a7b3f1adf 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -545,7 +545,7 @@ proc genFieldCheck(c: var TCtx, access: Value, call: PNode, inverted: bool,
       # discriminator value operand:
       c.subTree mnkArg:
         c.subTree MirNode(kind: mnkPathNamed, typ: discr.typ,
-                          field: discr):
+                          field: discr.position.int32):
           c.use access
       # inverted flag:
       c.emitByVal literal(newIntTypeNode(ord(inverted), call.typ))
@@ -1152,7 +1152,7 @@ proc genObjConstr(c: var TCtx, n: PNode, isConsume: bool) =
         (isRef or isConsume) and
         sfCursor notin field.flags
 
-      c.add MirNode(kind: mnkField, field: field)
+      c.add MirNode(kind: mnkField, field: field.position.int32)
       c.emitOperandTree it[1], useConsume
 
 proc genRaise(c: var TCtx, n: PNode) =
@@ -1705,14 +1705,16 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
     c.subTree MirNode(kind: mnkPathPos, typ: n.typ, position: n.pos):
       recurse()
   of pirFieldAccess:
-    c.subTree MirNode(kind: mnkPathNamed, typ: n.typ, field: n.field):
+    c.subTree MirNode(kind: mnkPathNamed, typ: n.typ,
+                      field: n.field.position.int32):
       recurse()
   of pirArrayAccess, pirSeqAccess:
     c.buildOp mnkPathArray, n.typ:
       recurse()
       c.use toValue(c, e, n.index)
   of pirVariantAccess:
-    c.subTree MirNode(kind: mnkPathVariant, typ: n.typ, field: n.field):
+    c.subTree MirNode(kind: mnkPathVariant, typ: n.typ,
+                      field: n.field.position.int32):
       recurse()
   of pirLvalueConv:
     c.buildOp mnkPathConv, n.typ:
@@ -1735,7 +1737,8 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
       variant = toValue(c, e, i - 1)
       discr = genCheckedVariantAccess(c, variant, n.orig[0][1].sym.name,
                                       n.orig[n.nodeIndex])
-    c.subTree MirNode(kind: mnkPathVariant, typ: n.typ, field: discr):
+    c.subTree MirNode(kind: mnkPathVariant, typ: n.typ,
+                      field: discr.position.int32):
       c.use variant
   of pirCheckedObjConv:
     let
@@ -1941,7 +1944,7 @@ proc gen(c: var TCtx, n: PNode) =
         # the 'switch' operations expects a variant access as the first
         # operand
         c.subTree MirNode(kind: mnkPathVariant, typ: dest[^2].typ,
-                          field: dest[^1].field):
+                          field: dest[^1].field.position.int32):
           genx(c, dest, dest.len - 2)
 
         genAsgnSource(c, n[1], {dfOwns}) # the source operand
@@ -2222,7 +2225,7 @@ proc constDataToMir*(env: var MirEnv, n: PNode): MirTree =
       # table entries, even though the values they represent are equivalent
       bu.subTree MirNode(kind: mnkObjConstr, typ: n.typ, len: n.len-1):
         for i in 1..<n.len:
-          bu.add MirNode(kind: mnkField, field: n[i][0].sym)
+          bu.add MirNode(kind: mnkField, field: n[i][0].sym.position.int32)
           bu.subTree mnkArg:
             constToMirAux(bu, env, n[i][1])
     of nkCurly:
diff --git a/compiler/mir/mirtrees.nim b/compiler/mir/mirtrees.nim
index f600ce5ab68..9c34f46319d 100644
--- a/compiler/mir/mirtrees.nim
+++ b/compiler/mir/mirtrees.nim
@@ -280,7 +280,8 @@ type
     of mnkParam, mnkLocal, mnkTemp, mnkAlias:
       local*: LocalId
     of mnkField, mnkPathNamed, mnkPathVariant:
-      field*: PSym
+      field*: int32
+        ## field position
     of mnkLiteral:
       lit*: PNode
     of mnkStrLit:
diff --git a/compiler/mir/utils.nim b/compiler/mir/utils.nim
index fd252b96fe5..86e922178bb 100644
--- a/compiler/mir/utils.nim
+++ b/compiler/mir/utils.nim
@@ -12,6 +12,7 @@ import
   compiler/ast/[
     ast_types,
     renderer,
+    types,
     typesrenderer,
   ],
   compiler/mir/[
@@ -37,7 +38,7 @@ func `$`(n: MirNode): string =
     result.addInt n.local.uint32
   of mnkField, mnkPathNamed, mnkPathVariant:
     result.add " field:"
-    result.add $n.field.name.s
+    result.addInt n.field
   of mnkLiteral:
     result.add " lit: "
     {.cast(noSideEffect).}:
@@ -226,9 +227,10 @@ proc valueToStr(nodes: MirTree, i: var int, result: var string, c: RenderCtx) =
       result.addInt n.position
   of mnkPathNamed, mnkPathVariant:
     tree "":
+      let typ = nodes[i].typ # type of the object operand
       valueToStr()
       result.add "."
-      result.add n.field.name.s
+      result.add lookupInType(typ, n.field).name.s
   of mnkPathConv:
     tree "":
       valueToStr()
@@ -345,9 +347,11 @@ proc exprToStr(nodes: MirTree, i: var int, result: var string, c: RenderCtx) =
       result.add " .. "
       valueToStr()
   of mnkObjConstr:
+    let typ = nodes[i].typ
     tree "(":
       commaSeparated:
-        result.add next(nodes, i).field.name.s & ": "
+        let field = lookupInType(typ, next(nodes, i).field.int)
+        result.add field.name.s & ": "
         argToStr()
       result.add ")"
   of mnkCall:
diff --git a/compiler/sem/injectdestructors.nim b/compiler/sem/injectdestructors.nim
index 5320861c77e..61d21c44289 100644
--- a/compiler/sem/injectdestructors.nim
+++ b/compiler/sem/injectdestructors.nim
@@ -759,7 +759,8 @@ proc lowerBranchSwitch(bu: var MirBuilder, body: MirTree, graph: ModuleGraph,
   let
     target = body.operand(stmt, 0)
     objType = body[target].typ
-    typ = body[target].field.typ
+    field = lookupInType(objType, body[target].field.int)
+    typ = field.typ
 
   assert body[target].kind == mnkPathVariant
   # the source expression must either be an rvalue, or there must be a
@@ -793,7 +794,7 @@ proc lowerBranchSwitch(bu: var MirBuilder, body: MirTree, graph: ModuleGraph,
     #      field alignment, however.
     let branchDestructor = produceDestructorForDiscriminator(
                             graph, objType,
-                            body[target].field,
+                            field,
                             unknownLineInfo, idgen
                            )
 
diff --git a/compiler/vm/packed_env.nim b/compiler/vm/packed_env.nim
index c3778c04ec6..4cae4cab4dc 100644
--- a/compiler/vm/packed_env.nim
+++ b/compiler/vm/packed_env.nim
@@ -300,14 +300,16 @@ func storeDiscrData(enc: var DataEncoder, e: var PackedEnv, s: PSym, v: PNode) =
 
 proc storeFieldsData(enc: var DataEncoder, e: var PackedEnv,
                      t: MirTree, n: NodePosition) =
-  let count = t[n].len
+  let
+    typ = t[n].typ
+    count = t[n].len
   enc.put e, PackedDataNode(kind: pdkObj, pos: count.uint32)
   e.nodes.growBy(count * 2) # make space for the content
 
   # iterate over all fields in the construction and pack and store them:
   var n = n + 1
   for _ in 0..<count:
-    let s = t[n].field ## the field symbol
+    let s = lookupInType(typ, t[n].field.int) ## the field symbol
     inc n # move the cursor to the field's data
 
     enc.put e, PackedDataNode(kind: pdkField, pos: s.position.uint32)
diff --git a/compiler/vm/vmcompilerserdes.nim b/compiler/vm/vmcompilerserdes.nim
index 0a58623284c..0d1f2771dab 100644
--- a/compiler/vm/vmcompilerserdes.nim
+++ b/compiler/vm/vmcompilerserdes.nim
@@ -4,6 +4,7 @@ import
   compiler/ast/[
     ast_types,
     ast,
+    astalgo,
     errorhandling,
     lineinfos,
     nimsets,
@@ -87,31 +88,6 @@ proc deserializeRef*(c: TCtx, slot: HeapSlotHandle, vt: PVmType; f, con: PType,
 proc deserialize(c: TCtx, m: VmMemoryRegion, vt: PVmType, formal: PType, info: TLineInfo): PNode {.inline.} =
   deserialize(c, m, vt, formal, formal.skipTypes(SkipSet), info)
 
-
-# TODO: record walking is implemented multiple times in multiple different
-#       places across the compiler. An `iterator` encapsulating the logic would
-#       probably make sense...
-func findField(n: PNode, pos: int): PSym =
-  case n.kind
-  of nkSym:
-    if n.sym.position == pos:
-      return n.sym
-  of nkRecList:
-    for x in n.items:
-      result = findField(x, pos)
-      if result != nil:
-        return
-  of nkRecCase:
-    if n[0].sym.position == pos:
-      return n[0].sym
-
-    for i in 1..<n.len:
-      result = findField(lastSon(n[i]), pos)
-      if result != nil:
-        return
-  else:
-    unreachable()
-
 proc deserializeTuple(c: TCtx, m: VmMemoryRegion, vt: PVmType; formal, ty: PType, info: TLineInfo): PNode =
   assert vt.kind == akObject
 
@@ -163,7 +139,7 @@ proc deserializeObjectPart(c: TCtx,
     # no variant object
     for i in start..<vt.objFields.len:
       let f = vt.objFields[i]
-      let sym = findField(ty.n, vt.toFieldPos(FieldIndex i).int)
+      let sym = lookupInRecord(ty.n, vt.toFieldPos(FieldIndex i).int)
       dest.sons[result.cIdx] = constrField(f, sym)
       inc result.cIdx
 
@@ -181,7 +157,7 @@ proc deserializeObjectPart(c: TCtx,
       let r = iter.get()
       if r.valid:
         let f = vt.fieldAt(r.idx)
-        let sym = findField(ty.n, vt.toFieldPos(r.idx).int)
+        let sym = lookupInRecord(ty.n, vt.toFieldPos(r.idx).int)
         assert sym.typ != nil
         dest.sons[result.cIdx] = constrField(f, sym)
         inc result.cIdx
diff --git a/compiler/vm/vmserialize.nim b/compiler/vm/vmserialize.nim
index 6887d8853ff..09087968c42 100644
--- a/compiler/vm/vmserialize.nim
+++ b/compiler/vm/vmserialize.nim
@@ -124,7 +124,7 @@ proc initFromExpr(dest: LocHandle, tree: MirTree, n: var int, env: MirEnv,
       let typ = tree[n].typ.skipTypes(abstractPtrs) ## the object's type
       iterTree(i):
         let
-          sym = next().field
+          sym = lookupInType(typ, next().field)
           field = dest.getFieldHandle(sym.position.FieldPosition)
         # object types require special handling for tag fields
         if sfDiscriminant in sym.flags:
diff --git a/tests/compiler/tdatatables.nim b/tests/compiler/tdatatables.nim
index ef81b9b66c9..63fb970d2a9 100644
--- a/tests/compiler/tdatatables.nim
+++ b/tests/compiler/tdatatables.nim
@@ -12,8 +12,6 @@ let
   t1 = PType(itemId: ItemId(item: 1), kind: tyObject, sons: @[PType nil])
   t2 = PType(itemId: ItemId(item: 2), kind: tyObject, sons: @[PType nil])
   t3 = PType(itemId: ItemId(item: 3), kind: tyObject, sons: @[PType nil])
-  field1 = PSym(itemId: ItemId(item: 1))
-  field2 = PSym(itemId: ItemId(item: 2))
 
 # node constructor
 template node(k: MirNodeKind, t: PType, field, val: untyped): MirNode =
@@ -54,25 +52,25 @@ block tree_equality:
     @[node(mnkObjConstr, t1, len, 0), node(mnkEnd)],
     @[node(mnkObjConstr, t2, len, 0), node(mnkEnd)],
     @[node(mnkObjConstr, t1, len, 1),
-        node(mnkField, field, field1),
+        node(mnkField, field, 0),
         node(mnkArg), literal(newIntNode(nkIntLit, 0)), node(mnkEnd),
       node(mnkEnd)],
     # same field value, different field:
     @[node(mnkObjConstr, t1, len, 1),
-        node(mnkField, field, field2),
+        node(mnkField, field, 1),
         node(mnkArg), literal(newIntNode(nkIntLit, 0)), node(mnkEnd),
       node(mnkEnd)],
     @[node(mnkObjConstr, t1, len, 1),
-        node(mnkField, field, field1),
+        node(mnkField, field, 0),
         node(mnkArg), literal(newIntNode(nkIntLit, 0)), node(mnkEnd),
-        node(mnkField, field, field2),
+        node(mnkField, field, 1),
         node(mnkArg), literal(newIntNode(nkIntLit, 0)), node(mnkEnd),
       node(mnkEnd)],
     # swapped fields
     @[node(mnkObjConstr, t1, len, 1),
-        node(mnkField, field, field2),
+        node(mnkField, field, 1),
         node(mnkArg), literal(newIntNode(nkIntLit, 0)), node(mnkEnd),
-        node(mnkField, field, field1),
+        node(mnkField, field, 0),
         node(mnkArg), literal(newIntNode(nkIntLit, 0)), node(mnkEnd),
       node(mnkEnd)]
   ]

From aecf3670464f571bf4e4b7f9a4a93e42bd80dec6 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sun, 7 Apr 2024 01:46:06 +0200
Subject: [PATCH 058/169] mir: split up `mnkLiteral` (#1270)

## Summary

Split up `mnkLiteral` into its constituent kinds and replace the
`PNode`-based data representation for literals with a data-oriented
one. This removes the last `ref` type usage from within the `MirNode`
record-case. In addition, comparing numeric values becomes a single
integer comparison.

## Details

`mnkLiteral` is split into `mnkNilLit`, `mnkIntLit`, `mnkUIntLit`,
`mnkFloatLit`, and `mnkAstLit`. Same as with the CGIR, numeric type
width is not part of the syntax (it's not needed).

The `MirNode` variant for the numeric literal nodes stores a
`NumberId`, which is a `LitId` uniquely identifying a bit-pattern
(stored as `BiggestInt` in `MirEnv.numbers`).

A shared storage is used because:
* it's easier to implement (one table instead of three; no special
  handling for floats is needed)
* less memory usage (value storage is shared between the three numeric
  literal kinds)
* only one ID type is needed, instead of three
* reinterpreting bit-patterns is made slightly easier

Literal ASTs (identified by the new `AstId` type) don't use a table,
only a `Store`. Their sparse usage doesn't warrant the implementation
complexity / run-time overhead of hashing/comparing the trees (though
`treetabs` could be used).

### Translation

* for integer and float literals, `mirgen` performs the same
  translation that `cgirgen` previously did in `translateLit`
* so that the code generators don't need to be adjusted, the CGIR still
  stores the numeric and AST values directly in `CgNode`
* to prevent excessive parameter passing in `cgirgen`, a pointer to the
  `MirEnv` is stored in `TranslateCl`. Access to the environment is
  needed for looking up the values for `NumberId` and `AstId`
* `compat.translate` now requires a `MirEnv` argument, for looking up
  the numerical values
* `cgirgen.translateLit` is obsolete and thus removed
* raw field symbols are transported to the code generator via a
  `mnkAstLit`/`cnkAstLit` (a `mnkLiteral` node was previously used)

### VM backend

* the `MirEnv.numbers` table is re-used for the `PackedEnv`. This
  allows for also re-using the `NumberId`s (they can be treated
  directly as a `LitId`)
* the serialization logic is adjusted to the new MIR syntax

### Tests

* the `mnkLiteral` usage in `tdatatables.nim` is replaced
* `tcompilerapi.nim` passed untyped float values to
  `nimeval.callRoutine`, which no longer works, since `constDataToMir`
  always expects typed literal nodes now. The test is changed to pass
  typed `nkFloatLit` nodes
---
 compiler/backend/ccgexprs.nim      |  6 +-
 compiler/backend/ccgstmts.nim      |  4 +-
 compiler/backend/cgirgen.nim       | 64 ++++++---------------
 compiler/backend/compat.nim        | 41 +++++++++-----
 compiler/backend/jsgen.nim         |  4 +-
 compiler/mir/datatables.nim        | 48 ++++------------
 compiler/mir/injecthooks.nim       |  6 +-
 compiler/mir/mirconstr.nim         |  9 ++-
 compiler/mir/mirenv.nim            | 22 ++++++++
 compiler/mir/mirgen.nim            | 90 ++++++++++++++++++++++++------
 compiler/mir/mirtrees.nim          | 26 ++++++---
 compiler/mir/utils.nim             | 80 +++++++++++++++++++++-----
 compiler/sem/aliasanalysis.nim     |  4 +-
 compiler/vm/compilerbridge.nim     | 12 ++--
 compiler/vm/packed_env.nim         | 80 +++++++++++---------------
 compiler/vm/vmbackend.nim          |  3 +-
 compiler/vm/vmserialize.nim        | 31 +++++-----
 tests/compiler/tdatatables.nim     | 37 ++++++------
 tests/compilerapi/tcompilerapi.nim |  8 ++-
 19 files changed, 339 insertions(+), 236 deletions(-)

diff --git a/compiler/backend/ccgexprs.nim b/compiler/backend/ccgexprs.nim
index 69d1d66f913..c48ddd6484e 100644
--- a/compiler/backend/ccgexprs.nim
+++ b/compiler/backend/ccgexprs.nim
@@ -1972,7 +1972,7 @@ proc genConstDefinition*(q: BModule; id: ConstId) =
   let name = mangleName(q.g.graph, sym)
   if exfNoDecl notin sym.extFlags:
     let p = newProc(nil, q)
-    let data = translate(q.g.env[q.g.env.dataFor(id)])
+    let data = translate(q.g.env[q.g.env.dataFor(id)], q.g.env)
     q.s[cfsData].addf("N_LIB_PRIVATE NIM_CONST $1 $2 = $3;$n",
         [getTypeDesc(q, sym.typ), name,
         genBracedInit(p, data, sym.typ)])
@@ -1992,7 +1992,7 @@ proc useData(p: BProc, x: ConstId, typ: PType): string =
     inc p.module.labels
     p.module.s[cfsData].addf("static NIM_CONST $1 $2 = $3;$n",
       [getTypeDesc(p.module, typ), result,
-       genBracedInit(p, translate(p.env[id]), typ)])
+       genBracedInit(p, translate(p.env[id], p.env), typ)])
 
 proc expr(p: BProc, n: CgNode, d: var TLoc) =
   when defined(nimCompilerStacktraceHints):
@@ -2012,7 +2012,7 @@ proc expr(p: BProc, n: CgNode, d: var TLoc) =
     if isSimpleConst(p.config, n.typ):
       # simple constants are inlined at the usage site
       let da = p.env.dataFor(n.cnst)
-      let val = translate(p.env[da])
+      let val = translate(p.env[da], p.env)
       if val.kind == cnkSetConstr:
         let cs = toBitSet(p.config, val)
         putIntoDest(p, d, n, genRawSetData(cs, int(getSize(p.config, n.typ))))
diff --git a/compiler/backend/ccgstmts.nim b/compiler/backend/ccgstmts.nim
index bf7220ecd3e..3bed1798f6a 100644
--- a/compiler/backend/ccgstmts.nim
+++ b/compiler/backend/ccgstmts.nim
@@ -398,8 +398,8 @@ proc genAsmOrEmitStmt(p: BProc, t: CgNode, isAsmStmt=false): Rope =
     case it.kind
     of cnkStrLit:
       res.add(getString(p, it))
-    of cnkField:
-        let sym = it.field
+    of cnkAstLit:
+        let sym = it.astLit.sym
         # special support for raw field symbols
         discard getTypeDesc(p.module, skipTypes(sym.typ, abstractPtrs))
         p.config.internalAssert(sym.locId != 0, it.info):
diff --git a/compiler/backend/cgirgen.nim b/compiler/backend/cgirgen.nim
index e5a362711b1..810ae605c04 100644
--- a/compiler/backend/cgirgen.nim
+++ b/compiler/backend/cgirgen.nim
@@ -55,6 +55,9 @@ type
   TranslateCl = object
     graph: ModuleGraph
     idgen: IdGenerator
+    env: ptr MirEnv
+      ## read-only reference to the MirEnv. Stored here to prevent excessive
+      ## parameter passing
 
     owner: PSym
 
@@ -184,48 +187,6 @@ proc newExpr(kind: CgNodeKind, info: TLineInfo, typ: PType,
   result = CgNode(kind: kind, info: info, typ: typ)
   result.kids = kids
 
-proc translateLit*(val: PNode): CgNode =
-  ## Translates an ``mnkLiteral`` node to a ``CgNode``.
-  ## Note that the MIR not only uses ``mnkLiteral`` for "real" literals, but
-  ## also for pushing other raw ``PNode``s through the MIR phase.
-  template node(k: CgNodeKind, field, value: untyped): CgNode =
-    CgNode(kind: k, info: val.info, typ: val.typ, field: value)
-
-  case val.kind
-  of nkIntLiterals:
-    # use the type for deciding what whether it's a signed or unsigned value
-    case val.typ.skipTypes(abstractRange + {tyEnum}).kind
-    of tyInt..tyInt64, tyBool:
-      node(cnkIntLit, intVal, val.intVal)
-    of tyUInt..tyUInt64, tyChar:
-      node(cnkUIntLit, intVal, val.intVal)
-    of tyPtr, tyPointer, tyProc:
-      # XXX: consider adding a dedicated node for pointer-like-literals
-      #      to both ``PNode`` and ``CgNode``
-      node(cnkUIntLit, intVal, val.intVal)
-    else:
-      unreachable(val.typ.skipTypes(abstractRange).kind)
-  of nkFloatLiterals:
-    case val.typ.skipTypes(abstractRange).kind
-    of tyFloat, tyFloat64:
-      node(cnkFloatLit, floatVal, val.floatVal)
-    of tyFloat32:
-      # all code-generators need to do this at one point, so we help them out
-      # by narrowing the value to a float32 value
-      node(cnkFloatLit, floatVal, val.floatVal.float32.float64)
-    else:
-      unreachable()
-  of nkNilLit:
-    newNode(cnkNilLit, val.info, val.typ)
-  of nkNimNodeLit:
-    node(cnkAstLit, astLit, val[0])
-  of nkSym:
-    # special case for raw symbols used with emit and asm statements
-    assert val.sym.kind == skField
-    node(cnkField, field, val.sym)
-  else:
-    unreachable("implement: " & $val.kind)
-
 func addIfNotEmpty(stmts: var seq[CgNode], n: sink CgNode) =
   ## Only adds the node to the list if it's not an empty node. Used to prevent
   ## the creation of statement-list expression that only consist of empty
@@ -308,10 +269,21 @@ proc atomToIr(n: MirNode, cl: TranslateCl, info: TLineInfo): CgNode =
       typ = cl.locals[id].typ
     # the view is auto-dereferenced here for convenience
     newOp(cnkDerefView, info, typ.base, newLocalRef(id, info, typ))
-  of mnkLiteral:
-    translateLit(n.lit)
+  of mnkNilLit:
+    CgNode(kind: cnkNilLit, info: info, typ: n.typ)
+  of mnkIntLit:
+    CgNode(kind: cnkIntLit, info: info, typ: n.typ,
+           intVal: cl.env[].getInt(n.number))
+  of mnkUIntLit:
+    CgNode(kind: cnkUIntLit, info: info, typ: n.typ,
+           intVal: cl.env[].getInt(n.number))
+  of mnkFloatLit:
+    CgNode(kind: cnkFloatLit, info: info, typ: n.typ,
+           floatVal: cl.env[].getFloat(n.number))
   of mnkStrLit:
     CgNode(kind: cnkStrLit, info: info, typ: n.typ, strVal: n.strVal)
+  of mnkAstLit:
+    CgNode(kind: cnkAstLit, info: info, typ: n.typ, astLit: cl.env[][n.ast])
   of mnkType:
     newTypeNode(info, n.typ)
   of mnkNone:
@@ -1112,8 +1084,8 @@ proc generateIR*(graph: ModuleGraph, idgen: IdGenerator, env: MirEnv,
                  body: sink MirBody): Body =
   ## Generates the ``CgNode`` IR corresponding to the input MIR `body`,
   ## using `idgen` to provide new IDs when creating symbols.
-  var cl = TranslateCl(graph: graph, idgen: idgen, owner: owner,
-                       locals: move body.locals)
+  var cl = TranslateCl(graph: graph, idgen: idgen, env: addr env,
+                       owner: owner, locals: move body.locals)
   # enable translation:
   cl.isActive = true
 
diff --git a/compiler/backend/compat.nim b/compiler/backend/compat.nim
index 3e9c452187d..a7df7f69db9 100644
--- a/compiler/backend/compat.nim
+++ b/compiler/backend/compat.nim
@@ -32,8 +32,6 @@ import
     int128
   ]
 
-from compiler/backend/cgirgen import translateLit
-
 func lastSon*(n: CgNode): CgNode {.inline.} =
   # XXX: replace usages with `n[^1]`
   {.cast(noSideEffect).}:
@@ -137,11 +135,14 @@ proc newSymNode*(env: MirEnv, s: PSym): CgNode {.inline.} =
   else:
     unreachable(s.kind)
 
-proc translate*(t: MirTree): CgNode =
+proc translate*(t: MirTree, env: MirEnv): CgNode =
   ## Compatibility routine for translating a MIR constant-expression (`t`) to
   ## a ``CgNode`` tree. Obsolete once the code generators use the MIR
   ## directly.
-  proc translateAux(t: MirTree, i: var int): CgNode =
+  proc translateAux(t: MirTree, i: var int, env: MirEnv): CgNode =
+    template recurse(): CgNode =
+      translateAux(t, i, env)
+
     template tree(k: CgNodeKind, body: untyped): CgNode =
       ## Convenience template for setting up the tree node and iterating the
       ## input node's child nodes.
@@ -162,31 +163,43 @@ proc translate*(t: MirTree): CgNode =
         inc i # advance to the arg node
         CgNode(kind: cnkBinding, info: unknownLineInfo,
                kids: @[CgNode(kind: cnkField, field: field),
-                       translateAux(t, i)])
+                       recurse()])
     of mnkArrayConstr, mnkSeqConstr:
       tree cnkArrayConstr:
-        translateAux(t, i)
+        recurse()
     of mnkTupleConstr:
       tree cnkTupleConstr:
-        translateAux(t, i)
+        recurse()
     of mnkClosureConstr:
       tree cnkClosureConstr:
-        translateAux(t, i)
+        recurse()
     of mnkSetConstr:
       tree cnkSetConstr:
-        translateAux(t, i)
+        recurse()
     of mnkRange:
       tree cnkRange:
-        translateAux(t, i)
+        recurse()
     of mnkArg:
-      let x = translateAux(t, i)
+      let x = recurse()
       inc i # skip the end node
       x
-    of mnkLiteral:
-      translateLit(n.lit)
+    of mnkNilLit:
+      CgNode(kind: cnkNilLit, info: unknownLineInfo, typ: n.typ)
+    of mnkIntLit:
+      CgNode(kind: cnkIntLit, info: unknownLineInfo, typ: n.typ,
+             intVal: env.getInt(n.number))
+    of mnkUIntLit:
+      CgNode(kind: cnkUIntLit, info: unknownLineInfo, typ: n.typ,
+             intVal: env.getInt(n.number))
+    of mnkFloatLit:
+      CgNode(kind: cnkFloatLit, info: unknownLineInfo, typ: n.typ,
+             floatVal: env.getFloat(n.number))
     of mnkStrLit:
       CgNode(kind: cnkStrLit, info: unknownLineInfo, typ: n.typ,
              strVal: n.strVal)
+    of mnkAstLit:
+      CgNode(kind: cnkAstLit, info: unknownLineInfo, typ: n.typ,
+             astLit: env[n.ast])
     of mnkProc:
       CgNode(kind: cnkProc, info: unknownLineInfo, prc: n.prc, typ: n.typ)
     of AllNodeKinds - ConstrTreeNodes + {mnkEnd, mnkField}:
@@ -194,7 +207,7 @@ proc translate*(t: MirTree): CgNode =
       unreachable(n.kind)
 
   var i = 0
-  translateAux(t, i)
+  translateAux(t, i, env)
 
 proc pick*[T](n: CgNode, forInt, forFloat: T): T =
   ## Returns either `forInt` or `forFloat` depending on the type of `n`.
diff --git a/compiler/backend/jsgen.nim b/compiler/backend/jsgen.nim
index 2fbe90dd04a..4b2f294f25e 100644
--- a/compiler/backend/jsgen.nim
+++ b/compiler/backend/jsgen.nim
@@ -1604,7 +1604,7 @@ proc genConstant*(g: PGlobals, m: BModule, id: ConstId) =
     var p = newInitProc(g, m)
     #genLineDir(p, c.ast)
     genVarInit(p, c.typ, name, storage,
-               translate(g.env[g.env.dataFor(id)]))
+               translate(g.env[g.env.dataFor(id)], g.env))
     g.constants.add(p.body)
 
   # all constants need a name:
@@ -2419,7 +2419,7 @@ proc rdData(p: PProc, data: DataId, typ: PType): TCompRes =
   ## Returns the loc for the `data` of type `typ`. Emits the definition for
   ## `data` if it hasn't been already.
   if not containsOrIncl(p.g.dataGenerated, data.int):
-    let val = gen(p, translate(p.env[data]))
+    let val = gen(p, translate(p.env[data], p.env))
     # emit the definition into the constants section:
     p.g.constants.addf("var Data$1 = $2;$n", [$ord(data), val.res])
 
diff --git a/compiler/mir/datatables.nim b/compiler/mir/datatables.nim
index 69378d5554c..b8d1604862f 100644
--- a/compiler/mir/datatables.nim
+++ b/compiler/mir/datatables.nim
@@ -6,7 +6,6 @@ import
     hashes
   ],
   compiler/ast/[
-    ast_query,
     ast_types,
     types
   ],
@@ -34,23 +33,12 @@ func hashTree(tree: ConstrTree): Hash =
   func hash(n: MirNode): Hash {.nimcall.} =
     result = hash(n.kind)
     case n.kind
-    of mnkLiteral:
-      proc hashLit(n: PNode): Hash =
-        case n.kind
-        of nkFloatKinds:
-          # make sure to hash the bit representation, so that NaNs are
-          # accounted for
-          hash(cast[BiggestInt](n.floatVal))
-        of nkIntKinds:
-          hash(n.intVal)
-        of nkNilLit:
-          Hash(0)
-        else:
-          unreachable(n.kind)
-
-      result = result !& hashLit(n.lit)
+    of mnkIntLit, mnkUIntLit, mnkFloatLit:
+      result = result !& hash(n.number)
     of mnkStrLit:
       result = result !& hash(n.strVal)
+    of mnkAstLit:
+      result = result !& hash(n.ast)
     of mnkProc:
       result = result !& hash(n.prc.ord)
     of mnkSetConstr, mnkRange, mnkArrayConstr, mnkSeqConstr, mnkTupleConstr,
@@ -58,7 +46,7 @@ func hashTree(tree: ConstrTree): Hash =
       result = result !& hash(n.len)
     of mnkField:
       result = result !& hash(n.field)
-    of mnkArg, mnkEnd:
+    of mnkArg, mnkEnd, mnkNilLit:
       discard
     of AllNodeKinds - ConstrTreeNodes:
       unreachable(n.kind)
@@ -72,24 +60,6 @@ func hashTree(tree: ConstrTree): Hash =
   result = result !& hash(tree[0].typ.kind)
   result = !$(result)
 
-func cmp(a, b: PNode): bool =
-  ## Compares for equality two nodes storing literal values. For float values,
-  ## their bit-representation is compared.
-  if a.kind != b.kind:
-    return false
-
-  case a.kind
-  of nkIntLiterals:
-    a.intVal == b.intVal
-  of nkFloatLiterals:
-    cast[BiggestUInt](a.floatVal) == cast[BiggestUInt](b.floatVal)
-  of nkStrLiterals:
-    a.strVal == b.strVal
-  of nkNilLit:
-    true
-  else:
-    unreachable(a.kind)
-
 proc cmp(a, b: ConstrTree): bool =
   ## Compares two MIR constant expressions for structural equality.
   proc `==`(a, b: MirNode): bool {.nimcall.} =
@@ -97,10 +67,12 @@ proc cmp(a, b: ConstrTree): bool =
       return false # cannot be the same
 
     case a.kind
-    of mnkLiteral:
-      cmp(a.lit, b.lit)
+    of mnkIntLit, mnkUIntLit, mnkFloatLit:
+      a.number == b.number
     of mnkStrLit:
       a.strVal == b.strVal
+    of mnkAstLit:
+      a.ast == b.ast
     of mnkProc:
       a.prc == b.prc
     of mnkSetConstr, mnkRange, mnkArrayConstr, mnkSeqConstr, mnkTupleConstr,
@@ -108,7 +80,7 @@ proc cmp(a, b: ConstrTree): bool =
       a.len == b.len
     of mnkField:
       a.field == b.field
-    of mnkArg, mnkEnd:
+    of mnkArg, mnkEnd, mnkNilLit:
       true # same node kind -> equal nodes
     of AllNodeKinds - ConstrTreeNodes:
       unreachable(a.kind)
diff --git a/compiler/mir/injecthooks.nim b/compiler/mir/injecthooks.nim
index e6e7f7f5255..7991c478450 100644
--- a/compiler/mir/injecthooks.nim
+++ b/compiler/mir/injecthooks.nim
@@ -25,6 +25,7 @@ import
     mirtrees
   ],
   compiler/modules/[
+    magicsys,
     modulegraphs
   ],
   compiler/sem/[
@@ -41,7 +42,7 @@ from compiler/ast/report_enums import ReportKind
 # XXX: temporary dependency until switch assignments are lowered differently
 from compiler/sem/injectdestructors import buildVoidCall
 
-from compiler/sem/liftdestructors import boolLit, cyclicType
+from compiler/sem/liftdestructors import cyclicType
 
 type
   LocalDiagKind = enum
@@ -154,7 +155,8 @@ template genCopy(bu: var MirBuilder, graph: ModuleGraph, env: var MirEnv,
       # pass whether the copy can potentially introduce cycles as the third
       # parameter:
       let c = maybeCyclic and couldIntroduceCycle(tree, dest)
-      bu.emitByVal literal(boolLit(graph, unknownLineInfo, c))
+      bu.emitByVal literal(mnkIntLit, env.getOrIncl(BiggestInt(c)),
+                           graph.getSysType(unknownLineInfo, tyBool))
 
 proc genDestroy*(bu: var MirBuilder, graph: ModuleGraph, env: var MirEnv,
                  target: Value) =
diff --git a/compiler/mir/mirconstr.nim b/compiler/mir/mirconstr.nim
index 17db7ff3cd2..a783367a995 100644
--- a/compiler/mir/mirconstr.nim
+++ b/compiler/mir/mirconstr.nim
@@ -75,13 +75,16 @@ func endNode*(k: MirNodeKind): MirNode {.inline.} =
 func typeLit*(t: PType): Value =
   Value(node: MirNode(kind: mnkType, typ: t))
 
-func literal*(n: PNode): Value =
-  assert n.kind notin nkStrKinds
-  Value(node: MirNode(kind: mnkLiteral, typ: n.typ, lit: n))
+func literal*(kind: range[mnkIntLit..mnkFloatLit], n: NumberId,
+              typ: PType): Value =
+  Value(node: MirNode(kind: kind, typ: typ, number: n))
 
 func literal*(str: StringId, typ: PType): Value =
   Value(node: MirNode(kind: mnkStrLit, typ: typ, strVal: str))
 
+func literal*(ast: AstId, typ: PType): Value =
+  Value(node: MirNode(kind: mnkAstLit, typ: typ, ast: ast))
+
 func temp*(typ: PType, id: LocalId): Value =
   Value(node: MirNode(kind: mnkTemp, typ: typ, local: id))
 
diff --git a/compiler/mir/mirenv.nim b/compiler/mir/mirenv.nim
index 67b3b966049..9cf1f43f09d 100644
--- a/compiler/mir/mirenv.nim
+++ b/compiler/mir/mirenv.nim
@@ -43,8 +43,13 @@ type
       ## includes both normal globals and threadvars
     procedures*: SymbolTable[ProcedureId, PSym]
 
+    numbers*: BiTable[BiggestInt]
+      ## all numerical values referenced by the MIR, stored as bit patterns
     strings*: BiTable[string]
       ## all string data referenced by the MIR
+    asts*: Store[AstId, PNode]
+      ## all AST fragments referenced by the MIR. No unification is
+      ## performed
 
     bodies*: OrdinalSeq[ConstId, DataId]
       ## associates each user-defined constant with its content
@@ -109,9 +114,26 @@ func `[]`*(env: MirEnv, id: ProcedureId): lent PSym {.inline.} =
 func `[]`*(env: MirEnv, id: DataId): lent ConstrTree {.inline.} =
   env.data[id]
 
+func getInt*(env: MirEnv, id: NumberId): BiggestInt {.inline.} =
+  env.numbers[LitId id]
+
+func getUInt*(env: MirEnv, id: NumberId): BiggestUInt {.inline.} =
+  cast[BiggestUInt](env.numbers[LitId id])
+
+func getFloat*(env: MirEnv, id: NumberId): BiggestFloat {.inline.} =
+  cast[BiggestFloat](env.numbers[LitId id])
+
 func `[]`*(env: MirEnv, id: StringId): lent string {.inline.} =
   env.strings[LitId id]
 
+func `[]`*(env: MirEnv, id: AstId): lent PNode {.inline.} =
+  env.asts[id]
+
+func getOrIncl*(env: var MirEnv, v: BiggestInt|BiggestUInt|BiggestFloat
+               ): NumberId {.inline.} =
+  ## If not registered already, adds `v` to the environment.
+  NumberId env.numbers.getOrIncl(cast[BiggestInt](v))
+
 func getOrIncl*(env: var MirEnv, str: string): StringId {.inline.} =
   ## If not registered already, adds `str` to the environment.
   StringId env.strings.getOrIncl(str)
diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index 17a7b3f1adf..3b14298f7f8 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -316,8 +316,54 @@ func addLocal(c: var TCtx, s: PSym): LocalId =
 proc empty(c: var TCtx, n: PNode): MirNode =
   MirNode(kind: mnkNone, typ: n.typ)
 
-func intLiteral(val: Int128, typ: PType): Value =
-  literal(newIntTypeNode(val, typ))
+func intLiteral(env: var MirEnv, val: BiggestInt, typ: PType): Value =
+  literal(mnkIntLit, env.getOrIncl(val), typ)
+
+func uintLiteral(env: var MirEnv, val: BiggestUInt, typ: PType): Value =
+  literal(mnkUIntLit, env.getOrIncl(val), typ)
+
+func floatLiteral(env: var MirEnv, val: BiggestFloat, typ: PType): Value =
+  literal(mnkFloatLit, env.getOrIncl(val), typ)
+
+func astLiteral(env: var MirEnv, val: PNode, typ: PType): Value =
+  literal(env.asts.add(val), typ)
+
+proc toIntLiteral(env: var MirEnv, val: Int128, typ: PType): Value =
+  ## Interprets `val` based on `typ`.
+  if isUnsigned(typ):
+    uintLiteral(env, val.toUInt, typ)
+  else:
+    intLiteral(env, val.toInt, typ)
+
+proc toIntLiteral(env: var MirEnv, n: PNode): Value =
+  ## Translates an integer value (represented by `n`) to its MIR
+  ## counterpart.
+  assert n.kind in nkIntLiterals
+  # use the type for deciding whether it's a signed or unsigned value
+  case n.typ.skipTypes(abstractRange + {tyEnum}).kind
+  of tyInt..tyInt64, tyBool:
+    intLiteral(env, n.intVal, n.typ)
+  of tyUInt..tyUInt64, tyChar, tyPtr, tyPointer, tyProc:
+    uintLiteral(env, cast[BiggestUInt](n.intVal), n.typ)
+  else:
+    unreachable()
+
+proc toFloatLiteral(env: var MirEnv, n: PNode): Value =
+  ## Translates a float value (represented by `n`) to its MIR
+  ## counterpart.
+  assert n.kind in nkFloatLiterals
+  var val = n.floatVal
+  case n.typ.skipTypes(abstractRange).kind
+  of tyFloat, tyFloat64:
+    discard "nothing to adjust"
+  of tyFloat32:
+    # all code-generators would have to narrow the value at some point, so we
+    # help them by doing it here
+    val = val.float32.float64
+  else:
+    unreachable()
+
+  floatLiteral(env, val, n.typ)
 
 func strLiteral(env: var MirEnv, str: string, typ: PType): Value =
   literal(env.getOrIncl(str), typ)
@@ -548,7 +594,7 @@ proc genFieldCheck(c: var TCtx, access: Value, call: PNode, inverted: bool,
                           field: discr.position.int32):
           c.use access
       # inverted flag:
-      c.emitByVal literal(newIntTypeNode(ord(inverted), call.typ))
+      c.emitByVal intLiteral(c.env, ord(inverted), call.typ)
       # error message operand:
       c.emitByVal strLiteral(c.env, genFieldDefect(conf, field, discr),
                              c.graph.getSysType(call.info, tyString))
@@ -742,8 +788,7 @@ proc genMacroCallArgs(c: var TCtx, n: PNode, kind: TSymKind, fntyp: PType) =
     genCallee(c, n[1])
   of skTemplate:
     # for late template invocations, the callee template is an argument
-    c.subTree mnkArg:
-      c.use literal(newTreeIT(nkNimNodeLit, n[1].info, n[1].typ, n[1]))
+    c.emitByVal astLiteral(c.env, n[1], n[1].typ)
   else:
     unreachable(kind)
 
@@ -960,8 +1005,8 @@ proc genMagic(c: var TCtx, n: PNode; m: TMagic) =
           let val = c.wrapTemp(typ): op(c, dest, n, m)
           c.buildDefectMagicCall mChckRange, typ:
             c.emitByVal val
-            c.emitByVal intLiteral(firstOrd(c.graph.config, typ), typ)
-            c.emitByVal intLiteral(lastOrd(c.graph.config, typ), typ)
+            c.emitByVal toIntLiteral(c.env, firstOrd(c.graph.config, typ), typ)
+            c.emitByVal toIntLiteral(c.env, lastOrd(c.graph.config, typ), typ)
         else:
           # no range check is needed
           op(c, dest, n, m)
@@ -1132,8 +1177,8 @@ proc genClosureConstr(c: var TCtx, n: PNode, isConsume: bool) =
         # we ensure that the nil literal has the correct type
         # TODO: prevent a ``nkNilLit`` with no type information from being
         #       created instead
-        c.use literal(newNodeIT(nkNilLit, n[1].info,
-                                c.graph.getSysType(n[1].info, tyNil)))
+        c.add MirNode(kind: mnkNilLit,
+                      typ: c.graph.getSysType(n[1].info, tyNil))
       else:
         genArgExpression(c, n[1], isConsume)
 
@@ -1638,11 +1683,10 @@ proc genAsmOrEmitStmt(c: var TCtx, kind: range[mnkAsm..mnkEmit], n: PNode) =
       if it.typ != nil and it.typ.kind == tyTypeDesc:
         c.use genTypeExpr(c, it)
       elif it.kind == nkSym and it.sym.kind == skField:
-        # emit and asm support using raw symbols. So that we don't
-        # have to allow ``skField``s in general, we special case them
-        # here (by pushing them through the MIR phase boxed as
-        # ``mnkLiteral``s)
-        c.add MirNode(kind: mnkLiteral, lit: it, typ: it.sym.typ)
+        # emit and asm support using raw field symbols. For pushing them
+        # through to the code generators, they're quoted (i.e., boxed into
+        # an AST literal)
+        c.use astLiteral(c.env, it, it.sym.typ)
       else:
         # emit and asm statements support lvalue operands
         genOperand(c, it)
@@ -1689,10 +1733,18 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
     c.use toValue(c.env.procedures.add(n.sym), n.sym.typ)
   of pirLiteral:
     case n.orig.kind
+    of nkNilLit:
+      c.add MirNode(kind: mnkNilLit, typ: n.typ)
+    of nkIntLiterals:
+      c.use toIntLiteral(c.env, n.orig)
+    of nkFloatLiterals:
+      c.use toFloatLiteral(c.env, n.orig)
     of nkStrLiterals:
       c.use strLiteral(c.env, n.orig.strVal, n.typ)
+    of nkNimNodeLit:
+      c.use astLiteral(c.env, n.orig[0], n.typ)
     else:
-      c.use literal(n.orig)
+      unreachable(n.orig.kind)
   of pirLocal, pirGlobal, pirParam, pirConst:
     c.add nameNode(c, n.sym)
   of pirDeref:
@@ -2261,8 +2313,12 @@ proc constDataToMir*(env: var MirEnv, n: PNode): MirTree =
       bu.subTree MirNode(kind: mnkRange, len: 2):
         constToMirAux(bu, env, n[0])
         constToMirAux(bu, env, n[1])
-    of nkIntLiterals, nkFloatLiterals, nkNilLit:
-      bu.use literal(n)
+    of nkNilLit:
+      bu.add MirNode(kind: mnkNilLit, typ: n.typ)
+    of nkIntLiterals:
+      bu.use toIntLiteral(env, n)
+    of nkFloatLiterals:
+      bu.use toFloatLiteral(env, n)
     of nkStrLiterals:
       bu.use strLiteral(env, n.strVal, n.typ)
     of nkHiddenStdConv, nkHiddenSubConv:
diff --git a/compiler/mir/mirtrees.nim b/compiler/mir/mirtrees.nim
index 9c34f46319d..5bf4f28722d 100644
--- a/compiler/mir/mirtrees.nim
+++ b/compiler/mir/mirtrees.nim
@@ -24,11 +24,14 @@ type
     ## Identifies the field of a record type
   ProcedureId* = distinct uint32
     ## Identifies a procedure
-  LiteralId {.used.} = distinct uint32
-    ## Identifies a literal
+  NumberId* = distinct uint32
+    ## Uniquely identifies some numerical value (float, signed int,
+    ## unsigned int). Two values with the same bit pattern have the same ID
   StringId* = distinct uint32
     ## Uniquely identifies a string value. Two strings sharing the same
     ## content map to the same ID
+  AstId* = distinct uint32
+    ## Identifies an AST fragment stored in the MIR environment.
   DataId* = distinct uint32
     ## Identifies a complete constant expression
 
@@ -66,10 +69,12 @@ type
 
     mnkField  ## declarative node only allowed in special contexts
 
-    mnkLiteral ## literal data. Currently represented via a ``PNode``
-    # future direction: split into IntLit, FloatLit, and StrLit and store the
-    # values in a separate table (so that MirNode gets smaller)
+    mnkNilLit  ## nil literal
+    mnkIntLit  ## reference to signed integer literal
+    mnkUIntLit ## reference to unsigned integer literal
+    mnkFloatLit## reference to float literal
     mnkStrLit  ## reference to a literal string
+    mnkAstLit  ## reference to AST fragment
     mnkType    ## a type literal
 
     # future direction:
@@ -282,10 +287,12 @@ type
     of mnkField, mnkPathNamed, mnkPathVariant:
       field*: int32
         ## field position
-    of mnkLiteral:
-      lit*: PNode
+    of mnkIntLit, mnkUIntLit, mnkFloatLit:
+      number*: NumberId
     of mnkStrLit:
       strVal*: StringId
+    of mnkAstLit:
+      ast*: AstId
     of mnkPathPos:
       position*: uint32 ## the 0-based position of the field
     of mnkCall, mnkCheckedCall:
@@ -346,7 +353,8 @@ const
     ## Assignment modifiers. Nodes that can only appear directly in the source
     ## slot of assignments.
 
-  LiteralDataNodes* = {mnkLiteral, mnkStrLit}
+  LiteralDataNodes* = {mnkNilLit, mnkIntLit, mnkUIntLit, mnkFloatLit,
+                       mnkStrLit, mnkAstLit}
 
   ConstrTreeNodes* = {mnkSetConstr, mnkRange, mnkArrayConstr, mnkSeqConstr,
                       mnkTupleConstr, mnkClosureConstr, mnkObjConstr,
@@ -388,7 +396,9 @@ func `==`*(a, b: ConstId): bool {.borrow.}
 func `==`*(a, b: GlobalId): bool {.borrow.}
 func `==`*(a, b: ProcedureId): bool {.borrow.}
 func `==`*(a, b: DataId): bool {.borrow.}
+func `==`*(a, b: NumberId): bool {.borrow.}
 func `==`*(a, b: StringId): bool {.borrow.}
+func `==`*(a, b: AstId): bool {.borrow.}
 
 func isAnon*(id: ConstId): bool =
   ## Returns whether `id` represents an anonymous constant.
diff --git a/compiler/mir/utils.nim b/compiler/mir/utils.nim
index 86e922178bb..7475111a796 100644
--- a/compiler/mir/utils.nim
+++ b/compiler/mir/utils.nim
@@ -10,6 +10,7 @@ import
     strutils
   ],
   compiler/ast/[
+    ast_query,
     ast_types,
     renderer,
     types,
@@ -39,13 +40,15 @@ func `$`(n: MirNode): string =
   of mnkField, mnkPathNamed, mnkPathVariant:
     result.add " field:"
     result.addInt n.field
-  of mnkLiteral:
-    result.add " lit: "
-    {.cast(noSideEffect).}:
-      result.add renderTree(n.lit)
+  of mnkIntLit, mnkUIntLit, mnkFloatLit:
+    result.add " number: "
+    result.addInt n.number.uint32
   of mnkStrLit:
     result.add " strVal: "
     result.addInt n.strVal.uint32
+  of mnkAstLit:
+    result.add " ast: "
+    result.addInt n.ast.uint32
   of mnkPathPos:
     result.add " position: "
     result.add $n.position
@@ -140,12 +143,15 @@ func next(tree: MirTree, i: var int): lent MirNode =
   result = tree[i]
   inc i
 
+func idToStr[I](result: var string, id: I, open: string) =
+  result.add open
+  result.addInt id.uint32
+  result.add ">"
+
 func addName[I](result: var string, id: I, open: string, c: RenderCtx) =
   if c.env.isNil:
     # just render the ID
-    result.add open
-    result.addInt id.uint32
-    result.add ">"
+    idToStr(result, id, open)
   else:
     result.add c.env[][id].name.s
 
@@ -153,12 +159,39 @@ func addLocalName(result: var string, id: LocalId, open: string,
                   c: RenderCtx) =
   if c.body.isNil:
     # render just the ID
-    result.add open
-    result.addInt id.uint32
-    result.add ">"
+    idToStr(result, id, open)
   else:
     result.add c.body[][id].name.s
 
+proc addTypedNumber(result: var string, bits: BiggestInt, typ: PType) =
+  ## Interprets the bit representation `bits` as a value of `typ` and appends
+  ## its rendering to `result`. Errors are output directly into `result`.
+  let typ = typ.skipTypes(abstractRange)
+  case typ.kind
+  of tyInt..tyInt64:
+    result.addInt bits
+    result.add [tyInt: "", "'i8", "'i16", "'i32", "'i64"][typ.kind]
+  of tyUInt..tyUInt64:
+    result.addInt cast[BiggestUInt](bits)
+    result.add [tyUInt: "", "'u8", "'u16", "'u32", "'u64"][typ.kind]
+  of tyFloat..tyFloat64: # must cover every kind the suffix table indexes
+    result.addFloat cast[BiggestFloat](bits)
+    result.add [tyFloat: "", "'f32", "'f64"][typ.kind]
+  of tyEnum, tyBool:
+    # use the name of the enum field
+    block render:
+      # search for the enum field with the given value
+      for it in typ.n.items:
+        if it.sym.position == bits:
+          # found it!
+          result.add it.sym.name.s
+          break render
+      result.add "<invalid enum>"
+  of tyProc, tyPtr, tyPointer:
+    result.addInt cast[BiggestUInt](bits)
+  else:
+    result.add "<invalid literal>"
+
 proc singleToStr(n: MirNode, result: var string, c: RenderCtx) =
   case n.kind
   of mnkParam:
@@ -167,9 +200,7 @@ proc singleToStr(n: MirNode, result: var string, c: RenderCtx) =
     result.addLocalName(n.local, "<L", c)
   of mnkConst:
     if isAnon(n.cnst):
-      result.add "<D" # "D" for "Data"
-      result.addInt extract(n.cnst).uint32
-      result.add ">"
+      idToStr(result, extract(n.cnst), "<D") # "D" for "Data"
     else:
       result.addName(n.cnst, "<C", c)
   of mnkGlobal:
@@ -180,8 +211,23 @@ proc singleToStr(n: MirNode, result: var string, c: RenderCtx) =
     result.add "_" & $n.local.int
   of mnkNone:
     result.add "<none>"
-  of mnkLiteral:
-    result.add $n.lit
+  of mnkNilLit:
+    result.add "nil"
+  of mnkIntLit:
+    if c.env.isNil:
+      idToStr(result, n.number, "<Int: ")
+    else:
+      result.addTypedNumber(c.env[].getInt(n.number), n.typ)
+  of mnkUIntLit:
+    if c.env.isNil:
+      idToStr(result, n.number, "<UInt: ")
+    else:
+      result.addTypedNumber(c.env[].getInt(n.number), n.typ)
+  of mnkFloatLit:
+    if c.env.isNil:
+      idToStr(result, n.number, "<Float: ")
+    else:
+      result.addTypedNumber(c.env[].getInt(n.number), n.typ)
   of mnkStrLit:
     if c.env.isNil:
       result.add "<Str: "
@@ -189,6 +235,10 @@ proc singleToStr(n: MirNode, result: var string, c: RenderCtx) =
       result.add ">"
     else:
       result.addQuoted c.env[][n.strVal]
+  of mnkAstLit:
+    # could also be pretty-printed, but, given the sparse usage, doesn't
+    # warrant the extra effort at the moment
+    result.add "<Ast>"
   of mnkType:
     result.add "type("
     result.add $n.typ
diff --git a/compiler/sem/aliasanalysis.nim b/compiler/sem/aliasanalysis.nim
index d5a35935e7b..cc1a82646b8 100644
--- a/compiler/sem/aliasanalysis.nim
+++ b/compiler/sem/aliasanalysis.nim
@@ -84,10 +84,10 @@ func isSameRoot(an, bn: MirNode): bool =
     unreachable(an.kind)
 
 func sameIndex*(a, b: MirNode): Ternary =
-  if a.kind != b.kind or a.kind != mnkLiteral:
+  if a.kind != b.kind or a.kind notin {mnkIntLit, mnkUIntLit}:
     maybe
   else:
-    if a.lit.intVal == b.lit.intVal:
+    if a.number == b.number:
       yes
     else:
       no
diff --git a/compiler/vm/compilerbridge.nim b/compiler/vm/compilerbridge.nim
index ccfa37e0c82..249f7113029 100644
--- a/compiler/vm/compilerbridge.nim
+++ b/compiler/vm/compilerbridge.nim
@@ -27,6 +27,10 @@ import
     msgs,
     options
   ],
+  compiler/mir/[
+    mirenv,
+    mirtrees
+  ],
   compiler/modules/[
     modulegraphs
   ],
@@ -126,17 +130,17 @@ proc putIntoReg(dest: var TFullReg; jit: var JitState, c: var TCtx, n: PNode,
   case typ.kind
   of akInt:
     dest.ensureKind(rkInt, c.memory)
-    dest.intVal = data[0].lit.intVal
+    dest.intVal = jit.env.getInt(data[0].number)
   of akFloat:
     dest.ensureKind(rkFloat, c.memory)
-    dest.floatVal = data[0].lit.floatVal
+    dest.floatVal = jit.env.getFloat(data[0].number)
   of akPtr:
     dest.ensureKind(rkAddress, c.memory)
     # non-nil values should have already been reported as an error
-    assert data[0].lit.kind == nkNilLit
+    assert data[0].kind == mnkNilLit
   of akPNode:
     dest.ensureKind(rkNimNode, c.memory)
-    dest.nimNode = data[0].lit
+    dest.nimNode = jit.env[data[0].ast]
   else:
     dest.initLocReg(typ, c.memory)
     initFromExpr(dest.handle, data, jit.env, c)
diff --git a/compiler/vm/packed_env.nim b/compiler/vm/packed_env.nim
index 4cae4cab4dc..4ab0160344a 100644
--- a/compiler/vm/packed_env.nim
+++ b/compiler/vm/packed_env.nim
@@ -196,10 +196,6 @@ type
     i: int ## the index in `PackedEnv.nodes` where the next item is to be stored
 
 const
-  EmbeddedUInts = {nkCharLit, nkUInt8Lit..nkUInt32Lit}
-  EmbeddedInts = {nkInt8Lit..nkInt32Lit} # these also fit into a `uint32`
-  ExternalInts = {nkIntLit, nkInt64Lit, nkUIntLit, nkUInt64Lit}
-
   NilSymId = -1.SymId
   NilTypeId = -1.TypeId
 
@@ -259,6 +255,15 @@ func getLitId(e: var PackedEnv, x: BiggestInt): LitId {.inline.} =
 func getLitId(e: var PackedEnv, x: BiggestFloat): LitId {.inline.} =
   e.numbers.getOrIncl(cast[BiggestInt](x))
 
+func getInt(e: PackedEnv, n: MirNode): Int128 =
+  case n.kind
+  of mnkIntLit:
+    toInt128 e.numbers[n.number.LitId]
+  of mnkUIntLit:
+    toInt128 cast[BiggestUInt](e.numbers[n.number.LitId])
+  else:
+    unreachable()
+
 # -------- data storing --------------------------------------------------
 
 func startEncoding*(enc: var DataEncoder, e: PackedEnv) {.inline.} =
@@ -269,14 +274,6 @@ func put(enc: var DataEncoder, e: var PackedEnv,
   e.nodes[enc.i] = d
   inc enc.i
 
-func putLater(enc: var DataEncoder): int {.inline.} =
-  result = enc.i
-  inc enc.i
-
-func setAt(enc: var DataEncoder, e: var PackedEnv, i: int,
-           d: sink PackedDataNode) {.inline.} =
-  e.nodes[i] = d
-
 func storeDataNode(enc: var DataEncoder, e: var PackedEnv,
                    t: MirTree, n: NodePosition)
   ## Stores in `e.nodes` the data represented by the MIR constant expression
@@ -284,10 +281,10 @@ func storeDataNode(enc: var DataEncoder, e: var PackedEnv,
   ## allocated in `e.nodes` for the top data-node. Space allocation for the
   ## sub-data-nodes is handled by ``storeData``.
 
-func storeDiscrData(enc: var DataEncoder, e: var PackedEnv, s: PSym, v: PNode) =
+func storeDiscrData(enc: var DataEncoder, e: var PackedEnv, s: PSym, v: Int128) =
   let
     recCase = findRecCase(s.owner.typ, s)
-    b = findMatchingBranch(recCase, getInt(v))
+    b = findMatchingBranch(recCase, v)
   assert b != -1
   # We don't have access to vm type information here, so 32 is always
   # used for `numBits`. This is safe, since the both `value` and `index`
@@ -295,7 +292,7 @@ func storeDiscrData(enc: var DataEncoder, e: var PackedEnv, s: PSym, v: PNode) =
   # of repacking the discriminator with the correct `numBits`
   # XXX: 16 could be safely used for `numBits` and then the resulting
   #      value could be stored as a `pdkIntLit`
-  let val = packDiscr(v.intVal, b, numBits = 32)
+  let val = packDiscr(v.toInt, b, numBits = 32)
   enc.put e, PackedDataNode(kind: pdkInt, pos: e.getLitId(val).uint32)
 
 proc storeFieldsData(enc: var DataEncoder, e: var PackedEnv,
@@ -317,7 +314,7 @@ proc storeFieldsData(enc: var DataEncoder, e: var PackedEnv,
     if sfDiscriminant notin s.flags:
       enc.storeDataNode(e, t, n+1)
     else:
-      enc.storeDiscrData(e, s, t[n+1].lit)
+      enc.storeDiscrData(e, s, e.getInt(t[n+1]))
 
     n = t.sibling(n) # move the cursor to the next field
 
@@ -354,52 +351,43 @@ proc storeSetData(enc: var DataEncoder, e: var PackedEnv,
   enc.put e, PackedDataNode(kind: pdkSet, pos: count.uint32 * 2)
   e.nodes.growBy(count * 2) # make space for the content
 
-  proc adjusted(enc: DataEncoder, n: MirNode, typ: PType): uint32 =
+  template adjusted(n: MirNode, typ: PType): uint32 =
     # make the range start at zero
-    toUInt32(getInt(n.lit) - firstOrd(enc.config, typ))
+    toUInt32(e.getInt(n) - firstOrd(enc.config, typ))
 
   var n = n + 1
   # bitsets only store values in the range 0..high(uint16), so the values can
   # be stored directly
   for _ in 0..<count:
     if t[n].kind == mnkRange:
-      enc.put e, PackedDataNode(kind: pdkIntLit, pos: adjusted(enc, t[n + 1], typ))
-      enc.put e, PackedDataNode(kind: pdkIntLit, pos: adjusted(enc, t[n + 2], typ))
+      enc.put e, PackedDataNode(kind: pdkIntLit, pos: adjusted(t[n + 1], typ))
+      enc.put e, PackedDataNode(kind: pdkIntLit, pos: adjusted(t[n + 2], typ))
     else:
-      let d = PackedDataNode(kind: pdkIntLit, pos: adjusted(enc, t[n], typ))
+      let d = PackedDataNode(kind: pdkIntLit, pos: adjusted(t[n], typ))
       enc.put e, d
       enc.put e, d
 
     n = t.sibling(n)
 
-func storeLiteral(enc: var DataEncoder, e: var PackedEnv, n: PNode) =
-  let dstIdx = enc.putLater()
-  let (kind, item) =
-    case n.kind
-    of EmbeddedUInts: (pdkIntLit, n.intVal.uint32)
-    of EmbeddedInts:  (pdkIntLit, cast[uint32](n.intVal))
-    of ExternalInts:  (pdkInt,    e.getLitId(n.intVal).uint32)
-    of nkFloatKinds:  (pdkFloat,  e.getLitId(n.floatVal).uint32)
-    of nkNilLit:
-      if n.typ.skipTypes(abstractInst).callConv == ccClosure:
-        # XXX: some unexpanded `nil` closure literals reach here, so we have
-        #      to expand them here. This needs to happen earlier
-        e.nodes.growBy(4)
-        enc.put e, PackedDataNode(kind: pdkField, pos: 0)
-        enc.put e, PackedDataNode(kind: pdkPtr, pos: 0)
-        enc.put e, PackedDataNode(kind: pdkField, pos: 0)
-        enc.put e, PackedDataNode(kind: pdkPtr, pos: 0)
-        (pdkObj, 2'u32)
-      else:
-        (pdkPtr, 0'u32)
-    else:             unreachable(n.kind)
-  enc.setAt e, dstIdx, PackedDataNode(kind: kind, pos: item)
-
 func storeDataNode(enc: var DataEncoder, e: var PackedEnv,
                    t: MirTree, n: NodePosition) =
   case t[n].kind
-  of mnkLiteral:
-    storeLiteral(enc, e, t[n].lit)
+  of mnkNilLit:
+    if t[n].typ.skipTypes(abstractInst).callConv == ccClosure:
+      # XXX: some unexpanded `nil` closure literals reach here, so we have
+      #      to expand them here. This needs to happen earlier
+      enc.put e, PackedDataNode(kind: pdkObj, pos: 2)
+      e.nodes.growBy(4)
+      enc.put e, PackedDataNode(kind: pdkField, pos: 0)
+      enc.put e, PackedDataNode(kind: pdkPtr, pos: 0)
+      enc.put e, PackedDataNode(kind: pdkField, pos: 0)
+      enc.put e, PackedDataNode(kind: pdkPtr, pos: 0)
+    else:
+      enc.put e, PackedDataNode(kind: pdkPtr, pos: 0)
+  of mnkIntLit, mnkUIntLit:
+    enc.put e, PackedDataNode(kind: pdkInt, pos: t[n].number.uint32)
+  of mnkFloatLit:
+    enc.put e, PackedDataNode(kind: pdkFloat, pos: t[n].number.uint32)
   of mnkStrLit:
     # the ID indexes into the string BiTable, it can be packed directly
     enc.put e, PackedDataNode(kind: pdkString, pos: t[n].strVal.uint32)
diff --git a/compiler/vm/vmbackend.nim b/compiler/vm/vmbackend.nim
index 8351982f907..b74ed810cce 100644
--- a/compiler/vm/vmbackend.nim
+++ b/compiler/vm/vmbackend.nim
@@ -308,7 +308,8 @@ proc generateCode*(g: ModuleGraph, mlist: sink ModuleList) =
   # pack the data and write it to the ouput file:
   var
     enc: PackedEncoder
-    penv = PackedEnv(strings: move c.gen.env.strings)
+    penv = PackedEnv(numbers: move c.gen.env.numbers,
+                     strings: move c.gen.env.strings)
 
   enc.init(env.types)
   storeEnv(enc, penv, env)
diff --git a/compiler/vm/vmserialize.nim b/compiler/vm/vmserialize.nim
index 09087968c42..be51f79dcc7 100644
--- a/compiler/vm/vmserialize.nim
+++ b/compiler/vm/vmserialize.nim
@@ -28,6 +28,12 @@ import
     int128
   ]
 
+proc getInt(env: MirEnv, n: MirNode): Int128 =
+  case n.kind
+  of mnkIntLit:  env.getInt(n.number).toInt128
+  of mnkUIntLit: env.getUInt(n.number).toInt128
+  else:          unreachable(n.kind)
+
 proc initFromExpr(dest: LocHandle, tree: MirTree, n: var int, env: MirEnv,
                   c: var TCtx) =
   ## Loads the value represented by `tree` at `n` into `dest`. On exit, `n`
@@ -53,15 +59,15 @@ proc initFromExpr(dest: LocHandle, tree: MirTree, n: var int, env: MirEnv,
 
   case dest.typ.kind
   of akInt:
-    writeUInt(dest, next().lit.intVal)
+    writeUInt(dest, env.getInt(next().number))
   of akDiscriminator:
     # handled during object processing below
     unreachable("cannot be written directly")
   of akFloat:
     if dest.typ.sizeInBytes == 4:
-      writeFloat32(dest, float32(next().lit.floatVal))
+      writeFloat32(dest, float32(env.getFloat(next().number)))
     else:
-      writeFloat64(dest, float64(next().lit.floatVal))
+      writeFloat64(dest, float64(env.getFloat(next().number)))
   of akString:
     deref(dest).strVal.newVmString(env[next().strVal], c.allocator)
   of akSeq:
@@ -76,7 +82,7 @@ proc initFromExpr(dest: LocHandle, tree: MirTree, n: var int, env: MirEnv,
     # nothing to do, only nil literals are allowed here
     discard next()
   of akRef:
-    if tree[n].kind == mnkLiteral:
+    if tree[n].kind == mnkNilLit:
       discard next() # nothing to do for 'nil' literals
     else:
       # allocate a managed heap location and fill it:
@@ -86,9 +92,9 @@ proc initFromExpr(dest: LocHandle, tree: MirTree, n: var int, env: MirEnv,
       recurse(c.heap.unsafeDeref(slot))
       deref(dest).refVal = slot
   of akSet:
-    proc adjusted(n: PNode, first: Int128): BiggestInt {.inline.} =
+    proc adjusted(val, first: Int128): BiggestInt {.inline.} =
       # subtract the first element's value to make all values zero-based
-      toInt(getInt(n) - first)
+      toInt(val - first)
 
     let first =
       if tree[n].len > 0: firstOrd(c.config, tree[n].typ)
@@ -99,22 +105,21 @@ proc initFromExpr(dest: LocHandle, tree: MirTree, n: var int, env: MirEnv,
       let node = next()
       if node.kind == mnkRange:
         let
-          a = adjusted(next().lit, first)
-          b = adjusted(next().lit, first)
+          a = adjusted(env.getInt(next()), first)
+          b = adjusted(env.getInt(next()), first)
         bitSetInclRange(mbitSet(dest), a .. b)
         inc n # skip the end node
       else:
-        bitSetIncl(mbitSet(dest), adjusted(node.lit, first))
+        bitSetIncl(mbitSet(dest), adjusted(env.getInt(node), first))
   of akPNode:
-    deref(dest).nodeVal = next().lit[0]
+    deref(dest).nodeVal = env[next().ast]
   of akCallable:
     deref(dest).callableVal = toFuncPtr FunctionIndex(next().prc)
   of akObject:
     # the source can either be an object or tuple constructor
     case tree[n].kind
-    of mnkLiteral:
+    of mnkNilLit:
       # special case: nil closure literal
-      assert tree[n].lit.kind == nkNilLit
       # only skip the node, don't initialize anything
       discard next()
     of mnkTupleConstr, mnkClosureConstr:
@@ -131,7 +136,7 @@ proc initFromExpr(dest: LocHandle, tree: MirTree, n: var int, env: MirEnv,
           let (owner, idx) = getFieldAndOwner(dest.typ, fpos sym.position)
           # fetch the integer value:
           var val: Int128
-          arg (;val = getInt(next().lit))
+          arg (;val = env.getInt(next()))
           # compute the branch index:
           let b = findMatchingBranch(findRecCase(typ, sym), val)
           # write the tag value to the location:
diff --git a/tests/compiler/tdatatables.nim b/tests/compiler/tdatatables.nim
index 63fb970d2a9..f875c0a275e 100644
--- a/tests/compiler/tdatatables.nim
+++ b/tests/compiler/tdatatables.nim
@@ -20,8 +20,8 @@ template node(k: MirNodeKind, field, val: untyped): MirNode =
   MirNode(kind: k, field: val)
 template node(k: MirNodeKind): MirNode =
   MirNode(kind: k)
-template literal(val: PNode): MirNode =
-  MirNode(kind: mnkLiteral, lit: val)
+template literal(val: NumberId): MirNode =
+  MirNode(kind: mnkIntLit, number: val)
 
 block tree_equality:
   # the type is only relevant for the head of the tree (the first node)
@@ -29,23 +29,24 @@ block tree_equality:
   # setup a list of structurally valid and unique (in terms of equality) trees
   let trees = @[
     # --- literals
-    @[node(mnkLiteral, t1, lit, newIntNode(nkIntLit, 0))],
-    @[node(mnkLiteral, t2, lit, newIntNode(nkIntLit, 0))],
-    @[node(mnkLiteral, t1, lit, newStrNode(nkStrLit, ""))],
-    @[node(mnkLiteral, t1, lit, newStrNode(nkStrLit, "a"))],
-    @[node(mnkLiteral, t1, lit, newFloatNode(nkFloatLit, 0.0))],
-    # 0.0 and -0.0 are different float values
-    @[node(mnkLiteral, t1, lit, newFloatNode(nkFloatLit, -0.0))],
+    @[node(mnkIntLit, t1, number, NumberId 0)],
+    @[node(mnkIntLit, t2, number, NumberId 0)],
+    @[node(mnkUIntLit, t1, number, NumberId 0)],
+    @[node(mnkUIntLit, t2, number, NumberId 0)],
+    @[node(mnkStrLit, t1, strVal, StringId 0)],
+    @[node(mnkStrLit, t1, strVal, StringId 1)],
+    @[node(mnkFloatLit, t1, number, NumberId 0)],
+    @[node(mnkFloatLit, t2, number, NumberId 0)],
 
     # --- ordered aggregates
     @[node(mnkTupleConstr, t1, len, 0), node(mnkEnd)],
     @[node(mnkTupleConstr, t2, len, 0), node(mnkEnd)],
     @[node(mnkTupleConstr, t1, len, 1),
-        node(mnkArg), literal(newIntNode(nkIntLit, 0)),
+        node(mnkArg), literal(NumberId 0),
       node(mnkEnd)],
     @[node(mnkTupleConstr, t1, len, 2),
-        node(mnkArg), literal(newIntNode(nkIntLit, 0)), node(mnkEnd),
-        node(mnkArg), literal(newIntNode(nkIntLit, 0)), node(mnkEnd),
+        node(mnkArg), literal(NumberId 0), node(mnkEnd),
+        node(mnkArg), literal(NumberId 0), node(mnkEnd),
       node(mnkEnd)],
 
     # --- aggregates with fields
@@ -53,25 +54,25 @@ block tree_equality:
     @[node(mnkObjConstr, t2, len, 0), node(mnkEnd)],
     @[node(mnkObjConstr, t1, len, 1),
         node(mnkField, field, 0),
-        node(mnkArg), literal(newIntNode(nkIntLit, 0)), node(mnkEnd),
+        node(mnkArg), literal(NumberId 0), node(mnkEnd),
       node(mnkEnd)],
     # same field value, different field:
     @[node(mnkObjConstr, t1, len, 1),
         node(mnkField, field, 1),
-        node(mnkArg), literal(newIntNode(nkIntLit, 0)), node(mnkEnd),
+        node(mnkArg), literal(NumberId 0), node(mnkEnd),
       node(mnkEnd)],
     @[node(mnkObjConstr, t1, len, 1),
         node(mnkField, field, 0),
-        node(mnkArg), literal(newIntNode(nkIntLit, 0)), node(mnkEnd),
+        node(mnkArg), literal(NumberId 0), node(mnkEnd),
         node(mnkField, field, 1),
-        node(mnkArg), literal(newIntNode(nkIntLit, 0)), node(mnkEnd),
+        node(mnkArg), literal(NumberId 0), node(mnkEnd),
       node(mnkEnd)],
     # swapped fields
     @[node(mnkObjConstr, t1, len, 1),
         node(mnkField, field, 1),
-        node(mnkArg), literal(newIntNode(nkIntLit, 0)), node(mnkEnd),
+        node(mnkArg), literal(NumberId 0), node(mnkEnd),
         node(mnkField, field, 0),
-        node(mnkArg), literal(newIntNode(nkIntLit, 0)), node(mnkEnd),
+        node(mnkArg), literal(NumberId 0), node(mnkEnd),
       node(mnkEnd)]
   ]
 
diff --git a/tests/compilerapi/tcompilerapi.nim b/tests/compilerapi/tcompilerapi.nim
index 517374930de..e3100f44654 100644
--- a/tests/compilerapi/tcompilerapi.nim
+++ b/tests/compilerapi/tcompilerapi.nim
@@ -57,6 +57,9 @@ proc vmReport(config: ConfigRef, report: Report): TErrorHandling {.gcsafe.} =
   elif report.kind == rintEchoMessage:
     echo report.internalReport.msg
 
+proc newFloatTypeNode(val: float, typ: PType): PNode =
+  result = newFloatNode(nkFloatLit, val)
+  result.typ = typ
 
 proc main() =
   let i = initInterpreter("myscript.nim", vmReport)
@@ -67,8 +70,9 @@ proc main() =
   let foreignProc = i.selectRoutine("hostProgramRunsThis")
   if foreignProc == nil:
     quit "script does not export a proc of the name: 'hostProgramRunsThis'"
-  let res = i.callRoutine(foreignProc, [newFloatNode(nkFloatLit, 0.9),
-                                        newFloatNode(nkFloatLit, 0.1)])
+  let typ = foreignProc.typ[1]
+  let res = i.callRoutine(foreignProc, [newFloatTypeNode(0.9, typ),
+                                        newFloatTypeNode(0.1, typ)])
   doAssert res.kind == nkFloatLit
   echo res.floatVal
 

From 0b144dfc6c15c49dd379b4d7f170a04dffc57d7d Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Mon, 8 Apr 2024 00:03:07 +0200
Subject: [PATCH 059/169] cgen: simpler `openArray` parameter handling (#1271)

## Summary

Handle the special treatment of `openArray` types when emitting
parameter declarations, and remove the `kind` parameter from
`cgen.getTypeDesc` and friends.

## Details

When requesting the type name/description for an `openArray[T]` type in
a parameter position, the `openArray[T]` type was effectively treated
as a `ptr T`. The relevant logic was in `mapType` and
`getOpenArrayDesc`, with the `kind` parameter providing the context
necessary for deciding how to interpret `openArray`.

Not only is this error-prone (e.g., when passing the wrong `TSymKind`),
it's also unnecessarily complex. Requesting the element type in
`genProcParams` and then appending the pointer specification (`*`)
achieves the same.

The `kind` parameter is removed from `getTypeDesc` and friends, and
`tyOpenArray` types are always committed to the type cache (which was
previously not possible). In addition, the extra `Len` parameter that
was emitted for each nested `openArray` type (e.g.,
`openArray[openArray[T]]`) is no longer emitted -- these extra
parameters are not accounted for anywhere else.
---
 compiler/backend/ccgexprs.nim |  16 ++--
 compiler/backend/ccgtypes.nim | 139 ++++++++++++++++------------------
 compiler/backend/cgen.nim     |  64 +++-------------
 3 files changed, 84 insertions(+), 135 deletions(-)

diff --git a/compiler/backend/ccgexprs.nim b/compiler/backend/ccgexprs.nim
index c48ddd6484e..55569fb331f 100644
--- a/compiler/backend/ccgexprs.nim
+++ b/compiler/backend/ccgexprs.nim
@@ -146,7 +146,7 @@ proc genOpenArrayConv(p: BProc; d: TLoc; a: TLoc) =
 proc genAssignment(p: BProc, dest, src: TLoc) =
   # This function replaces all other methods for generating
   # the assignment operation in C.
-  case mapType(p.config, dest.t, skVar)
+  case mapType(p.config, dest.t)
   of ctChar, ctBool, ctInt, ctInt8, ctInt16, ctInt32, ctInt64,
      ctFloat, ctFloat32, ctFloat64,
      ctUInt, ctUInt8, ctUInt16, ctUInt32, ctUInt64,
@@ -465,7 +465,7 @@ proc unaryArith(p: BProc, e, x: CgNode, d: var TLoc, op: TMagic) =
 proc genDeref(p: BProc, e: CgNode, d: var TLoc) =
   let
     src = e.operand
-    mt = mapType(p.config, src.typ, mapTypeChooser(p, src))
+    mt = mapType(p.config, src.typ)
   if mt in {ctArray, ctPtrToArray} and lfEnforceDeref notin d.flags:
     # XXX the amount of hacks for C's arrays is incredible, maybe we should
     # simply wrap them in a struct? --> Losing auto vectorization then?
@@ -503,11 +503,11 @@ proc genDeref(p: BProc, e: CgNode, d: var TLoc) =
     else:
       # in C89, dereferencing a pointer requires a pointer to complete type.
       # Make sure that the element type is fully defined by querying its name:
-      discard getTypeDesc(p.module, e.typ, skVar)
+      discard getTypeDesc(p.module, e.typ)
       putIntoDest(p, d, e, "(*$1)" % [rdLoc(a)], a.storage)
 
 proc genAddr(p: BProc, e: CgNode, mutate: bool, d: var TLoc) =
-  if mapType(p.config, e.operand.typ, mapTypeChooser(p, e.operand)) == ctArray:
+  if mapType(p.config, e.operand.typ) == ctArray:
     expr(p, e.operand, d)
   else:
     var a: TLoc
@@ -1681,10 +1681,10 @@ proc genMagicExpr(p: BProc, e: CgNode, d: var TLoc, op: TMagic) =
   of mNewSeqOfCap: genNewSeqOfCap(p, e, d)
   of mSizeOf:
     let t = e[1].typ.skipTypes({tyTypeDesc})
-    putIntoDest(p, d, e, "((NI)sizeof($1))" % [getTypeDesc(p.module, t, skVar)])
+    putIntoDest(p, d, e, "((NI)sizeof($1))" % [getTypeDesc(p.module, t)])
   of mAlignOf:
     let t = e[1].typ.skipTypes({tyTypeDesc})
-    putIntoDest(p, d, e, "((NI)NIM_ALIGNOF($1))" % [getTypeDesc(p.module, t, skVar)])
+    putIntoDest(p, d, e, "((NI)NIM_ALIGNOF($1))" % [getTypeDesc(p.module, t)])
   of mOffsetOf:
     var dotExpr: CgNode
     case e[1].kind
@@ -1693,7 +1693,7 @@ proc genMagicExpr(p: BProc, e: CgNode, d: var TLoc, op: TMagic) =
     else:
       internalError(p.config, e.info, "unknown ast")
     let t = dotExpr[0].typ.skipTypes({tyTypeDesc})
-    let tname = getTypeDesc(p.module, t, skVar)
+    let tname = getTypeDesc(p.module, t)
     let member =
       if dotExpr.kind == cnkTupleAccess:
         "Field" & rope(dotExpr[1].intVal)
@@ -1964,7 +1964,7 @@ proc useConst*(m: BModule; id: ConstId) =
   # one the constant is part of
   if q != m and not containsOrIncl(m.declaredThings, sym.id):
     let headerDecl = "extern NIM_CONST $1 $2;$n" %
-        [getTypeDesc(m, sym.typ, skVar), q.consts[id].r]
+        [getTypeDesc(m, sym.typ), q.consts[id].r]
     m.s[cfsData].add(headerDecl)
 
 proc genConstDefinition*(q: BModule; id: ConstId) =
diff --git a/compiler/backend/ccgtypes.nim b/compiler/backend/ccgtypes.nim
index bc6966efb1f..cbadf38337f 100644
--- a/compiler/backend/ccgtypes.nim
+++ b/compiler/backend/ccgtypes.nim
@@ -109,7 +109,7 @@ proc mapSetType(conf: ConfigRef; typ: PType): TCTypeKind =
   of 8: result = ctInt64
   else: result = ctArray
 
-proc mapType(conf: ConfigRef; typ: PType; kind: TSymKind): TCTypeKind =
+proc mapType(conf: ConfigRef; typ: PType): TCTypeKind =
   ## Maps a Nim type to a C type
   case typ.kind
   of tyNone, tyTyped: result = ctVoid
@@ -118,24 +118,22 @@ proc mapType(conf: ConfigRef; typ: PType; kind: TSymKind): TCTypeKind =
   of tyNil: result = ctPtr
   of tySet: result = mapSetType(conf, typ)
   of tyOpenArray, tyVarargs:
-    if kind == skParam: result = ctArray
-    else: result = ctNimOpenArray
+    result = ctNimOpenArray
   of tyArray, tyUncheckedArray: result = ctArray
   of tyObject, tyTuple: result = ctStruct
   of tyUserTypeClasses:
     doAssert typ.isResolvedUserTypeClass
-    return mapType(conf, typ.lastSon, kind)
+    return mapType(conf, typ.lastSon)
   of tyGenericBody, tyGenericInst, tyGenericParam, tyDistinct, tyOrdinal,
      tyTypeDesc, tyAlias, tySink, tyInferred, tyEnum:
-    result = mapType(conf, lastSon(typ), kind)
-  of tyRange: result = mapType(conf, typ[0], kind)
+    result = mapType(conf, lastSon(typ))
+  of tyRange: result = mapType(conf, typ[0])
   of tyPtr, tyVar, tyLent, tyRef:
     var base = skipTypes(typ.lastSon, typedescInst)
     case base.kind
     of tyArray, tyUncheckedArray: result = ctPtrToArray
     of tyOpenArray, tyVarargs:
-      if kind == skParam: result = ctPtrToArray
-      else:               result = ctNimOpenArray
+      result = ctNimOpenArray
     of tySet:
       if mapSetType(conf, base) == ctArray: result = ctPtrToArray
       else: result = ctPtr
@@ -148,19 +146,19 @@ proc mapType(conf: ConfigRef; typ: PType; kind: TSymKind): TCTypeKind =
   of tyInt..tyUInt64:
     result = TCTypeKind(ord(typ.kind) - ord(tyInt) + ord(ctInt))
   of tyStatic:
-    if typ.n != nil: result = mapType(conf, lastSon typ, kind)
+    if typ.n != nil: result = mapType(conf, lastSon typ)
     else: doAssert(false, "mapType: " & $typ.kind)
   else: doAssert(false, "mapType: " & $typ.kind)
 
 proc mapReturnType(conf: ConfigRef; typ: PType): TCTypeKind =
   #if skipTypes(typ, typedescInst).kind == tyArray: result = ctPtr
   #else:
-  result = mapType(conf, typ, skResult)
+  result = mapType(conf, typ)
 
 proc isImportedType(t: PType): bool =
   result = t.sym != nil and sfImportc in t.sym.flags
 
-proc getTypeDescAux(m: BModule, origTyp: PType, check: var IntSet; kind: TSymKind): Rope
+proc getTypeDescAux(m: BModule, origTyp: PType, check: var IntSet): Rope
 
 proc isInvalidReturnType(conf: ConfigRef; rettype: PType): bool =
   # Arrays and sets cannot be returned by a C procedure, because C is
@@ -169,7 +167,7 @@ proc isInvalidReturnType(conf: ConfigRef; rettype: PType): bool =
   # keep synchronized with ``mirpasses.eligibleForRvo``
   if rettype == nil: result = true
   else:
-    case mapType(conf, rettype, skResult)
+    case mapType(conf, rettype)
     of ctArray:
       result = not (skipTypes(rettype, typedescInst).kind in
           {tyVar, tyLent, tyRef, tyPtr})
@@ -287,7 +285,7 @@ proc getTypeForward(m: BModule, typ: PType; sig: SigHash): Rope =
     doAssert m.forwTypeCache[sig] == result
   else: internalError(m.config, "getTypeForward(" & $typ.kind & ')')
 
-proc getTypeDescWeak(m: BModule; t: PType; check: var IntSet; kind: TSymKind): Rope =
+proc getTypeDescWeak(m: BModule; t: PType; check: var IntSet): Rope =
   ## like getTypeDescAux but creates only a *weak* dependency. In other words
   ## we know we only need a pointer to it so we only generate a struct forward
   ## declaration:
@@ -320,18 +318,18 @@ proc getTypeDescWeak(m: BModule; t: PType; check: var IntSet; kind: TSymKind): R
 
       pushType(m, t)
   else:
-    result = getTypeDescAux(m, t, check, kind)
+    result = getTypeDescAux(m, t, check)
 
 proc getSeqPayloadType(m: BModule; t: PType): Rope =
   var check = initIntSet()
-  result = getTypeDescWeak(m, t, check, skParam) & "_Content"
+  result = getTypeDescWeak(m, t, check) & "_Content"
   #result = getTypeForward(m, t, hashType(t)) & "_Content"
 
 proc seqV2ContentType(m: BModule; t: PType; check: var IntSet) =
   let sig = hashType(t)
   let result = cacheGetType(m.typeCache, sig)
   if result == "":
-    discard getTypeDescAux(m, t, check, skVar)
+    discard getTypeDescAux(m, t, check)
   else:
     # little hack for now to prevent multiple definitions of the same
     # Seq_Content:
@@ -340,7 +338,7 @@ $3ifndef $2_Content_PP
 $3define $2_Content_PP
 struct $2_Content { NI cap; $1 data[SEQ_DECL_SIZE];};
 $3endif$N
-      """, [getTypeDescAux(m, t.skipTypes(abstractInst)[0], check, skVar), result, rope"#"])
+      """, [getTypeDescAux(m, t.skipTypes(abstractInst)[0], check), result, rope"#"])
 
 proc prepareParameters(m: BModule, t: PType): seq[TLoc] =
   ## Sets up and returns the locs of the parameter symbols for procedure
@@ -361,7 +359,7 @@ proc prepareParameters(m: BModule, t: PType): seq[TLoc] =
       continue
 
     let storage =
-      if mapType(m.config, param.typ.skipTypes({tyVar, tyLent}), skParam) == ctArray:
+      if mapType(m.config, param.typ.skipTypes({tyVar, tyLent})) == ctArray:
         # something that's represented as a C array. Since an indirection is
         # involved, we don't know where the location resides
         OnUnknown
@@ -383,40 +381,46 @@ proc genProcParams(m: BModule, t: PType, rettype, params: var Rope,
   if t[0] == nil or isInvalidReturnType(m.config, t[0]):
     rettype = ~"void"
   else:
-    rettype = getTypeDescAux(m, t[0], check, skResult)
+    rettype = getTypeDescAux(m, t[0], check)
   for i in 1..<t.n.len:
     m.config.internalAssert(t.n[i].kind == nkSym, t.n.info, "genProcParams")
     var param = t.n[i].sym
     if locs[i].k == locNone: continue
     if params != "": params.add(~", ")
-    if lfIndirect in locs[i].flags:
-      params.add(getTypeDescWeak(m, param.typ, check, skParam))
+
+    var arr = param.typ.skipTypes({tyGenericInst})
+    if arr.kind in {tyVar, tyLent, tySink}:
+      arr = arr.lastSon
+    let isOpenArray = arr.kind in {tyOpenArray, tyVarargs}
+
+    if isOpenArray:
+      # declare the pointer field for openArray:
+      params.add(getTypeDescWeak(m, arr.base, check))
+      params.add("*")
+    elif lfIndirect in locs[i].flags:
+      params.add(getTypeDescWeak(m, param.typ, check))
       params.add(~"*")
     elif weakDep:
-      params.add(getTypeDescWeak(m, param.typ, check, skParam))
+      params.add(getTypeDescWeak(m, param.typ, check))
     else:
-      params.add(getTypeDescAux(m, param.typ, check, skParam))
+      params.add(getTypeDescAux(m, param.typ, check))
     params.add(~" ")
     if sfNoalias in param.flags:
       params.add(~"NIM_NOALIAS ")
     params.add(locs[i].r)
     # declare the len field for open arrays:
-    var arr = param.typ.skipTypes({tyGenericInst})
-    if arr.kind in {tyVar, tyLent, tySink}: arr = arr.lastSon
-    var j = 0
-    while arr.kind in {tyOpenArray, tyVarargs}:
+    if isOpenArray:
       # need to pass hidden parameter:
-      params.addf(", NI $1Len_$2", [locs[i].r, j.rope])
-      inc(j)
-      arr = arr[0].skipTypes({tySink})
+      params.addf(", NI $1Len_$2", [locs[i].r, 0.rope])
+
   if t[0] != nil and isInvalidReturnType(m.config, t[0]):
     var arr = t[0]
     if params != "": params.add(", ")
     if mapReturnType(m.config, t[0]) != ctArray:
-      params.add(getTypeDescWeak(m, arr, check, skResult))
+      params.add(getTypeDescWeak(m, arr, check))
       params.add("*")
     else:
-      params.add(getTypeDescAux(m, arr, check, skResult))
+      params.add(getTypeDescAux(m, arr, check))
     params.addf(" Result", [])
   if t.callConv == ccClosure and declareEnvironment:
     if params != "": params.add(", ")
@@ -492,17 +496,17 @@ proc genRecordFieldsAux(m: BModule, n: PNode,
     let fieldType = field.typ.skipTypes(abstractInst)
     if fieldType.kind == tyUncheckedArray:
       result.addf("$1 $2[SEQ_DECL_SIZE];$n",
-          [getTypeDescAux(m, fieldType.elemType, check, skField), sname])
+          [getTypeDescAux(m, fieldType.elemType, check), sname])
     elif fieldType.kind == tySequence:
       # we need to use a weak dependency here for trecursive_table.
-      result.addf("$1$3 $2;$n", [getTypeDescWeak(m, field.typ, check, skField), sname, noAlias])
+      result.addf("$1$3 $2;$n", [getTypeDescWeak(m, field.typ, check), sname, noAlias])
     elif field.bitsize != 0:
-      result.addf("$1$4 $2:$3;$n", [getTypeDescAux(m, field.typ, check, skField), sname, rope($field.bitsize), noAlias])
+      result.addf("$1$4 $2:$3;$n", [getTypeDescAux(m, field.typ, check), sname, rope($field.bitsize), noAlias])
     else:
       # TODO: C++ remove
       # don't use fieldType here because we need the
       # tyGenericInst for C++ template support
-      result.addf("$1$3 $2;$n", [getTypeDescAux(m, field.typ, check, skField), sname, noAlias])
+      result.addf("$1$3 $2;$n", [getTypeDescAux(m, field.typ, check), sname, noAlias])
   else: internalError(m.config, n.info, "genRecordFieldsAux()")
 
 proc getRecordFields(m: BModule, typ: PType, check: var IntSet): Rope =
@@ -545,7 +549,7 @@ proc getRecordDesc(m: BModule, typ: PType, name: Rope,
         hasField = true
     else:
       appcg(m, result, " {$n  $1 Sup;$n",
-                      [getTypeDescAux(m, typ[0].skipTypes(skipPtrs), check, skField)])
+                      [getTypeDescAux(m, typ[0].skipTypes(skipPtrs), check)])
       hasField = true
   else:
     result.addf(" {$n", [name])
@@ -565,25 +569,23 @@ proc getTupleDesc(m: BModule, typ: PType, name: Rope,
   var desc = ""
   for i in 0..<typ.len:
     desc.addf("$1 Field$2;$n",
-         [getTypeDescAux(m, typ[i], check, skField), rope(i)])
+         [getTypeDescAux(m, typ[i], check), rope(i)])
   if desc == "": result.add("char dummy;\L")
   else: result.add(desc)
   result.add("};\L")
 
-proc getOpenArrayDesc(m: BModule, t: PType, check: var IntSet; kind: TSymKind): Rope =
+proc getOpenArrayDesc(m: BModule, t: PType, check: var IntSet): Rope =
   let sig = hashType(t)
-  if kind == skParam:
-    result = getTypeDescWeak(m, t[0], check, kind) & "*"
-  else:
+  if true:
     result = cacheGetType(m.typeCache, sig)
     if result == "":
       result = getTypeName(m, t, sig)
       m.typeCache[sig] = result
-      let elemType = getTypeDescWeak(m, t[0], check, kind)
+      let elemType = getTypeDescWeak(m, t[0], check)
       m.s[cfsTypes].addf("typedef struct {$n$2* Field0;$nNI Field1;$n} $1;$n",
                          [result, elemType])
 
-proc getTypeDescAux(m: BModule, origTyp: PType, check: var IntSet; kind: TSymKind): Rope =
+proc getTypeDescAux(m: BModule, origTyp: PType, check: var IntSet): Rope =
   # returns only the type's name
 
   var t = origTyp.skipTypes(irrelevantForBackend)
@@ -601,9 +603,7 @@ proc getTypeDescAux(m: BModule, origTyp: PType, check: var IntSet; kind: TSymKin
       addAbiCheck(m, t, result)
 
   result = getTypePre(m, t, sig)
-  # note: ``openArray`` types map to different C types depending on the
-  # context, so we always re-compute the C type for them
-  if result != "" and t.kind != tyOpenArray:
+  if result != "":
     excl(check, t.id)
     return
   case t.kind
@@ -611,8 +611,7 @@ proc getTypeDescAux(m: BModule, origTyp: PType, check: var IntSet; kind: TSymKin
     let star = "*"
     var et = origTyp.skipTypes(abstractInst).lastSon
     var etB = et.skipTypes(abstractInst)
-    let origBase = etB
-    if mapType(m.config, t, kind) == ctPtrToArray:
+    if mapType(m.config, t) == ctPtrToArray:
       if etB.kind == tySet:
         et = getSysType(m.g.graph, unknownLineInfo, tyUInt8)
       else:
@@ -623,25 +622,17 @@ proc getTypeDescAux(m: BModule, origTyp: PType, check: var IntSet; kind: TSymKin
       # no restriction! We have a forward declaration for structs
       let name = getTypeForward(m, et, hashType et)
       result = name & star
-      m.typeCache[sig] = result
     of tySequence:
-        result = getTypeDescWeak(m, et, check, kind) & star
-        m.typeCache[sig] = result
+        result = getTypeDescWeak(m, et, check) & star
     of tyOpenArray:
-      result = getTypeDescAux(m, etB, check, kind)
+      result = getTypeDescAux(m, etB, check)
     else:
       # else we have a strong dependency  :-(
-      result = getTypeDescAux(m, et, check, kind) & star
-      m.typeCache[sig] = result
+      result = getTypeDescAux(m, et, check) & star
 
-    # HACK: an openArray is mapped to different types depending on what context
-    #       we're in (`kind`). The context is not stored together with the cached
-    #       type, so we force the type to be computed again next time by deleting
-    #       the entry created above
-    if origBase.kind == tyOpenArray:
-      m.typeCache.del(sig)
+    m.typeCache[sig] = result
   of tyOpenArray, tyVarargs:
-    result = getOpenArrayDesc(m, t, check, kind)
+    result = getOpenArrayDesc(m, t, check)
   of tyEnum:
     result = cacheGetType(m.typeCache, sig)
     if result == "":
@@ -649,7 +640,7 @@ proc getTypeDescAux(m: BModule, origTyp: PType, check: var IntSet; kind: TSymKin
       if not (sfImportc in t.sym.flags and t.sym.magic == mNone):
         m.typeCache[sig] = result
         m.s[cfsTypes].addf("typedef $1 $2;$n",
-          [getTypeDescAux(m, t.lastSon, check, skVar), result])
+          [getTypeDescAux(m, t.lastSon, check), result])
         when false:
           let owner = hashOwner(t.sym)
           if not gDebugInfo.hasEnum(t.sym.name.s, t.sym.info.line, owner):
@@ -676,12 +667,12 @@ proc getTypeDescAux(m: BModule, origTyp: PType, check: var IntSet; kind: TSymKin
             "void* ClE_0;$n} $1;$n",
              [result, rettype, desc])
   of tySequence:
-      result = getTypeDescWeak(m, t, check, kind)
+      result = getTypeDescWeak(m, t, check)
   of tyUncheckedArray:
     result = getTypeName(m, origTyp, sig)
     m.typeCache[sig] = result
     if not isImportedType(t):
-      let foo = getTypeDescAux(m, t[0], check, kind)
+      let foo = getTypeDescAux(m, t[0], check)
       m.s[cfsTypes].addf("typedef $1 $2[1];$n", [foo, result])
   of tyArray:
     var n: BiggestInt = toInt64(lengthOrd(m.config, t))
@@ -689,7 +680,7 @@ proc getTypeDescAux(m: BModule, origTyp: PType, check: var IntSet; kind: TSymKin
     result = getTypeName(m, origTyp, sig)
     m.typeCache[sig] = result
     if not isImportedType(t):
-      let foo = getTypeDescAux(m, t[1], check, kind)
+      let foo = getTypeDescAux(m, t[1], check)
       m.s[cfsTypes].addf("typedef $1 $2[$3];$n",
            [foo, result, rope(n)])
   of tyObject, tyTuple:
@@ -720,16 +711,16 @@ proc getTypeDescAux(m: BModule, origTyp: PType, check: var IntSet; kind: TSymKin
              [result, rope(getSize(m.config, t))])
   of tyGenericInst, tyDistinct, tyOrdinal, tyTypeDesc, tyAlias, tySink,
      tyUserTypeClass, tyUserTypeClassInst, tyInferred:
-    result = getTypeDescAux(m, lastSon(t), check, kind)
+    result = getTypeDescAux(m, lastSon(t), check)
   else:
     internalError(m.config, "getTypeDescAux(" & $t.kind & ')')
     result = ""
   # fixes bug #145:
   excl(check, t.id)
 
-proc getTypeDesc(m: BModule, typ: PType; kind = skParam): Rope =
+proc getTypeDesc(m: BModule, typ: PType): Rope =
   var check = initIntSet()
-  result = getTypeDescAux(m, typ, check, kind)
+  result = getTypeDescAux(m, typ, check)
 
 type
   TClosureTypeKind = enum ## In C closures are mapped to 3 different things.
@@ -762,7 +753,7 @@ proc finishTypeDescriptions(m: BModule) =
     if t.skipTypes(abstractInst).kind == tySequence:
       seqV2ContentType(m, t, check)
     else:
-      discard getTypeDescAux(m, t, check, skParam)
+      discard getTypeDescAux(m, t, check)
     inc(i)
   m.typeStack.setLen 0
 
@@ -810,7 +801,7 @@ proc genTypeInfoAuxBase(m: BModule; typ, origType: PType;
   if tfIncompleteStruct in typ.flags:
     size = rope"void*"
   else:
-    size = getTypeDesc(m, origType, skVar)
+    size = getTypeDesc(m, origType)
   m.s[cfsTypeInit3].addf(
     "$1.size = sizeof($2);$n$1.align = NIM_ALIGNOF($2);$n$1.kind = $3;$n$1.base = $4;$n",
     [name, size, rope(nimtypeKind), base]
@@ -890,7 +881,7 @@ proc genObjectFields(m: BModule, typ, origType: PType, n: PNode, expr: Rope;
     m.s[cfsTypeInit3].addf("$1.kind = 3;$n" &
         "$1.offset = offsetof($2, $3);$n" & "$1.typ = $4;$n" &
         "$1.name = $5;$n" & "$1.sons = &$6[0];$n" &
-        "$1.len = $7;$n", [expr, getTypeDesc(m, origType, skVar),
+        "$1.len = $7;$n", [expr, getTypeDesc(m, origType),
                            m.fields[field],
                            genTypeInfoV1(m, field.typ, info),
                            makeCString(field.name.s),
@@ -925,7 +916,7 @@ proc genObjectFields(m: BModule, typ, origType: PType, n: PNode, expr: Rope;
       ensureObjectFields(m, field, typ)
       m.s[cfsTypeInit3].addf("$1.kind = 1;$n" &
           "$1.offset = offsetof($2, $3);$n" & "$1.typ = $4;$n" &
-          "$1.name = $5;$n", [expr, getTypeDesc(m, origType, skVar),
+          "$1.name = $5;$n", [expr, getTypeDesc(m, origType),
           m.fields[field], genTypeInfoV1(m, field.typ, info),
           makeCString(field.name.s)])
   else: internalError(m.config, n.info, "genObjectFields")
@@ -963,7 +954,7 @@ proc genTupleInfo(m: BModule, typ, origType: PType, name: Rope; info: TLineInfo)
           "$1.offset = offsetof($2, Field$3);$n" &
           "$1.typ = $4;$n" &
           "$1.name = \"Field$3\";$n",
-           [tmp2, getTypeDesc(m, origType, skVar), rope(i), genTypeInfoV1(m, a, info)])
+           [tmp2, getTypeDesc(m, origType), rope(i), genTypeInfoV1(m, a, info)])
     m.s[cfsTypeInit3].addf("$1.len = $2; $1.kind = 2; $1.sons = &$3[0];$n",
          [expr, rope(typ.len), tmp])
   else:
diff --git a/compiler/backend/cgen.nim b/compiler/backend/cgen.nim
index 5281810949e..5d1cc9f408e 100644
--- a/compiler/backend/cgen.nim
+++ b/compiler/backend/cgen.nim
@@ -363,55 +363,14 @@ include ccgtypes
 
 # ------------------------------ Manager of temporaries ------------------
 
-func mapTypeChooser(p: BProc, n: CgNode): TSymKind =
-  case n.kind
-  of cnkField:
-    skField
-  of cnkProc:
-    skProc
-  of cnkConst:
-    skConst
-  of cnkGlobal:
-    skVar
-  of cnkLocal:
-    if n.local == resultId:
-      skResult
-    elif p.locals[n.local].k == locParam:
-      skParam
-    else:
-      skVar
-  else:
-    skVar
-
-func mapTypeChooser(a: TLoc): TSymKind =
-  let n = a.lode
-  case n.kind
-  of cnkField:
-    skField
-  of cnkProc:
-    skProc
-  of cnkConst:
-    skConst
-  of cnkGlobal:
-    skVar
-  of cnkLocal:
-    if n.local == resultId:
-      skResult
-    elif a.k == locParam:
-      skParam
-    else:
-      skVar
-  else:
-    skVar
-
 proc addrLoc(conf: ConfigRef; a: TLoc): Rope =
   result = a.r
-  if lfIndirect notin a.flags and mapType(conf, a.t, mapTypeChooser(a)) != ctArray:
+  if lfIndirect notin a.flags and mapType(conf, a.t) != ctArray:
     result = "(&" & result & ")"
 
 proc byRefLoc(p: BProc; a: TLoc): Rope =
   result = a.r
-  if lfIndirect notin a.flags and mapType(p.config, a.t, mapTypeChooser(a)) != ctArray:
+  if lfIndirect notin a.flags and mapType(p.config, a.t) != ctArray:
     result = "(&" & result & ")"
 
 proc rdCharLoc(a: TLoc): Rope =
@@ -471,14 +430,13 @@ proc genObjectInit(p: BProc, section: TCProcSection, t: PType, a: TLoc,
         let tmp = defaultValueExpr(p, objType, a.lode.info)
         linefmt(p, cpsStmts,
             "#nimCopyMem((void*)$1, (NIM_CONST void*)&$2, sizeof($3));$n",
-            [rdLoc(a), rdLoc(tmp), getTypeDesc(p.module, objType, mapTypeChooser(a))])
+            [rdLoc(a), rdLoc(tmp), getTypeDesc(p.module, objType)])
       else:
         let tmp = defaultValueExpr(p, t, a.lode.info)
         genAssignment(p, a, tmp)
 
 proc constructLoc(p: BProc, loc: var TLoc; doInitObj = true) =
-  let kind = mapTypeChooser(loc)
-  case mapType(p.config, loc.t, kind)
+  case mapType(p.config, loc.t)
   of ctChar, ctBool, ctInt, ctInt8, ctInt16, ctInt32, ctInt64,
      ctFloat, ctFloat32, ctFloat64,
      ctUInt, ctUInt8, ctUInt16, ctUInt32, ctUInt64:
@@ -491,7 +449,7 @@ proc constructLoc(p: BProc, loc: var TLoc; doInitObj = true) =
     linefmt(p, cpsStmts, "$1.len = 0; $1.p = NIM_NIL;$n", [rdLoc(loc)])
   of ctArray, ctStruct, ctNimOpenArray:
     linefmt(p, cpsStmts, "#nimZeroMem((void*)$1, sizeof($2));$n",
-            [addrLoc(p.config, loc), getTypeDesc(p.module, loc.t, kind)])
+            [addrLoc(p.config, loc), getTypeDesc(p.module, loc.t)])
 
     if doInitObj:
       genObjectInit(p, cpsStmts, loc.t, loc, constructObj)
@@ -512,7 +470,7 @@ proc initLocalVar(p: BProc, v: LocalId, immediateAsgn: bool) =
 proc getTemp(p: BProc, t: PType, result: var TLoc) =
   inc(p.labels)
   result.r = "T" & rope(p.labels) & "_"
-  linefmt(p, cpsLocals, "$1 $2;$n", [getTypeDesc(p.module, t, skVar), result.r])
+  linefmt(p, cpsLocals, "$1 $2;$n", [getTypeDesc(p.module, t), result.r])
   result.k = locTemp
   result.lode = lodeTyp t
   result.storage = OnStack
@@ -542,7 +500,7 @@ proc localVarDecl(p: BProc; n: CgNode, decl: Local): Rope =
   if decl.alignment > 0:
     result.addf("NIM_ALIGN($1) ", [$decl.alignment])
 
-  result.add getTypeDesc(p.module, decl.typ, skVar)
+  result.add getTypeDesc(p.module, decl.typ)
   if true:
     if sfRegister in decl.flags: result.add(" register")
     if sfVolatile in decl.flags: result.add(" volatile")
@@ -582,7 +540,7 @@ proc defineGlobalVar*(m: BModule, id: GlobalId) =
     if exfNoDecl notin s.extFlags:
       incl(m.declaredThings, s.id)
       var decl = ""
-      var td = getTypeDesc(m, m.globals[id].t, skVar)
+      var td = getTypeDesc(m, m.globals[id].t)
       if true:
         if s.kind in {skLet, skVar, skField, skForVar} and s.alignment > 0:
           decl.addf "NIM_ALIGN($1) ", [rope(s.alignment)]
@@ -674,7 +632,7 @@ proc fillDynlibProcLoc(m: BModule, id: ProcedureId) =
 proc symInDynamicLib*(m: BModule, id: ProcedureId) =
   fillDynlibProcLoc(m, id)
   m.s[cfsVars].addf("$2 $1;$n",
-                    [m.procs[id].name, getTypeDesc(m, m.g.env[id].typ, skVar)])
+                    [m.procs[id].name, getTypeDesc(m, m.g.env[id].typ)])
 
 
 proc varInDynamicLib(m: BModule, id: GlobalId) =
@@ -684,7 +642,7 @@ proc varInDynamicLib(m: BModule, id: GlobalId) =
   incl(m.globals[id].flags, lfIndirect)
   m.globals[id].r = tmp  # from now on we only need the internal name
   m.s[cfsVars].addf("$2* $1;$n",
-      [tmp, getTypeDesc(m, sym.typ, skVar)])
+      [tmp, getTypeDesc(m, sym.typ)])
 
 proc cgsym(m: BModule, name: string): Rope =
   let sym = magicsys.getCompilerProc(m.g.graph, name)
@@ -923,7 +881,7 @@ proc genVarPrototype(m: BModule, id: GlobalId) =
       if sym.kind in {skLet, skVar, skField, skForVar} and sym.alignment > 0:
         m.s[cfsVars].addf "NIM_ALIGN($1) ", [rope(sym.alignment)]
       m.s[cfsVars].add("extern ")
-      m.s[cfsVars].add(getTypeDesc(m, sym.typ, skVar))
+      m.s[cfsVars].add(getTypeDesc(m, sym.typ))
       if exfDynamicLib in sym.extFlags: m.s[cfsVars].add("*")
       if sfRegister in sym.flags: m.s[cfsVars].add(" register")
       if sfVolatile in sym.flags: m.s[cfsVars].add(" volatile")

From b8a4beac54dc40a7d4b4a23c9122f2cc15df710c Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Tue, 9 Apr 2024 19:42:42 +0200
Subject: [PATCH 060/169] cgen: improve code generation for `seq` types (#1272)

## Summary

* only emit a single `seq` payload type definition per C file
* only emit the full C type definition for a `seq` if not used in a
  pointer-like type (e.g.: `ptr seq[T]`, `ref seq[T]`)

Together, these improvements reduce the amount of C code output by the
NimSkull compiler, slightly improving compile times.

## Details

Move the `tySequence` handling from `getTypeDescWeak` to
`getTypeDescAux`, preventing different instances referring to the same
type, or the same instance, being pushed to the type stack multiple
times within a single module.

For each `tySequence` type instance pushed to the type stack, a payload
is emitted. Preventing duplicates was previously deferred to the C
compiler through use of a C pre-processor guard (`#ifndef`). Since the
type instance is now only pushed to the type stack once per module, the
pre-processor guard is unnecessary and thus removed.

In addition, for `ptr seq`, `ref seq`, etc. types, only a forward-
declaration of the sequence type is requested, preventing the full type
and all its dependencies being pulled in.

Finally, the `trecursive_table` test, intended to catch C code
generator bugs with recursive `seq` types, is fixed. Since `p` was
neither used nor exported, the `T` type was never actually processed by
the code generator.
---
 compiler/backend/ccgtypes.nim      | 68 +++++++++++++-----------------
 tests/ccgbugs/trecursive_table.nim |  2 +-
 2 files changed, 31 insertions(+), 39 deletions(-)

diff --git a/compiler/backend/ccgtypes.nim b/compiler/backend/ccgtypes.nim
index cbadf38337f..999d266f41f 100644
--- a/compiler/backend/ccgtypes.nim
+++ b/compiler/backend/ccgtypes.nim
@@ -294,29 +294,6 @@ proc getTypeDescWeak(m: BModule; t: PType; check: var IntSet): Rope =
   of tyObject, tyTuple:
     result = getTypeForward(m, t, hashType(t))
     pushType(m, t)
-  of tySequence:
-      let sig = hashType(t)
-      m.config.internalAssert(skipTypes(etB[0], typedescInst).kind != tyEmpty,
-                              "cannot map the empty seq type to a C type")
-
-      result = cacheGetType(m.forwTypeCache, sig)
-      if result == "":
-        result = getTypeName(m, t, sig)
-        if not isImportedType(t):
-          m.forwTypeCache[sig] = result
-          addForwardStructFormat(m, rope"struct", result)
-          let payload = result & "_Content"
-          addForwardStructFormat(m, rope"struct", payload)
-
-      if cacheGetType(m.typeCache, sig) == "":
-        m.typeCache[sig] = result
-        #echo "adding ", sig, " ", typeToString(t), " ", m.module.name.s
-        appcg(m, m.s[cfsTypes],
-          "struct $1 {$N" &
-          "  NI len; $1_Content* p;$N" &
-          "};$N", [result])
-
-      pushType(m, t)
   else:
     result = getTypeDescAux(m, t, check)
 
@@ -329,16 +306,12 @@ proc seqV2ContentType(m: BModule; t: PType; check: var IntSet) =
   let sig = hashType(t)
   let result = cacheGetType(m.typeCache, sig)
   if result == "":
+    # the struct definition hasn't been emitted yet
     discard getTypeDescAux(m, t, check)
   else:
-    # little hack for now to prevent multiple definitions of the same
-    # Seq_Content:
-    appcg(m, m.s[cfsTypes], """$N
-$3ifndef $2_Content_PP
-$3define $2_Content_PP
-struct $2_Content { NI cap; $1 data[SEQ_DECL_SIZE];};
-$3endif$N
-      """, [getTypeDescAux(m, t.skipTypes(abstractInst)[0], check), result, rope"#"])
+    # emit the payload type:
+    appcg(m, m.s[cfsTypes], "struct $2_Content { NI cap; $1 data[SEQ_DECL_SIZE];};$N",
+          [getTypeDescAux(m, t.skipTypes(abstractInst)[0], check), result])
 
 proc prepareParameters(m: BModule, t: PType): seq[TLoc] =
   ## Sets up and returns the locs of the parameter symbols for procedure
@@ -497,9 +470,6 @@ proc genRecordFieldsAux(m: BModule, n: PNode,
     if fieldType.kind == tyUncheckedArray:
       result.addf("$1 $2[SEQ_DECL_SIZE];$n",
           [getTypeDescAux(m, fieldType.elemType, check), sname])
-    elif fieldType.kind == tySequence:
-      # we need to use a weak dependency here for trecursive_table.
-      result.addf("$1$3 $2;$n", [getTypeDescWeak(m, field.typ, check), sname, noAlias])
     elif field.bitsize != 0:
       result.addf("$1$4 $2:$3;$n", [getTypeDescAux(m, field.typ, check), sname, rope($field.bitsize), noAlias])
     else:
@@ -618,12 +588,10 @@ proc getTypeDescAux(m: BModule, origTyp: PType, check: var IntSet): Rope =
         et = elemType(etB)
       etB = et.skipTypes(abstractInst)
     case etB.kind
-    of tyObject, tyTuple:
+    of tyObject, tyTuple, tySequence:
       # no restriction! We have a forward declaration for structs
       let name = getTypeForward(m, et, hashType et)
       result = name & star
-    of tySequence:
-        result = getTypeDescWeak(m, et, check) & star
     of tyOpenArray:
       result = getTypeDescAux(m, etB, check)
     else:
@@ -667,7 +635,31 @@ proc getTypeDescAux(m: BModule, origTyp: PType, check: var IntSet): Rope =
             "void* ClE_0;$n} $1;$n",
              [result, rettype, desc])
   of tySequence:
-      result = getTypeDescWeak(m, t, check)
+    # a sequence type is two structs underneath: one for the seq itself, and
+    # one for its payload
+    m.config.internalAssert(skipTypes(t[0], typedescInst).kind != tyEmpty,
+                            "cannot map the empty seq type to a C type")
+
+    result = cacheGetType(m.forwTypeCache, sig)
+    if result == "":
+      result = getTypeName(m, origTyp, sig)
+      if not isImportedType(t):
+        m.forwTypeCache[sig] = result
+        addForwardStructFormat(m, structOrUnion(t), result)
+
+    # it's possible that the element type cannot be emitted yet because it
+    # depends on the sequence type (a cyclic type). For this reason, the
+    # payload type is only forward-declared here, and the actual definition
+    # is emitted later
+    addForwardStructFormat(m, structOrUnion(t), result & "_Content")
+    # note: force push the type (by not using ``pushType``)
+    m.typeStack.add origTyp
+
+    m.typeCache[sig] = result
+    appcg(m, m.s[cfsTypes],
+      "struct $1 {$N" &
+      "  NI len; $1_Content* p;$N" &
+      "};$N", [result])
   of tyUncheckedArray:
     result = getTypeName(m, origTyp, sig)
     m.typeCache[sig] = result
diff --git a/tests/ccgbugs/trecursive_table.nim b/tests/ccgbugs/trecursive_table.nim
index 3406a1c31f5..fd9480941c3 100644
--- a/tests/ccgbugs/trecursive_table.nim
+++ b/tests/ccgbugs/trecursive_table.nim
@@ -13,5 +13,5 @@ type
     of eY:
       nil
 
-proc p*(x: Table[string, T]) =
+proc p*(x: Table[string, T]) {.exportc.} =
   discard

From 8e2d4c7ad7d60816cabe0e2df5e16bdabb71ea9d Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Tue, 9 Apr 2024 21:22:59 +0200
Subject: [PATCH 061/169] sem: reduce cascading errors in call expressions
 (#1274)

## Summary

* reduce cascading errors in call expressions when there's one or more
  erroneous argument expressions (especially noticeable with
  `nim check` and `nimsuggest`)
* reduce cascading errors with generic type instantiation expressions
* a macro/template with an `untyped` parameter is no longer ambiguous
  with another macro/template that has a `typed` parameter, when the
  argument has an error

## Details

There was already support for "faux matches", but it stopped working
with the proliferation of `nkError` usage. A "faux match" is a match
during overload resolution that could only work because unknown types
were treated as wildcards.

Upon encountering an erroneous argument, instead of failing the match,
`matchesAux` now continues, with `paramTypesMatchAux` also letting the
error node through. This restores basic faux match support in the case
of errors.

Multiple other changes/fixes are required to make faux matches work
properly for errors:
* the `fauxMatch` field of `TCandidate` wasn't reset by
  `initCandidate`, leading to faux matches carrying over to other
  candidates
* for proper error propagation, `semResolvedCall` needs to wrap error
  matches in a wrapper error
* `semGeneric` needs to account for faux matches, by reporting the
  errors, if any

Special-casing `typed` parameters is no longer needed -- the same
parameter type matching as with other non-`untyped` parameters apply.

### Recovery through `untyped`

So that error-recovery through `untyped` templates/macros continues to
work, `cmpCandidates` always gives a higher weight to non-erroneous
candidates. If both candidates are erroneous, the normal comparison
applies.

This also fixes the overload tie behaviour between `typed` and
`untyped` parameters in the face of errors (refer to
`tuntyped_overload_tie_with_typed_with_error.nim`).

### Ambiguous faux matches

If overload resolution finds two equally well matching candidates, but
both only matched because of errors, `resolveOverloads` doesn't report
an ambiguity error, since it'd only be a follow-up error.

### Other tests

`tcon1.nim` had to be adjusted to produce the same results. Due to the
missing closing parentheses, and faux matches now working again,
the three-parameter `p` overload was marked as being used *twice*,
leading to it being shown before the other overload (which was
considered to only be used *once*).

Finally, two new tests are added for preventing future regressions with
faux matches.
---
 compiler/sem/semcall.nim                      | 11 ++++-
 compiler/sem/semtypes.nim                     | 10 +++-
 compiler/sem/sigmatch.nim                     | 45 +++++++++--------
 nimsuggest/tests/tcon1.nim                    |  2 +-
 tests/errmsgs/tcall_argument_error.nim        | 49 +++++++++++++++++++
 .../errmsgs/tcall_argument_error_ambigous.nim | 20 ++++++++
 ...ped_overload_tie_with_typed_with_error.nim | 12 ++---
 7 files changed, 116 insertions(+), 33 deletions(-)
 create mode 100644 tests/errmsgs/tcall_argument_error.nim
 create mode 100644 tests/errmsgs/tcall_argument_error_ambigous.nim

diff --git a/compiler/sem/semcall.nim b/compiler/sem/semcall.nim
index 7e1f8b188a9..62eb231b1a6 100644
--- a/compiler/sem/semcall.nim
+++ b/compiler/sem/semcall.nim
@@ -394,7 +394,11 @@ proc resolveOverloads(c: PContext, n, nOrig: PNode,
     c.config.internalAssert result.state == csMatch
     #writeMatches(result)
     #writeMatches(alt)
-    if c.config.m.errorOutputs == {}:
+    if result.fauxMatch == tyError:
+      # don't report an ambiguity error when the candidates both only matched
+      # due to errors
+      assert alt.fauxMatch == tyError
+    elif c.config.m.errorOutputs == {}:
       # quick error message for performance of 'compiles' built-in:
       globalReport(c.config, n.info, reportSem(rsemAmbiguous))
 
@@ -530,7 +534,10 @@ proc semResolvedCall(c: PContext, x: TCandidate,
   if x.hasFauxMatch:
     result = x.call
     result[0] = newSymNode(finalCallee, getCallLineInfo(result[0]))
-    if containsGenericType(result.typ) or x.fauxMatch == tyUnknown:
+    if x.fauxMatch == tyError:
+      # at least one argument expression was erroneous
+      result = c.config.wrapError(result)
+    elif containsGenericType(result.typ) or x.fauxMatch == tyUnknown:
       result.typ = newTypeS(x.fauxMatch, c)
       if result.typ.kind == tyError: incl result.typ.flags, tfCheckedForDestructor
     return
diff --git a/compiler/sem/semtypes.nim b/compiler/sem/semtypes.nim
index 6dbd5dc5a31..091d9c54fbd 100644
--- a/compiler/sem/semtypes.nim
+++ b/compiler/sem/semtypes.nim
@@ -1714,7 +1714,15 @@ proc semGeneric(c: PContext, n: PNode, s: PSym, prev: PType): PType =
     m.isNoCall = true
     matches(c, n, copyNodeWithKids(n), m)
 
-    if m.state != csMatch:
+    case m.state
+    of csMatch:
+      if m.fauxMatch == tyError:
+        # not a real match, report the errors and return
+        # XXX: this needs to use proper error propagation
+        for it in walkErrors(c.config, m.call):
+          localReport(c.config, it)
+        return newOrPrevType(tyError, prev, c)
+    else:
       localReport(c.config, n.info):
         block:
           var r = reportTyp(rsemCannotInstantiateWithParameter, t, ast = n)
diff --git a/compiler/sem/sigmatch.nim b/compiler/sem/sigmatch.nim
index db356e36ae6..0669d5c492b 100644
--- a/compiler/sem/sigmatch.nim
+++ b/compiler/sem/sigmatch.nim
@@ -140,6 +140,7 @@ proc initCandidate*(ctx: PContext, c: var TCandidate, callee: PType) =
   c.calleeSym = nil
   c.call = nil
   c.baseTypeMatch = false
+  c.fauxMatch = tyNone
   c.genericConverter = false
   c.inheritancePenalty = 0
   c.error = SemCallMismatch()
@@ -284,6 +285,15 @@ proc writeMatches*(c: TCandidate) =
   echo "  inheritance: ", c.inheritancePenalty
 
 proc cmpCandidates*(a, b: TCandidate): int =
+  # a non-erroneous candidate is always preferred over an erroneous one.
+  # This is only necessary to allow recovery through ``untyped``
+  if a.fauxMatch == tyError:
+    if b.fauxMatch != tyError:
+      return -1
+    # for two erroneous candidates, pick the better one
+  elif b.fauxMatch == tyError:
+    return 1
+
   result = a.exactMatches - b.exactMatches
   if result != 0: return
   result = a.genericMatches - b.genericMatches
@@ -2233,17 +2243,8 @@ proc instantiateRoutineExpr(c: PContext, bindings: TIdTable, n: PNode): PNode =
   else:
     discard "result is already set"
 
-template acceptsTyped(callee: PSym, typ: PType): bool =
-  callee != nil and callee.kind in {skMacro, skTemplate} and
-    typ != nil and (typ.kind == tyTyped or
-                    typ.kind == tyVarargs and typ[0].kind == tyTyped)
-
 proc paramTypesMatchAux(m: var TCandidate, f, a: PType,
                         argSemantized: PNode): PNode =
-  if argSemantized.isError and not acceptsTyped(m.calleeSym, f):
-    result = argSemantized
-    return
-  
   var
     fMaybeStatic = f.skipTypes({tyDistinct})
     arg = argSemantized
@@ -2293,6 +2294,10 @@ proc paramTypesMatchAux(m: var TCandidate, f, a: PType,
   let oldInheritancePenalty = m.inheritancePenalty
   var r = typeRel(m, f, a)
 
+  if a != nil and a.kind == tyError:
+    # if the argument is an error, a match, if any, is a faux match
+    m.fauxMatch = tyError
+
   # This special typing rule for macros and templates is not documented
   # anywhere and breaks symmetry. It's hard to get rid of though, my
   # custom seqs example fails to compile without this:
@@ -2416,10 +2421,10 @@ proc paramTypesMatchAux(m: var TCandidate, f, a: PType,
       result = implicitConv(nkHiddenSubConv, f, arg, m, c)
   of isNone:
     # do not do this in ``typeRel`` as it then can't infer T in ``ref T``:
-    # xxx: likely a latent bug, as tyError is simply a const equal to tyProxy
-    if a.kind in {tyProxy, tyUnknown}:
+    if a.kind in {tyError, tyUnknown}:
       inc(m.genericMatches)
-      m.fauxMatch = a.kind
+      if m.fauxMatch != tyError: # don't go back from error matches
+        m.fauxMatch = a.kind
       result = arg
       return
     elif a.kind == tyVoid and f.matchesVoidProc and arg.kind == nkStmtList:
@@ -2940,8 +2945,8 @@ proc matchesAux(c: PContext, n, nOrig: PNode, m: var TCandidate, marker: var Int
       else:
         setSon(m.call, formal.position + 1, arg)
 
-      if operand.kind == nkError and acceptsTyped(m.calleeSym, formal.typ):
-        discard "typed params accept errors, rejected in evalTemplateArgs"
+      if operand.kind == nkError:
+        discard "could be a faux match, rejected in semResolvedCall"
       elif arg.isError:
         noMatchDueToError()
 
@@ -2974,9 +2979,7 @@ proc matchesAux(c: PContext, n, nOrig: PNode, m: var TCandidate, marker: var Int
               else:
                 copyTree(operand)
             
-            if operand.isError:
-              noMatchDueToError()
-            elif operand.typ != nil and operand.typ.kind != tyUntyped:
+            if operand.typ != nil and operand.typ.kind != tyUntyped:
               # don't overwrite a potentially semmed/typed value in `n[a]`
               n[a] = operand
         elif formal != nil and formal.typ.kind == tyVarargs: # extra varargs
@@ -3003,8 +3006,8 @@ proc matchesAux(c: PContext, n, nOrig: PNode, m: var TCandidate, marker: var Int
             container.add arg
             incrIndexType(container.typ)
 
-          if operand.kind == nkError and acceptsTyped(m.calleeSym, formal.typ):
-            discard "typed params accept errors, rejected in evalTemplateArgs"
+          if operand.kind == nkError:
+            discard "could be a faux match, rejected in semResolvedCall"
           elif arg.kind == nkError:
             noMatchDueToError()
 
@@ -3097,8 +3100,8 @@ proc matchesAux(c: PContext, n, nOrig: PNode, m: var TCandidate, marker: var Int
 
             noMatch()
 
-          if operand.kind == nkError and acceptsTyped(m.calleeSym, formal.typ):
-            discard "typed params accept errors, rejected in evalTemplateArgs"
+          if operand.kind == nkError:
+            discard "could be a faux match, rejected in semResolvedCall"
           elif arg.kind == nkError:
             noMatchDueToError()
 
diff --git a/nimsuggest/tests/tcon1.nim b/nimsuggest/tests/tcon1.nim
index 1e0b219ddd5..fc9b6f5ea4c 100644
--- a/nimsuggest/tests/tcon1.nim
+++ b/nimsuggest/tests/tcon1.nim
@@ -16,7 +16,7 @@ test("hello here", #[!]#)
 testB(#[!]#
 
 # dot expressions
-"from behind".test(#[!]#
+"from behind".test(#[!]#)
 
 # two params matched, so disqualify the lower airity `test`
 # TODO: this doesn't work, because dot exprs, overloads, etc aren't currently
diff --git a/tests/errmsgs/tcall_argument_error.nim b/tests/errmsgs/tcall_argument_error.nim
new file mode 100644
index 00000000000..13b6f157e53
--- /dev/null
+++ b/tests/errmsgs/tcall_argument_error.nim
@@ -0,0 +1,49 @@
+discard """
+  description: '''
+    Ensure no redundant errors are reported in check mode when a call argument
+    has an error
+  '''
+  cmd: "$nim check --hints:off $options $file"
+  action: reject
+  nimoutfull: true
+  nimout: '''
+tcall_argument_error.nim(44, 14) Error: undeclared identifier: 'missing'
+tcall_argument_error.nim(46, 21) Error: undeclared identifier: 'missing'
+tcall_argument_error.nim(48, 11) Error: undeclared identifier: 'missing'
+tcall_argument_error.nim(48, 10) Error: type mismatch: got <>
+but expected one of:
+proc p(x, y: int): int
+  first type mismatch at position: 2
+  missing parameter: y
+proc p(x, y: string): string
+  first type mismatch at position: 2
+  missing parameter: y
+
+expression: p(missing)
+tcall_argument_error.nim(49, 11) Error: undeclared identifier: 'missing'
+tcall_argument_error.nim(49, 10) Error: type mismatch: got <>
+but expected one of:
+proc p(x, y: int): int
+  first type mismatch at position: 3
+  extra argument given
+proc p(x, y: string): string
+  first type mismatch at position: 2
+  required type for y: string
+  but expression '1' is of type: int literal(1)
+
+expression: p(missing, 1, 2)
+'''
+"""
+
+proc p(x, y: string): string =
+  discard
+
+proc p(x, y: int): int =
+  discard
+
+discard p(1, missing)
+# nested call, where the inner call expression has an error:
+discard p("", p("", missing))
+# if an argument is erroneous, arity is still considered:
+discard p(missing) # no overload with matching arity
+discard p(missing, 1, 2) # no overload with matching arity
diff --git a/tests/errmsgs/tcall_argument_error_ambigous.nim b/tests/errmsgs/tcall_argument_error_ambigous.nim
new file mode 100644
index 00000000000..567e00c520e
--- /dev/null
+++ b/tests/errmsgs/tcall_argument_error_ambigous.nim
@@ -0,0 +1,20 @@
+discard """
+  description: '''
+    Ensure no "ambiguous call" error is reported when an argument, of which
+    the type is needed for disambiguating, is erroneous
+  '''
+  cmd: "$nim check --hints:off $options $file"
+  action: reject
+  nimoutfull: true
+  nimout: '''
+tcall_argument_error_ambigous.nim(20, 14) Error: undeclared identifier: 'missing'
+'''
+"""
+
+proc p(x: int, y: float): int =
+  discard
+
+proc p(x: int, y: int): int =
+  discard
+
+discard p(1, missing)
diff --git a/tests/lang_callable/overload/tuntyped_overload_tie_with_typed_with_error.nim b/tests/lang_callable/overload/tuntyped_overload_tie_with_typed_with_error.nim
index 1fb7d494662..0a209001208 100644
--- a/tests/lang_callable/overload/tuntyped_overload_tie_with_typed_with_error.nim
+++ b/tests/lang_callable/overload/tuntyped_overload_tie_with_typed_with_error.nim
@@ -1,14 +1,10 @@
 discard """
   description: '''
-    Ensure that overloads separated by `typed` and `untyped` parameters tie,
-    resulting in an ambiguity error, if that argument is an `nkError`.
-
-    This isn't ideal, but it works until `untyped` parameters result in eager
-    matching over any other parameter type.
+    Ensure that overloads separated by `typed` and `untyped` parameters don't
+    result in a tie, if the argument in question is erroneous (i.e., an
+    `nkError`).
   '''
-  errormsg: "ambiguous call"
-  line: 22
-  column: 2
+  action: compile
 """
 
 import std/macros

From 5b430c685b000d0fbae4800c603ef028028c8c91 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Wed, 10 Apr 2024 22:02:24 +0200
Subject: [PATCH 062/169] mir: add dedicated 'mutable' version for view
 creation (#1273)

## Summary

Encode in syntax whether a `mnkView`/`mnkToSlice` creates a mutable
view, by introducing two new node kinds. This allows creation of a
data-flow graph without access to type information.

## Details

* add `mnkMutView` and `mnkToMutSlice` to the MIR
* `mirgen` picks which operation to use based on the expression's
  return type
* `mirexec.computeDfg` now decides the data-flow operation(s) for a
  view creation operation based purely on syntax
* the mutable versions are currently pretty-printed in the same way as
  their non-mutable counterparts
* no new CGIR node kinds are introduced, as they're not needed
---
 compiler/backend/cgirgen.nim |  4 ++--
 compiler/mir/mirgen.nim      | 19 +++++++++++++++----
 compiler/mir/mirtrees.nim    |  8 +++++---
 compiler/mir/utils.nim       |  4 ++--
 compiler/sem/mirexec.nim     | 12 ++++++------
 doc/mir.rst                  |  3 +++
 6 files changed, 33 insertions(+), 17 deletions(-)

diff --git a/compiler/backend/cgirgen.nim b/compiler/backend/cgirgen.nim
index 810ae605c04..57b1713c1d2 100644
--- a/compiler/backend/cgirgen.nim
+++ b/compiler/backend/cgirgen.nim
@@ -971,14 +971,14 @@ proc exprToIr(tree: MirBody, cl: var TranslateCl,
     op cnkConv, valueToIr(tree, cl, cr)
   of mnkStdConv:
     op cnkHiddenConv, valueToIr(tree, cl, cr)
-  of mnkToSlice:
+  of mnkToSlice, mnkToMutSlice:
     treeOp cnkToSlice:
       res.add valueToIr(tree, cl, cr)
   of mnkAddr:
     op cnkAddr, lvalueToIr(tree, cl, cr)
   of mnkDeref:
     op cnkDeref, atomToIr(tree, cl, cr)
-  of mnkView:
+  of mnkView, mnkMutView:
     op cnkHiddenAddr, lvalueToIr(tree, cl, cr)
   of mnkDerefView:
     op cnkDerefView, atomToIr(tree, cl, cr)
diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index 3b14298f7f8..80f488db1ed 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -1728,6 +1728,16 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
   template recurse() =
     genx(c, e, i - 1)
 
+  proc viewOp(kind: MirNodeKind, typ: PType): MirNodeKind {.nimcall.} =
+    # pick the correct kind based on the var-ness
+    let isMutable = typ.skipTypes(abstractInst).kind == tyVar
+    case kind
+    of mnkView:
+      if isMutable: mnkMutView    else: mnkView
+    of mnkToSlice:
+      if isMutable: mnkToMutSlice else: mnkToSlice
+    else: unreachable()
+
   case n.kind
   of pirProc:
     c.use toValue(c.env.procedures.add(n.sym), n.sym.typ)
@@ -1818,7 +1828,7 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
     c.buildOp mnkAddr, n.typ:
       recurse()
   of pirView:
-    c.buildOp mnkView, n.typ:
+    c.buildOp viewOp(mnkView, n.typ), n.typ:
       recurse()
   of pirCast:
     c.buildOp mnkCast, n.typ:
@@ -1830,12 +1840,13 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
     c.buildOp mnkStdConv, n.typ:
       recurse()
   of pirToSlice:
-    c.buildOp mnkToSlice, n.typ:
+    c.buildOp viewOp(mnkToSlice, n.typ), n.typ:
       recurse()
   of pirToSubSlice:
     # the array operand is a PMIR expression already, but the operands
     # specifying the bounds are not
     let
+      op = viewOp(mnkToSlice, n.typ)
       a = n.orig[2]
       b = n.orig[3]
     if optBoundsCheck in c.userOptions and needsBoundCheck(n.orig[1], a, b):
@@ -1849,12 +1860,12 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
           c.emitByVal lo
           c.emitByVal hi
 
-      c.buildTree mnkToSlice, n.typ:
+      c.buildTree op, n.typ:
         c.use arr
         c.use lo
         c.use hi
     else:
-      c.buildTree mnkToSlice, n.typ:
+      c.buildTree op, n.typ:
         recurse()
         genArgExpression(c, a, sink=false)
         genArgExpression(c, b, sink=false)
diff --git a/compiler/mir/mirtrees.nim b/compiler/mir/mirtrees.nim
index 5bf4f28722d..93acdefbdf4 100644
--- a/compiler/mir/mirtrees.nim
+++ b/compiler/mir/mirtrees.nim
@@ -132,6 +132,7 @@ type
     mnkDeref  ## dereference a ``ptr`` or ``ref`` value
 
     mnkView      ## create a first-class safe alias from an lvalue
+    mnkMutView   ## create a safe mutable view from an lvalue
     mnkDerefView ## dereference a first-class safe alias
 
     mnkStdConv    ## a standard conversion. Produce a new value.
@@ -148,6 +149,7 @@ type
                   ##   upper bound
     # XXX: consider using a separate operator for the slice-from-sub-sequence
     #      operation
+    mnkToMutSlice ## version of ``mnkToSlice`` for creating a mutable slice
 
     mnkCall   ## invoke a procedure and pass along the provided arguments.
               ## Used for both static and dynamic calls
@@ -343,7 +345,7 @@ const
                          mnkAddr, mnkDeref, mnkView, mnkDerefView, mnkStdConv,
                          mnkConv, mnkCast, mnkRaise, mnkTag, mnkArg,
                          mnkName, mnkConsume, mnkVoid, mnkCopy, mnkMove,
-                         mnkSink, mnkDestroy}
+                         mnkSink, mnkDestroy, mnkMutView, mnkToMutSlice}
     ## Nodes that start sub-trees but that always have a single sub node.
 
   ArgumentNodes* = {mnkArg, mnkName, mnkConsume}
@@ -380,8 +382,8 @@ const
                       mnkPathConv, mnkDeref, mnkDerefView, mnkTemp, mnkAlias,
                       mnkLocal, mnkParam, mnkConst, mnkGlobal}
   RvalueExprKinds* = {mnkType, mnkProc, mnkConv, mnkStdConv, mnkCast, mnkAddr,
-                      mnkView, mnkToSlice} + UnaryOps + BinaryOps +
-                     LiteralDataNodes
+                      mnkView, mnkMutView, mnkToSlice, mnkToMutSlice} +
+                     UnaryOps + BinaryOps + LiteralDataNodes
   ExprKinds* =       {mnkCall, mnkCheckedCall, mnkSetConstr, mnkArrayConstr,
                       mnkSeqConstr, mnkTupleConstr, mnkClosureConstr,
                       mnkObjConstr} + LvalueExprKinds + RvalueExprKinds +
diff --git a/compiler/mir/utils.nim b/compiler/mir/utils.nim
index 7475111a796..3f3118cbdef 100644
--- a/compiler/mir/utils.nim
+++ b/compiler/mir/utils.nim
@@ -350,10 +350,10 @@ proc exprToStr(nodes: MirTree, i: var int, result: var string, c: RenderCtx) =
   of mnkAddr:
     tree "addr ":
       valueToStr()
-  of mnkView:
+  of mnkView, mnkMutView:
     tree "borrow ":
       valueToStr()
-  of mnkToSlice:
+  of mnkToSlice, mnkToMutSlice:
     tree "toOpenArray ":
       commaSeparated:
         valueToStr()
diff --git a/compiler/sem/mirexec.nim b/compiler/sem/mirexec.nim
index 07695603289..2b5874ae0f5 100644
--- a/compiler/sem/mirexec.nim
+++ b/compiler/sem/mirexec.nim
@@ -256,14 +256,14 @@ func emitForExpr(env: var ClosureEnv, tree: MirTree, at, source: NodePosition) =
     # handles aren't tracked however, the operation is conservatively
     # treated as a mutation
     emitLvalueOp(env, opMutate, tree, at, tree.operand(source))
-  of mnkView:
+  of mnkView, mnkMutView:
     # if the created view supports mutation, treat the creation as a
     # mutation itself
     let opc =
-      if tree[source].typ.kind == tyVar: opMutate
-      else:                              opUse
+      if tree[source].kind == mnkView: opUse
+      else:                            opMutate
     emitLvalueOp(env, opc, tree, at, tree.operand(source))
-  of mnkToSlice:
+  of mnkToSlice, mnkToMutSlice:
     # slices aren't tracked at the moment, so the mere creation of a slice is
     # treated as a usage of the sequence. If the resulting openArray supports
     # mutation, creation of the slice is treated as a mutation. To ensure the
@@ -274,8 +274,8 @@ func emitForExpr(env: var ClosureEnv, tree: MirTree, at, source: NodePosition) =
       emitLvalueOp(env, opUse, tree, at, tree.operand(source, 2))
 
     let opc =
-      if tree[source].typ.kind == tyVar: opMutate
-      else:                              opUse
+      if tree[source].kind == mnkToSlice: opUse
+      else:                               opMutate
     emitLvalueOp(env, opc, tree, at, tree.operand(source, 0))
   of mnkCopy, mnkSink:
     # until it's collapsed, a sink is conservatively treated as only a
diff --git a/doc/mir.rst b/doc/mir.rst
index a7f171dea9a..7f8a69d1f9f 100644
--- a/doc/mir.rst
+++ b/doc/mir.rst
@@ -121,13 +121,16 @@ Semantics
          | Addr     LVALUE               # create a pointer from the lvalue
          | View     LVALUE               # create a view (`var`/`lent`) of the
                                          # lvalue
+         | MutView  LVALUE
          | ToSlice  VALUE                # create an `openArray` slice of
                                          # the full sequence
+         | MutToSlice LVALUE
          | ToSlice  VALUE, VALUE, VALUE  # create an `openArray` slice from the
                                          # first operand, starting at the lower
                                          # bound (second parameter) and ending
                                          # at the upper bound (inclusive, third
                                          # parameter)
+         | MutToSlice LVALUE, VALUE, VALUE
 
   ASGN_SRC = RVALUE
            | VALUE

From 03791e764b405637ef6e3e17709189cd31147e5c Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Fri, 12 Apr 2024 20:47:26 +0200
Subject: [PATCH 063/169] mir: distinguish between proc values and references
 (#1275)

## Summary

Introduce `mnkProcVal`, which takes over the "procedural value" meaning
of `mnkProc`; the latter now only means "reference to procedure".
This clarifies the syntax a bit, but, more importantly, allows
`mnkProc` nodes to not require a type.

## Details

* add the `mnkProcVal` kind and update the grammar
* where the value interpretation was used, replace usages of `mnkProc`
  with `mnkProcVal`
* for the sake of keeping the code generators as is, `mnkProc` is still
  translated to a typed `cnkProc`
* `mirconstr.buildCall` no longer requires a procedure type
* all static calls use `mnkProc` instead of `mnkProcVal`
---
 compiler/backend/backends.nim      | 10 +++++-----
 compiler/backend/cgirgen.nim       | 26 +++++++++++++++++---------
 compiler/backend/compat.nim        |  2 +-
 compiler/mir/datatables.nim        |  4 ++--
 compiler/mir/mirconstr.nim         |  6 +++---
 compiler/mir/mirgen.nim            |  7 +++----
 compiler/mir/mirpasses.nim         |  7 +++----
 compiler/mir/mirtrees.nim          | 15 ++++++++-------
 compiler/mir/utils.nim             |  7 ++++---
 compiler/sem/aliasanalysis.nim     |  6 +++---
 compiler/sem/injectdestructors.nim |  3 +--
 compiler/sem/mirexec.nim           |  4 ++--
 compiler/vm/packed_env.nim         |  2 +-
 doc/mir.rst                        |  4 ++--
 14 files changed, 55 insertions(+), 48 deletions(-)

diff --git a/compiler/backend/backends.nim b/compiler/backend/backends.nim
index a61fba16fee..fece22dbef7 100644
--- a/compiler/backend/backends.nim
+++ b/compiler/backend/backends.nim
@@ -281,7 +281,7 @@ iterator deps*(tree: MirTree): lent MirNode =
       # skip over the name slot:
       i = NodePosition tree.operand(i, 1)
       continue
-    of mnkProc:
+    of mnkProc, mnkProcVal:
       yield tree[i]
     of mnkGlobal:
       yield tree[i]
@@ -436,7 +436,7 @@ proc genLoadLib(bu: var MirBuilder, graph: ModuleGraph, env: var MirEnv,
 
   bu.subTree MirNode(kind: mnkAsgn):
     bu.use loc
-    bu.buildCall env.procedures.add(loadLib), loadLib.typ, loadLib.typ[0]:
+    bu.buildCall env.procedures.add(loadLib), loadLib.typ[0]:
       bu.emitByVal name
 
   bu.wrapTemp(graph.getSysType(unknownLineInfo, tyBool)):
@@ -480,7 +480,7 @@ proc genLibSetup(graph: ModuleGraph, env: var MirEnv, conf: BackendConfig,
 
       # if none of the candidates worked, a run-time error is reported:
       bu.subTree mnkVoid:
-        bu.buildCall env.procedures.add(errorProc), errorProc.typ, voidTyp:
+        bu.buildCall env.procedures.add(errorProc), voidTyp:
           bu.emitByVal literal(env.getOrIncl(path.strVal), path.typ)
       bu.add endNode(mnkStmtList)
   else:
@@ -498,7 +498,7 @@ proc genLibSetup(graph: ModuleGraph, env: var MirEnv, conf: BackendConfig,
     bu.subTree mnkIf:
       bu.use cond
       bu.subTree mnkVoid:
-        bu.buildCall env.procedures.add(errorProc), errorProc.typ, voidTyp:
+        bu.buildCall env.procedures.add(errorProc), voidTyp:
           bu.emitByVal nameTemp
 
 proc produceLoader(graph: ModuleGraph, m: Module, data: var DiscoveryData,
@@ -558,7 +558,7 @@ proc produceLoader(graph: ModuleGraph, m: Module, data: var DiscoveryData,
 
     # generate the code for ``sym = cast[typ](nimGetProcAddr(lib, extname))``
     let tmp = bu.wrapTemp(loadProc.typ[0]):
-      bu.buildCall env.procedures.add(loadProc), loadProc.typ, loadProc.typ[0]:
+      bu.buildCall env.procedures.add(loadProc), loadProc.typ[0]:
         bu.emitByVal toValue(libVar, lib.name.typ)
         bu.emitByVal literal(env.getOrIncl(extname.strVal), extname.typ)
 
diff --git a/compiler/backend/cgirgen.nim b/compiler/backend/cgirgen.nim
index 57b1713c1d2..6600ab3c83c 100644
--- a/compiler/backend/cgirgen.nim
+++ b/compiler/backend/cgirgen.nim
@@ -254,7 +254,7 @@ proc convToIr(cl: TranslateCl, n: CgNode, info: TLineInfo, dest: PType): CgNode
 
 proc atomToIr(n: MirNode, cl: TranslateCl, info: TLineInfo): CgNode =
   case n.kind
-  of mnkProc:
+  of mnkProcVal:
     CgNode(kind: cnkProc, info: info, typ: n.typ, prc: n.prc)
   of mnkGlobal:
     CgNode(kind: cnkGlobal, info: info, typ: n.typ, global: n.global)
@@ -320,7 +320,7 @@ proc lvalueToIr(tree: MirBody, cl: var TranslateCl, n: MirNode,
     lvalueToIr(tree, cl, tree.get(cr), cr, false)
 
   case n.kind
-  of mnkLocal, mnkGlobal, mnkParam, mnkTemp, mnkAlias, mnkConst, mnkProc:
+  of mnkLocal, mnkGlobal, mnkParam, mnkTemp, mnkAlias, mnkConst, mnkProcVal:
     return atomToIr(n, cl, info)
   of mnkPathNamed:
     let obj = recurse()
@@ -358,7 +358,7 @@ proc lvalueToIr(tree: MirBody, cl: var TranslateCl, n: MirNode,
     result = newOp(cnkDeref, info, n.typ, atomToIr(tree, cl, cr))
   of mnkDerefView:
     result = newOp(cnkDerefView, info, n.typ, atomToIr(tree, cl, cr))
-  of AllNodeKinds - LvalueExprKinds - {mnkProc}:
+  of AllNodeKinds - LvalueExprKinds - {mnkProcVal}:
     unreachable(n.kind)
 
   leave(tree, cr)
@@ -370,7 +370,7 @@ proc lvalueToIr(tree: MirBody, cl: var TranslateCl,
 proc valueToIr(tree: MirBody, cl: var TranslateCl,
                cr: var TreeCursor): CgNode =
   case tree[cr].kind
-  of mnkProc, mnkConst, mnkGlobal, mnkParam, mnkLocal, mnkTemp, mnkAlias,
+  of mnkProcVal, mnkConst, mnkGlobal, mnkParam, mnkLocal, mnkTemp, mnkAlias,
      mnkType, LiteralDataNodes:
     atomToIr(tree, cl, cr)
   of mnkPathPos, mnkPathNamed, mnkPathArray, mnkPathConv, mnkPathVariant,
@@ -393,7 +393,7 @@ proc argToIr(tree: MirBody, cl: var TranslateCl,
     # it is one, the expression must be an lvalue
     result = (true, lvalueToIr(tree, cl, cr))
     leave(tree, cr)
-  of LiteralDataNodes, mnkType, mnkProc, mnkNone:
+  of LiteralDataNodes, mnkType, mnkProcVal, mnkNone:
     # not a tag but an atom
     result = (false, atomToIr(n, cl, cr.info))
   of LvalueExprKinds:
@@ -403,16 +403,24 @@ proc argToIr(tree: MirBody, cl: var TranslateCl,
 
   leave(tree, cr)
 
+proc calleeToIr(tree: MirBody, cl: var TranslateCl, cr: var TreeCursor): CgNode =
+  case tree[cr].kind
+  of mnkMagic:
+    newMagicNode(tree.get(cr).magic, cr.info)
+  of mnkProc:
+    let prc = tree.get(cr).prc
+    # assign a type for the CGIR node, the code generators currently need it
+    CgNode(kind: cnkProc, typ: cl.env[][prc].typ, info: cr.info, prc: prc)
+  else:
+    valueToIr(tree, cl, cr)
+
 proc callToIr(tree: MirBody, cl: var TranslateCl, n: MirNode,
               cr: var TreeCursor): CgNode =
   ## Translate a valid call-like tree to the CG IR.
   let info = cr.info
   result = newExpr((if n.kind == mnkCall: cnkCall else: cnkCheckedCall),
                    info, n.typ)
-  result.add: # the callee
-    case tree[cr].kind
-    of mnkMagic: newMagicNode(tree.get(cr).magic, info)
-    else:        valueToIr(tree, cl, cr)
+  result.add calleeToIr(tree, cl, cr)
 
   # the code generators currently require some magics to not have any
   # arguments wrapped in ``cnkHiddenAddr`` nodes
diff --git a/compiler/backend/compat.nim b/compiler/backend/compat.nim
index a7df7f69db9..6360bf6f04d 100644
--- a/compiler/backend/compat.nim
+++ b/compiler/backend/compat.nim
@@ -200,7 +200,7 @@ proc translate*(t: MirTree, env: MirEnv): CgNode =
     of mnkAstLit:
       CgNode(kind: cnkAstLit, info: unknownLineInfo, typ: n.typ,
              astLit: env[n.ast])
-    of mnkProc:
+    of mnkProcVal:
       CgNode(kind: cnkProc, info: unknownLineInfo, prc: n.prc, typ: n.typ)
     of AllNodeKinds - ConstrTreeNodes + {mnkEnd, mnkField}:
       # 'end' nodes are skipped manually
diff --git a/compiler/mir/datatables.nim b/compiler/mir/datatables.nim
index b8d1604862f..5d5391e9a37 100644
--- a/compiler/mir/datatables.nim
+++ b/compiler/mir/datatables.nim
@@ -39,7 +39,7 @@ func hashTree(tree: ConstrTree): Hash =
       result = result !& hash(n.strVal)
     of mnkAstLit:
       result = result !& hash(n.ast)
-    of mnkProc:
+    of mnkProcVal:
       result = result !& hash(n.prc.ord)
     of mnkSetConstr, mnkRange, mnkArrayConstr, mnkSeqConstr, mnkTupleConstr,
        mnkClosureConstr, mnkObjConstr:
@@ -73,7 +73,7 @@ proc cmp(a, b: ConstrTree): bool =
       a.strVal == b.strVal
     of mnkAstLit:
       a.ast == b.ast
-    of mnkProc:
+    of mnkProcVal:
       a.prc == b.prc
     of mnkSetConstr, mnkRange, mnkArrayConstr, mnkSeqConstr, mnkTupleConstr,
        mnkClosureConstr, mnkObjConstr:
diff --git a/compiler/mir/mirconstr.nim b/compiler/mir/mirconstr.nim
index a783367a995..47eda209e64 100644
--- a/compiler/mir/mirconstr.nim
+++ b/compiler/mir/mirconstr.nim
@@ -98,7 +98,7 @@ func toValue*(id: GlobalId, typ: PType): Value =
   Value(node: MirNode(kind: mnkGlobal, typ: typ, global: id))
 
 func toValue*(id: ProcedureId, typ: PType): Value =
-  Value(node: MirNode(kind: mnkProc, typ: typ, prc: id))
+  Value(node: MirNode(kind: mnkProcVal, typ: typ, prc: id))
 
 func toValue*(kind: range[mnkParam..mnkLocal], id: LocalId,
               typ: PType): Value =
@@ -356,12 +356,12 @@ template buildMagicCall*(bu: var MirBuilder, m: TMagic, t: PType,
     bu.add MirNode(kind: mnkMagic, magic: m)
     body
 
-template buildCall*(bu: var MirBuilder, prc: ProcedureId, pt, t: PType,
+template buildCall*(bu: var MirBuilder, prc: ProcedureId, t: PType,
                     body: untyped) =
   ## Build and emits a call tree to the active buffer. `pt` is the type of the
   ## procedure.
   bu.subTree MirNode(kind: mnkCall, typ: t):
-    bu.use toValue(prc, pt)
+    bu.add procNode(prc)
     body
 
 func emitByVal*(bu: var MirBuilder, y: Value) =
diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index 80f488db1ed..69a8415f7a4 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -685,7 +685,7 @@ proc genCallee(c: var TCtx, n: PNode) =
     let s = n.sym
     if s.magic == mNone or s.magic in c.config.magicsToKeep:
       # reference the procedure by symbol
-      c.use toValue(c.env.procedures.add(s), s.typ)
+      c.add procNode(c.env.procedures.add(s))
     else:
       # don't use a symbol
       c.add MirNode(kind: mnkMagic, magic: s.magic)
@@ -1215,7 +1215,7 @@ proc genRaise(c: var TCtx, n: PNode) =
       cp = c.graph.getCompilerProc("prepareException")
     c.buildStmt mnkVoid:
       c.buildTree mnkCall, typeOrVoid(c, nil):
-        c.use toValue(c.env.procedures.add(cp), cp.typ)
+        c.add procNode(c.env.procedures.add(cp))
         c.subTree mnkArg:
           # lvalue conversion to the base ``Exception`` type:
           c.buildTree mnkPathConv, cp.typ[1]:
@@ -2234,8 +2234,7 @@ proc generateCode*(graph: ModuleGraph, env: var MirEnv, owner: PSym,
       c.subTree mnkBranch:
         c.subTree mnkVoid:
           let p = c.graph.getCompilerProc("nimUnhandledException")
-          c.builder.buildCall c.env.procedures.add(p), p.typ,
-                              typeOrVoid(c, p.typ[0]):
+          c.builder.buildCall c.env.procedures.add(p), typeOrVoid(c, p.typ[0]):
             discard
     c.add endNode(mnkTry)
 
diff --git a/compiler/mir/mirpasses.nim b/compiler/mir/mirpasses.nim
index 05ec8772114..3c978e9e715 100644
--- a/compiler/mir/mirpasses.nim
+++ b/compiler/mir/mirpasses.nim
@@ -428,13 +428,12 @@ proc injectProfilerCalls(tree: MirTree, graph: ModuleGraph, env: var MirEnv,
   ## * at the end of a loop's body
   let
     voidType = graph.getSysType(unknownLineInfo, tyVoid)
-    prc = graph.getCompilerProc("nimProfile")
-    prcId = env.procedures.add(prc)
+    prcId = env.procedures.add(graph.getCompilerProc("nimProfile"))
 
   # insert the entry call within the outermost scope:
   changes.insert(tree, tree.child(NodePosition 0, 0), NodePosition 0, bu):
     bu.subTree mnkVoid:
-      bu.buildCall prcId, prc.typ, voidType:
+      bu.buildCall prcId, voidType:
         discard "no arguments"
 
   for i in search(tree, {mnkEnd}):
@@ -442,7 +441,7 @@ proc injectProfilerCalls(tree: MirTree, graph: ModuleGraph, env: var MirEnv,
       # insert the call before the end node:
       changes.insert(tree, i - 1, i, bu):
         bu.subTree mnkVoid:
-          bu.buildCall prcId, prc.typ, voidType:
+          bu.buildCall prcId, voidType:
             discard "no arguments"
 
 proc applyPasses*(body: var MirBody, prc: PSym, env: var MirEnv,
diff --git a/compiler/mir/mirtrees.nim b/compiler/mir/mirtrees.nim
index 93acdefbdf4..0b44d015827 100644
--- a/compiler/mir/mirtrees.nim
+++ b/compiler/mir/mirtrees.nim
@@ -57,7 +57,8 @@ type
     mnkNone
 
     # entity names:
-    mnkProc   ## procedure
+    mnkProc   ## procedure reference; only allowed in callee slots
+    mnkProcVal## procedural value
     mnkConst  ## named constant
     mnkGlobal ## global location
     mnkParam  ## parameter
@@ -278,7 +279,7 @@ type
       ## non-critical meta-data associated with the node (e.g., origin
       ## information)
     case kind*: MirNodeKind
-    of mnkProc:
+    of mnkProc, mnkProcVal:
       prc*: ProcedureId
     of mnkGlobal:
       global*: GlobalId
@@ -360,12 +361,12 @@ const
 
   ConstrTreeNodes* = {mnkSetConstr, mnkRange, mnkArrayConstr, mnkSeqConstr,
                       mnkTupleConstr, mnkClosureConstr, mnkObjConstr,
-                      mnkProc, mnkArg, mnkField, mnkEnd} + LiteralDataNodes
+                      mnkProcVal, mnkArg, mnkField, mnkEnd} + LiteralDataNodes
     ## Nodes that can appear in the MIR subset used for constant expressions.
 
   # --- semantics-focused sets:
 
-  Atoms* = {mnkNone .. mnkType} - {mnkField}
+  Atoms* = {mnkNone .. mnkType} - {mnkField, mnkProc}
     ## Nodes that may be appear in atom-expecting slots.
 
   StmtNodes* = {mnkScope, mnkStmtList, mnkIf, mnkCase, mnkRepeat, mnkTry,
@@ -381,9 +382,9 @@ const
   LvalueExprKinds* = {mnkPathPos, mnkPathNamed, mnkPathArray, mnkPathVariant,
                       mnkPathConv, mnkDeref, mnkDerefView, mnkTemp, mnkAlias,
                       mnkLocal, mnkParam, mnkConst, mnkGlobal}
-  RvalueExprKinds* = {mnkType, mnkProc, mnkConv, mnkStdConv, mnkCast, mnkAddr,
-                      mnkView, mnkMutView, mnkToSlice, mnkToMutSlice} +
-                     UnaryOps + BinaryOps + LiteralDataNodes
+  RvalueExprKinds* = {mnkType, mnkProcVal, mnkConv, mnkStdConv, mnkCast,
+                      mnkAddr, mnkView, mnkMutView, mnkToSlice,
+                      mnkToMutSlice} + UnaryOps + BinaryOps + LiteralDataNodes
   ExprKinds* =       {mnkCall, mnkCheckedCall, mnkSetConstr, mnkArrayConstr,
                       mnkSeqConstr, mnkTupleConstr, mnkClosureConstr,
                       mnkObjConstr} + LvalueExprKinds + RvalueExprKinds +
diff --git a/compiler/mir/utils.nim b/compiler/mir/utils.nim
index 3f3118cbdef..7c19220796d 100644
--- a/compiler/mir/utils.nim
+++ b/compiler/mir/utils.nim
@@ -25,7 +25,7 @@ import
 func `$`(n: MirNode): string =
   result.add substr($n.kind, 3) # cut off the prefix
   case n.kind
-  of mnkProc:
+  of mnkProc, mnkProcVal:
     result.add " prc: "
     result.addInt n.prc.uint32
   of mnkConst:
@@ -205,7 +205,8 @@ proc singleToStr(n: MirNode, result: var string, c: RenderCtx) =
       result.addName(n.cnst, "<C", c)
   of mnkGlobal:
     result.addName(n.global, "<G", c)
-  of mnkProc:
+  of mnkProc, mnkProcVal:
+    # procedure references are also handled here for simplicity
     result.addName(n.prc, "<P", c)
   of mnkTemp, mnkAlias:
     result.add "_" & $n.local.int
@@ -243,7 +244,7 @@ proc singleToStr(n: MirNode, result: var string, c: RenderCtx) =
     result.add "type("
     result.add $n.typ
     result.add ")"
-  of AllNodeKinds - Atoms:
+  of AllNodeKinds - Atoms - {mnkProc}:
     result.add "<error: " & $n.kind & ">"
 
 proc singleToStr(tree: MirTree, i: var int, result: var string, c: RenderCtx) =
diff --git a/compiler/sem/aliasanalysis.nim b/compiler/sem/aliasanalysis.nim
index cc1a82646b8..dc55551c1f7 100644
--- a/compiler/sem/aliasanalysis.nim
+++ b/compiler/sem/aliasanalysis.nim
@@ -60,8 +60,8 @@ type
     long: seq[PathInstr]
 
 const
-  Roots = {mnkProc, mnkConst, mnkGlobal, mnkParam, mnkLocal, mnkTemp, mnkCall,
-           mnkDeref, mnkDerefView}
+  Roots = {mnkProcVal, mnkConst, mnkGlobal, mnkParam, mnkLocal, mnkTemp,
+           mnkCall, mnkDeref, mnkDerefView}
   PathOps = {mnkPathPos, mnkPathNamed, mnkPathArray, mnkPathConv,
              mnkPathVariant}
 
@@ -72,7 +72,7 @@ func isSameRoot(an, bn: MirNode): bool =
   case an.kind
   of mnkParam, mnkLocal, mnkTemp:
     result = an.local == bn.local
-  of mnkProc:
+  of mnkProcVal:
     result = an.prc == bn.prc
   of mnkConst:
     result = an.cnst == bn.cnst
diff --git a/compiler/sem/injectdestructors.nim b/compiler/sem/injectdestructors.nim
index 61d21c44289..ca44b7803e6 100644
--- a/compiler/sem/injectdestructors.nim
+++ b/compiler/sem/injectdestructors.nim
@@ -502,8 +502,7 @@ template buildVoidCall*(bu: var MirBuilder, env: var MirEnv, p: PSym,
                        body: untyped) =
   let prc = p # prevent multi evaluation
   bu.subTree mnkVoid:
-    bu.subTree MirNode(kind: mnkCall, typ: getVoidType(graph)):
-      bu.use toValue(env.procedures.add(prc), prc.typ)
+    bu.buildCall env.procedures.add(prc), getVoidType(graph):
       body
 
 proc genWasMoved(bu: var MirBuilder, graph: ModuleGraph, target: Value) =
diff --git a/compiler/sem/mirexec.nim b/compiler/sem/mirexec.nim
index 2b5874ae0f5..6d5d6f3bf4c 100644
--- a/compiler/sem/mirexec.nim
+++ b/compiler/sem/mirexec.nim
@@ -224,7 +224,7 @@ func emitForArgs(env: var ClosureEnv, tree: MirTree, at, source: NodePosition) =
       emitLvalueOp(env, opConsume, tree, at, tree.operand(it))
     of mnkName:
       emitForValue(env, tree, at, tree.skip(tree.operand(it), mnkTag))
-    of mnkField, mnkMagic:
+    of mnkField, mnkMagic, mnkProc:
       discard
     else:
       emitLvalueOp(env, opUse, tree, at, OpValue it)
@@ -291,7 +291,7 @@ func emitForExpr(env: var ClosureEnv, tree: MirTree, at, source: NodePosition) =
   of LvalueExprKinds:
     # raw usage of an lvalue
     emitLvalueOp(env, opUse, tree, at, OpValue source)
-  of mnkNone, LiteralDataNodes, mnkProc:
+  of mnkNone, LiteralDataNodes, mnkProcVal:
     discard "okay, ignore"
   of AllNodeKinds - ExprKinds - {mnkNone} + {mnkType}:
     unreachable(tree[source].kind)
diff --git a/compiler/vm/packed_env.nim b/compiler/vm/packed_env.nim
index 4ab0160344a..d861e6ff736 100644
--- a/compiler/vm/packed_env.nim
+++ b/compiler/vm/packed_env.nim
@@ -391,7 +391,7 @@ func storeDataNode(enc: var DataEncoder, e: var PackedEnv,
   of mnkStrLit:
     # the ID indexes into the string BiTable, it can be packed directly
     enc.put e, PackedDataNode(kind: pdkString, pos: t[n].strVal.uint32)
-  of mnkProc:
+  of mnkProcVal:
     # the ID is stable, it can be packed directly
     enc.put e, PackedDataNode(kind: pdkIntLit, pos: t[n].prc.uint32)
   of mnkArrayConstr, mnkSeqConstr:
diff --git a/doc/mir.rst b/doc/mir.rst
index 7f8a69d1f9f..bd992f41f58 100644
--- a/doc/mir.rst
+++ b/doc/mir.rst
@@ -44,7 +44,7 @@ Semantics
          | DerefView   NAME              # dereference a `var` or `lent`
 
   VALUE = <Literal>
-        | <Proc>
+        | <ProcVal>
         | <Type>
         | LVALUE
 
@@ -388,7 +388,7 @@ ones).
 
 .. code-block:: literal
 
-  VALUE = <Proc>
+  VALUE = <ProcVal>
         | <Literal>
         | COMPLEX
 

From 8e9e2df2062645d91959c009c77fa198887a6a42 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sat, 13 Apr 2024 00:58:40 +0200
Subject: [PATCH 064/169] fix: internal compiler errors with closure iterators
 (#1276)

## Summary

Fix two bugs with the closure iterator transformation that resulted in
internal compiler errors. One affected yields in `while` loops, the
other yields in object down-conversion expressions.

## Details

1. whether a split is required wasn't propagated upwards for
   `nkWhileStmt` statements, causing their enclosing statement-list
   expressions to not be lifted if there was no other source of
   splits
2. the `nkObjDownConv` node wasn't properly handled by
   `lowerStmtListExpr`, meaning that the statement-list expression
   unpacking wasn't performed

Two regression tests are added to `titer_issues.nim`.
---
 compiler/sem/closureiters.nim             |  5 ++--
 tests/lang_callable/iter/titer_issues.nim | 30 ++++++++++++++++++++++-
 2 files changed, 31 insertions(+), 4 deletions(-)

diff --git a/compiler/sem/closureiters.nim b/compiler/sem/closureiters.nim
index 3f9d6d1ba1e..4fdeb93dc03 100644
--- a/compiler/sem/closureiters.nim
+++ b/compiler/sem/closureiters.nim
@@ -690,7 +690,7 @@ proc lowerStmtListExprs(ctx: var Ctx, n: PNode, needsSplit: var bool): PNode =
         [st, n]
 
   of nkCast, nkHiddenStdConv, nkHiddenSubConv, nkConv, nkObjUpConv,
-      nkDerefExpr, nkHiddenDeref:
+     nkObjDownConv, nkDerefExpr, nkHiddenDeref:
     var ns = false
     for i in ord(n.kind == nkCast)..<n.len:
       n[i] = ctx.lowerStmtListExprs(n[i], ns)
@@ -743,8 +743,7 @@ proc lowerStmtListExprs(ctx: var Ctx, n: PNode, needsSplit: var bool): PNode =
 
   of nkWhileStmt:
     assert isTrue(n[0])
-    var bodyNeedsSplit = false
-    n[1] = ctx.lowerStmtListExprs(n[1], bodyNeedsSplit)
+    n[1] = ctx.lowerStmtListExprs(n[1], needsSplit)
 
   of nkDotExpr, nkCheckedFieldExpr:
     var ns = false
diff --git a/tests/lang_callable/iter/titer_issues.nim b/tests/lang_callable/iter/titer_issues.nim
index 6ae0e7c281d..2f8ed43d25d 100644
--- a/tests/lang_callable/iter/titer_issues.nim
+++ b/tests/lang_callable/iter/titer_issues.nim
@@ -277,4 +277,32 @@ block ref_construction_argument:
     yield a.i
 
   for i in iter(RefObj(i: 1)):
-    doAssert i == 3
\ No newline at end of file
+    doAssert i == 3
+
+block while_loop_in_closure_iterator_expression:
+  # a ``while`` loop with a yield inside and part of an expression was
+  # not transformed properly, leading to an internal compiler error
+  iterator iter() {.closure.} =
+    var val = block:
+      while true: # while loop part of a block expression
+        yield
+      1
+    doAssert val == 1
+
+  let it = iter
+  it()
+  it()
+
+block yield_in_obj_down_conversion:
+  # an object down-conversion containing a yield wasn't processed properly,
+  # leading to an internal compiler error
+  type Obj = ref object of RootObj
+
+  iterator iter() {.closure.} =
+    var x: ref RootObj
+    var val = Obj((;yield; x))
+    doAssert val.isNil
+
+  let it = iter
+  it()
+  it()

From 63c2686fd24f76e18c89c525830981e0b1514be7 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Wed, 17 Apr 2024 00:35:02 +0200
Subject: [PATCH 065/169] mir: use `TypeId` (#1277)

## Summary

Store references to types as `TypeId` instead of `PType`, making
`MirNode` a plain data-type. Besides speeding up the compiler, this
also paves the way to a data-oriented type IR for the MIR.

## Details

### Overview

* all MIR-level types use `TypeId` instead of `PType` (currently only
  `MirNode` and `Local`)
* the new `TypeEnv` type from the `mirtypes` module manages the type
  storage and mappings
* a `TypeEnv` instance is embedded in `MirEnv`
* registering a `PType` with `TypeEnv` yields a `TypeId`
* querying type information requires access to a `TypeEnv` instance

### Mapping Types

`TypeEnv` stores the `PType`-to-`TypeId` mappings in a `TypeTable`.
`TypeTable`, provided by the new `typemaps` module, is a custom
`Table` type that de-duplicates the `PType` keys by using structural
or symbolic comparison/hashing for the keys, thereby significantly
reducing the number of mappings and registered types.

At the moment, `PType` is still used as the type IR, so `TypeEnv` only
stores a `PType` for each `TypeId`.

The built-in types are mapped to statically known IDs, making some
translation and MIR construction easier.

### Constant expressions

To not require passing a `TypeEnv` to `datatables.getOrPut`, only the
type IDs are compared. This doesn't produce the same results as
`sameBackendType`, which ignores, for example, the distinct type
modifiers and aliases. As a result, `IntAlias(1)` and `int(1)` now
result in two `DataTable` entries instead of one.

Only using `TypeId` comparison/hashing does speed up `getOrPut`,
however.

### CGIR

* the CGIR still uses `PType`
* `cgirgen` turns the input `TypeId`s back into `PType`s
* since `cgirgen` creates new `PType` and assigns them to `Local`s,
  access to a *mutable* `MirEnv` is now required (in order to register
  the new `PType`s)

### VM backend

Packing constant data requires querying type information, and access to
a `TypeEnv` is thus required. A pointer to the `TypeEnv` instance is
passed along in `DataEncoder`.

### VM Evaluation Pass

Initializing the JIT environment requires a basic type environment,
which is not present when using the VM evaluation pass, as the `system`
module isn't yet processed at the time the `PEvalContext` is
initialized.

To delay setting up the JIT environment for as long as necessary, the
evaluation pass is restructured:
* only a VM instance is assigned to the `ModuleGraph` at the start
* `setupGlobalCtx` creates a proper evaluation context from the
  instance
* evaluating statements, which now calls `setupGlobalCtx`, is prevented
  for declarative statements

This ensures that `initJit` is only called after the processing of the
`system` module has set up the basic type environment.

### Compiler Performance

`MirNode` being a plain data-type (no destructor) significantly speeds
up all MIR processing that creates new nodes or copies/moves them,
especially `TreeChangeset` application (~ -70%).

In addition, copy/sink/destroy operations no longer need to be injected
for `MirNode`s, which also speeds up bootstrapping, since it means less
work for the destructor injection pass.

---------

Co-authored-by: Saem Ghani <saemghani+github@gmail.com>
---
 compiler/backend/backends.nim      |  50 ++--
 compiler/backend/cgen.nim          |   2 +-
 compiler/backend/cgendata.nim      |   3 +-
 compiler/backend/cgirgen.nim       |  79 +++---
 compiler/backend/compat.nim        |  26 +-
 compiler/backend/jsbackend.nim     |   2 +-
 compiler/backend/jsgen.nim         |   7 +-
 compiler/front/scripting.nim       |   4 +-
 compiler/mir/datatables.nim        |  10 +-
 compiler/mir/injecthooks.nim       |  30 +--
 compiler/mir/mirbodies.nim         |   2 +-
 compiler/mir/mirconstr.nim         |  40 +--
 compiler/mir/mirenv.nim            |  14 +-
 compiler/mir/mirgen.nim            | 391 ++++++++++++++---------------
 compiler/mir/mirpasses.nim         |  35 +--
 compiler/mir/mirtrees.nim          |   9 +-
 compiler/mir/mirtypes.nim          | 100 ++++++++
 compiler/mir/typemaps.nim          | 188 ++++++++++++++
 compiler/mir/utils.nim             |  41 ++-
 compiler/sem/injectdestructors.nim |  59 ++---
 compiler/vm/compilerbridge.nim     |  57 +++--
 compiler/vm/nimeval.nim            |   4 +-
 compiler/vm/packed_env.nim         |  14 +-
 compiler/vm/vmbackend.nim          |  10 +-
 compiler/vm/vmgen.nim              |  35 +--
 compiler/vm/vmjit.nim              |  13 +-
 compiler/vm/vmserialize.nim        |   6 +-
 tests/compiler/tdatatables.nim     |   9 +-
 28 files changed, 789 insertions(+), 451 deletions(-)
 create mode 100644 compiler/mir/mirtypes.nim
 create mode 100644 compiler/mir/typemaps.nim

diff --git a/compiler/backend/backends.nim b/compiler/backend/backends.nim
index fece22dbef7..1f4730c3385 100644
--- a/compiler/backend/backends.nim
+++ b/compiler/backend/backends.nim
@@ -31,6 +31,7 @@ import
     mirgen,
     mirpasses,
     mirtrees,
+    mirtypes,
     sourcemaps,
     utils
   ],
@@ -363,7 +364,7 @@ proc translate*(id: ProcedureId, body: PNode, graph: ModuleGraph,
   # now apply the passes:
   process(result, prc, graph, idgen, env)
 
-proc generateIR*(graph: ModuleGraph, idgen: IdGenerator, env: MirEnv,
+proc generateIR*(graph: ModuleGraph, idgen: IdGenerator, env: var MirEnv,
                  owner: PSym, body: sink MirBody): Body =
   ## Translates the MIR code provided by `code` into ``CgNode`` IR and,
   ## if enabled, echoes the result.
@@ -420,7 +421,7 @@ proc produceFragmentsForGlobals(
       if hasDestructor(s.typ):
         prepare(deinit, result.deinit.source, graph.emptyNode)
         deinit.setSource(result.deinit.source.add(it[0]))
-        genDestroy(deinit, graph, env, toValue(global, s.typ))
+        genDestroy(deinit, graph, env, toValue(global, env.types.add(s.typ)))
 
   (result.init.code, result.init.locals) =
     finish(init, result.init.source, graph.emptyNode)
@@ -436,11 +437,11 @@ proc genLoadLib(bu: var MirBuilder, graph: ModuleGraph, env: var MirEnv,
 
   bu.subTree MirNode(kind: mnkAsgn):
     bu.use loc
-    bu.buildCall env.procedures.add(loadLib), loadLib.typ[0]:
+    bu.buildCall env.procedures.add(loadLib), env.types.add(loadLib.typ[0]):
       bu.emitByVal name
 
-  bu.wrapTemp(graph.getSysType(unknownLineInfo, tyBool)):
-    bu.buildMagicCall mIsNil, graph.getSysType(unknownLineInfo, tyBool):
+  bu.wrapTemp(BoolType):
+    bu.buildMagicCall mIsNil, BoolType:
       bu.emitByVal loc
 
 proc genLibSetup(graph: ModuleGraph, env: var MirEnv, conf: BackendConfig,
@@ -451,8 +452,7 @@ proc genLibSetup(graph: ModuleGraph, env: var MirEnv, conf: BackendConfig,
   ## expression used with the ``.dynlib`` pragma.
   let
     errorProc = graph.getCompilerProc("nimLoadLibraryError")
-    voidTyp   = graph.getSysType(path.info, tyVoid)
-    val       = toValue(libVar, env[libVar].typ)
+    val       = toValue(libVar, env.types.add(env[libVar].typ))
 
   if path.kind in nkStrKinds:
     # the library name is known at compile-time
@@ -467,11 +467,10 @@ proc genLibSetup(graph: ModuleGraph, env: var MirEnv, conf: BackendConfig,
       bu.add MirNode(kind: mnkStmtList) # manual, for less visual nesting
       for candidate in candidates.items:
         var tmp = genLoadLib(bu, graph, env, val):
-          literal(env.getOrIncl(candidate),
-                  graph.getSysType(path.info, tyString))
+          literal(env.getOrIncl(candidate), StringType)
 
-        tmp = bu.wrapTemp(graph.getSysType(path.info, tyBool)):
-          bu.buildMagicCall mNot, graph.getSysType(path.info, tyBool):
+        tmp = bu.wrapTemp(BoolType):
+          bu.buildMagicCall mNot, BoolType:
             bu.emitByVal tmp
 
         bu.subTree mnkIf:
@@ -480,16 +479,13 @@ proc genLibSetup(graph: ModuleGraph, env: var MirEnv, conf: BackendConfig,
 
       # if none of the candidates worked, a run-time error is reported:
       bu.subTree mnkVoid:
-        bu.buildCall env.procedures.add(errorProc), voidTyp:
-          bu.emitByVal literal(env.getOrIncl(path.strVal), path.typ)
+        bu.buildCall env.procedures.add(errorProc), VoidType:
+          bu.emitByVal literal(env.getOrIncl(path.strVal), StringType)
       bu.add endNode(mnkStmtList)
   else:
     # the name of the dynamic library to load the procedure from is only known
     # at run-time
-    let
-      strType = graph.getSysType(path.info, tyString)
-
-    let nameTemp = bu.allocTemp(strType)
+    let nameTemp = bu.allocTemp(StringType)
     bu.buildStmt mnkDef:
       bu.use nameTemp
       generateCode(graph, env, conf.tconfig, path, bu, source)
@@ -498,7 +494,7 @@ proc genLibSetup(graph: ModuleGraph, env: var MirEnv, conf: BackendConfig,
     bu.subTree mnkIf:
       bu.use cond
       bu.subTree mnkVoid:
-        bu.buildCall env.procedures.add(errorProc), voidTyp:
+        bu.buildCall env.procedures.add(errorProc), VoidType:
           bu.emitByVal nameTemp
 
 proc produceLoader(graph: ModuleGraph, m: Module, data: var DiscoveryData,
@@ -512,7 +508,6 @@ proc produceLoader(graph: ModuleGraph, m: Module, data: var DiscoveryData,
     loadProc = graph.getCompilerProc("nimGetProcAddr")
     path     = transformExpr(graph, m.idgen, m.sym, lib.path)
     extname  = newStrNode(nkStrLit, sym.extname)
-    voidTyp  = graph.getSysType(path.info, tyVoid)
 
   extname.typ = graph.getSysType(lib.path.info, tyCstring)
 
@@ -521,9 +516,9 @@ proc produceLoader(graph: ModuleGraph, m: Module, data: var DiscoveryData,
 
   let dest =
     if sym.kind in routineKinds:
-      toValue(env.procedures[sym], sym.typ)
+      toValue(env.procedures[sym], env.types.add(sym.typ))
     else:
-      toValue(env.globals[sym], sym.typ)
+      toValue(env.globals[sym], env.types.add(sym.typ))
 
   # the scope makes sure that locals are destroyed once loading the
   # procedure has finished
@@ -540,7 +535,7 @@ proc produceLoader(graph: ModuleGraph, m: Module, data: var DiscoveryData,
       bu.use tmp
       generateCode(graph, env, conf.tconfig, path, bu, result.source)
     bu.subTree mnkVoid:
-      bu.buildMagicCall mAsgnDynlibVar, voidTyp:
+      bu.buildMagicCall mAsgnDynlibVar, VoidType:
         bu.emitByName(dest, ekReassign)
         bu.emitByVal(tmp)
   else:
@@ -549,6 +544,7 @@ proc produceLoader(graph: ModuleGraph, m: Module, data: var DiscoveryData,
     let
       isNew = lib.name in env.globals
       libVar = env.globals.add(lib.name)
+      rtyp = env.types.add(loadProc.typ[0])
 
     if not isNew:
       # the library hasn't been loaded yet
@@ -557,13 +553,13 @@ proc produceLoader(graph: ModuleGraph, m: Module, data: var DiscoveryData,
         data.libs.add sym.annex
 
     # generate the code for ``sym = cast[typ](nimGetProcAddr(lib, extname))``
-    let tmp = bu.wrapTemp(loadProc.typ[0]):
-      bu.buildCall env.procedures.add(loadProc), loadProc.typ[0]:
-        bu.emitByVal toValue(libVar, lib.name.typ)
-        bu.emitByVal literal(env.getOrIncl(extname.strVal), extname.typ)
+    let tmp = bu.wrapTemp(rtyp):
+      bu.buildCall env.procedures.add(loadProc), rtyp:
+        bu.emitByVal toValue(libVar, env.types.add(lib.name.typ))
+        bu.emitByVal literal(env.getOrIncl(extname.strVal), CstringType)
 
     bu.subTree mnkVoid:
-      bu.buildMagicCall mAsgnDynlibVar, voidTyp:
+      bu.buildMagicCall mAsgnDynlibVar, VoidType:
         bu.emitByName(dest, ekReassign)
         bu.emitByVal tmp
 
diff --git a/compiler/backend/cgen.nim b/compiler/backend/cgen.nim
index 5d1cc9f408e..b7440c80ba5 100644
--- a/compiler/backend/cgen.nim
+++ b/compiler/backend/cgen.nim
@@ -500,7 +500,7 @@ proc localVarDecl(p: BProc; n: CgNode, decl: Local): Rope =
   if decl.alignment > 0:
     result.addf("NIM_ALIGN($1) ", [$decl.alignment])
 
-  result.add getTypeDesc(p.module, decl.typ)
+  result.add getTypeDesc(p.module, p.module.g.env[decl.typ])
   if true:
     if sfRegister in decl.flags: result.add(" register")
     if sfVolatile in decl.flags: result.add(" volatile")
diff --git a/compiler/backend/cgendata.nim b/compiler/backend/cgendata.nim
index 7fd0b6ace29..5f939582a67 100644
--- a/compiler/backend/cgendata.nim
+++ b/compiler/backend/cgendata.nim
@@ -310,7 +310,8 @@ proc newProc*(prc: PSym, module: BModule): BProc =
 
 proc newModuleList*(g: ModuleGraph): BModuleList =
   BModuleList(typeInfoMarker: initTable[SigHash, tuple[str: Rope, owner: int32]](),
-    config: g.config, graph: g, nimtvDeclared: initIntSet())
+    config: g.config, graph: g, nimtvDeclared: initIntSet(),
+    env: initMirEnv(g))
 
 iterator cgenModules*(g: BModuleList): BModule =
   for m in g.modulesClosed:
diff --git a/compiler/backend/cgirgen.nim b/compiler/backend/cgirgen.nim
index 6600ab3c83c..86c38ade5b2 100644
--- a/compiler/backend/cgirgen.nim
+++ b/compiler/backend/cgirgen.nim
@@ -30,6 +30,7 @@ import
     mirbodies,
     mirenv,
     mirtrees,
+    mirtypes,
     sourcemaps
   ],
   compiler/modules/[
@@ -56,8 +57,8 @@ type
     graph: ModuleGraph
     idgen: IdGenerator
     env: ptr MirEnv
-      ## read-only reference to the MirEnv. Stored here to prevent excessive
-      ## parameter passing
+      ## read/write reference to the MirEnv. Stored here to prevent excessive
+      ## parameter passing. Only the type environment is potentially modified
 
     owner: PSym
 
@@ -149,6 +150,9 @@ template `[]=`(x: CgNode, i: BackwardsIndex, n: CgNode) =
 template add(x: CgNode, y: CgNode) =
   x.kids.add y
 
+template map(cl: TranslateCl, id: TypeId): lent PType =
+  cl.env.types[id]
+
 proc copyTree(n: CgNode): CgNode =
   case n.kind
   of cnkAtoms:
@@ -253,43 +257,44 @@ proc convToIr(cl: TranslateCl, n: CgNode, info: TLineInfo, dest: PType): CgNode
     result = newOp(cnkLvalueConv, info, dest, n)
 
 proc atomToIr(n: MirNode, cl: TranslateCl, info: TLineInfo): CgNode =
+  let typ = cl.map(n.typ)
   case n.kind
   of mnkProcVal:
-    CgNode(kind: cnkProc, info: info, typ: n.typ, prc: n.prc)
+    CgNode(kind: cnkProc, info: info, typ: typ, prc: n.prc)
   of mnkGlobal:
-    CgNode(kind: cnkGlobal, info: info, typ: n.typ, global: n.global)
+    CgNode(kind: cnkGlobal, info: info, typ: typ, global: n.global)
   of mnkConst:
-    CgNode(kind: cnkConst, info: info, typ: n.typ, cnst: n.cnst)
+    CgNode(kind: cnkConst, info: info, typ: typ, cnst: n.cnst)
   of mnkLocal, mnkParam, mnkTemp:
-    newLocalRef(n.local, info, cl.locals[n.local].typ)
+    newLocalRef(n.local, info, cl.map(cl.locals[n.local].typ))
   of mnkAlias:
     # the type of the node doesn't match the real one
     let
       id = n.local
-      typ = cl.locals[id].typ
+      typ = cl.map(cl.locals[id].typ)
     # the view is auto-dereferenced here for convenience
     newOp(cnkDerefView, info, typ.base, newLocalRef(id, info, typ))
   of mnkNilLit:
-    CgNode(kind: cnkNilLit, info: info, typ: n.typ)
+    CgNode(kind: cnkNilLit, info: info, typ: typ)
   of mnkIntLit:
-    CgNode(kind: cnkIntLit, info: info, typ: n.typ,
+    CgNode(kind: cnkIntLit, info: info, typ: typ,
            intVal: cl.env[].getInt(n.number))
   of mnkUIntLit:
-    CgNode(kind: cnkUIntLit, info: info, typ: n.typ,
+    CgNode(kind: cnkUIntLit, info: info, typ: typ,
            intVal: cl.env[].getInt(n.number))
   of mnkFloatLit:
-    CgNode(kind: cnkFloatLit, info: info, typ: n.typ,
+    CgNode(kind: cnkFloatLit, info: info, typ: typ,
            floatVal: cl.env[].getFloat(n.number))
   of mnkStrLit:
-    CgNode(kind: cnkStrLit, info: info, typ: n.typ, strVal: n.strVal)
+    CgNode(kind: cnkStrLit, info: info, typ: typ, strVal: n.strVal)
   of mnkAstLit:
-    CgNode(kind: cnkAstLit, info: info, typ: n.typ, astLit: cl.env[][n.ast])
+    CgNode(kind: cnkAstLit, info: info, typ: typ, astLit: cl.env[][n.ast])
   of mnkType:
-    newTypeNode(info, n.typ)
+    newTypeNode(info, typ)
   of mnkNone:
     # type arguments do use `mnkNone` in some situtations, so keep
     # the type
-    CgNode(kind: cnkEmpty, info: info, typ: n.typ)
+    CgNode(kind: cnkEmpty, info: info, typ: typ)
   of AllNodeKinds - Atoms:
     unreachable("not an atom: " & $n.kind)
 
@@ -301,8 +306,8 @@ proc tbExceptItem(tree: MirBody, cl: var TranslateCl, cr: var TreeCursor
                  ): CgNode =
   let n {.cursor.} = get(tree, cr)
   case n.kind
-  of mnkLocal: newLocalRef(n.local, cr.info, n.typ)
-  of mnkType:  newTypeNode(cr.info, n.typ)
+  of mnkLocal: newLocalRef(n.local, cr.info, cl.map(n.typ))
+  of mnkType:  newTypeNode(cr.info, cl.map(n.typ))
   else:        unreachable()
 
 
@@ -314,7 +319,9 @@ proc lvalueToIr(tree: MirBody, cl: var TranslateCl, n: MirNode,
   ## context-dependent -- `preferField` disambiguates whether it should be
   ## turned into a field access rather than a (pseudo) access of the tagged
   ## union.
-  let info = cr.info
+  let
+    info = cr.info
+    typ = cl.map(n.typ)
 
   template recurse(): CgNode =
     lvalueToIr(tree, cl, tree.get(cr), cr, false)
@@ -324,7 +331,7 @@ proc lvalueToIr(tree: MirBody, cl: var TranslateCl, n: MirNode,
     return atomToIr(n, cl, info)
   of mnkPathNamed:
     let obj = recurse()
-    result = newExpr(cnkFieldAccess, info, n.typ,
+    result = newExpr(cnkFieldAccess, info, typ,
                      [obj, newFieldNode(lookupInType(obj.typ, n.field.int))])
   of mnkPathVariant:
     if preferField:
@@ -337,7 +344,7 @@ proc lvalueToIr(tree: MirBody, cl: var TranslateCl, n: MirNode,
       # variant access itself has no ``CgNode`` counterpart at the moment
       result = recurse()
   of mnkPathPos:
-    result = newExpr(cnkTupleAccess, info, n.typ,
+    result = newExpr(cnkTupleAccess, info, typ,
                      [recurse(),
                       CgNode(kind: cnkIntLit, intVal: n.position.BiggestInt)])
   of mnkPathArray:
@@ -350,14 +357,15 @@ proc lvalueToIr(tree: MirBody, cl: var TranslateCl, n: MirNode,
       else:
         recurse()
 
-    result = newExpr(cnkArrayAccess, info, n.typ, [arg, atomToIr(tree, cl, cr)])
+    result = newExpr(cnkArrayAccess, info, typ,
+                     [arg, atomToIr(tree, cl, cr)])
   of mnkPathConv:
-    result = convToIr(cl, recurse(), info, n.typ)
+    result = convToIr(cl, recurse(), info, typ)
   # dereferences are allowed at the end of a path tree
   of mnkDeref:
-    result = newOp(cnkDeref, info, n.typ, atomToIr(tree, cl, cr))
+    result = newOp(cnkDeref, info, typ, atomToIr(tree, cl, cr))
   of mnkDerefView:
-    result = newOp(cnkDerefView, info, n.typ, atomToIr(tree, cl, cr))
+    result = newOp(cnkDerefView, info, typ, atomToIr(tree, cl, cr))
   of AllNodeKinds - LvalueExprKinds - {mnkProcVal}:
     unreachable(n.kind)
 
@@ -419,7 +427,7 @@ proc callToIr(tree: MirBody, cl: var TranslateCl, n: MirNode,
   ## Translate a valid call-like tree to the CG IR.
   let info = cr.info
   result = newExpr((if n.kind == mnkCall: cnkCall else: cnkCheckedCall),
-                   info, n.typ)
+                   info, cl.map(n.typ))
   result.add calleeToIr(tree, cl, cr)
 
   # the code generators currently require some magics to not have any
@@ -474,28 +482,28 @@ proc defToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
   let
     entity {.cursor.} = get(tree, cr) # the name of the defined entity
     info = cr.info
+    typ {.cursor.} = cl.map(entity.typ)
 
   var def: CgNode
 
   case entity.kind
   of mnkLocal, mnkTemp:
     let id = entity.local
-    def = newLocalRef(id, info, cl.locals[id].typ)
+    def = newLocalRef(id, info, typ)
   of mnkParam:
     # ignore 'def's for parameters
     def = newEmpty()
   of mnkGlobal:
-    def = CgNode(kind: cnkGlobal, info: info, typ: entity.typ,
+    def = CgNode(kind: cnkGlobal, info: info, typ: typ,
                  global: entity.global)
   of mnkAlias:
     # MIR aliases are translated to var/lent views
     assert n.kind in {mnkBind, mnkBindMut}, "alias can only be defined by binds"
-    assert entity.typ != nil
     let
-      typ = makeVarType(cl.owner, entity.typ, cl.idgen,
+      typ = makeVarType(cl.owner, typ, cl.idgen,
                         if n.kind == mnkBind: tyLent else: tyVar)
     # override the original type
-    cl.locals[entity.local].typ = typ
+    cl.locals[entity.local].typ = cl.env.types.add(typ)
 
     def = newLocalRef(entity.local, info, typ)
   else:
@@ -957,12 +965,12 @@ proc exprToIr(tree: MirBody, cl: var TranslateCl,
   let info = cr.info
 
   template op(kind: CgNodeKind, e: CgNode): CgNode =
-    let r = newOp(kind, info, n.typ, e)
+    let r = newOp(kind, info, cl.map(n.typ), e)
     leave(tree, cr)
     r
 
   template treeOp(k: CgNodeKind, body: untyped): CgNode =
-    let res {.inject.} = newExpr(k, info, n.typ)
+    let res {.inject.} = newExpr(k, info, cl.map(n.typ))
     while tree[cr].kind != mnkEnd:
       body
     leave(tree, cr)
@@ -1003,9 +1011,10 @@ proc exprToIr(tree: MirBody, cl: var TranslateCl,
     treeOp cnkClosureConstr:
       res.add argToIr(tree, cl, cr)[1]
   of mnkObjConstr:
-    assert n.typ.skipTypes(abstractVarRange).kind in {tyObject, tyRef}
+    let typ = cl.map(n.typ)
+    assert typ.skipTypes(abstractVarRange).kind in {tyObject, tyRef}
     treeOp cnkObjConstr:
-      let f = newFieldNode(lookupInType(n.typ, get(tree, cr).field))
+      let f = newFieldNode(lookupInType(typ, get(tree, cr).field))
       res.add newTree(cnkBinding, cr.info, [f, argToIr(tree, cl, cr)[1]])
   of mnkCall:
     callToIr(tree, cl, n, cr)
@@ -1087,7 +1096,7 @@ proc tb(tree: MirBody, env: MirEnv, cl: var TranslateCl,
   result = newStmt(cnkStmtList, unknownLineInfo)
   result.kids = move stmts
 
-proc generateIR*(graph: ModuleGraph, idgen: IdGenerator, env: MirEnv,
+proc generateIR*(graph: ModuleGraph, idgen: IdGenerator, env: var MirEnv,
                  owner: PSym,
                  body: sink MirBody): Body =
   ## Generates the ``CgNode`` IR corresponding to the input MIR `body`,
diff --git a/compiler/backend/compat.nim b/compiler/backend/compat.nim
index 6360bf6f04d..72e299ce21f 100644
--- a/compiler/backend/compat.nim
+++ b/compiler/backend/compat.nim
@@ -24,7 +24,8 @@ import
   ],
   compiler/mir/[
     mirenv,
-    mirtrees
+    mirtrees,
+    mirtypes
   ],
   compiler/utils/[
     bitsets,
@@ -140,13 +141,17 @@ proc translate*(t: MirTree, env: MirEnv): CgNode =
   ## a ``CgNode`` tree. Obsolete once the code generators use the MIR
   ## directly.
   proc translateAux(t: MirTree, i: var int, env: MirEnv): CgNode =
+    let
+      n {.cursor.}   = t[i]
+      typ {.cursor.} = env[n.typ]
+
     template recurse(): CgNode =
       translateAux(t, i, env)
 
     template tree(k: CgNodeKind, body: untyped): CgNode =
       ## Convenience template for setting up the tree node and iterating the
       ## input node's child nodes.
-      let res {.inject.} = newExpr(k, unknownLineInfo, n.typ)
+      let res {.inject.} = newExpr(k, unknownLineInfo, typ)
       res.kids.newSeq(t[i - 1].len)
       for j in 0..<res.len:
         res.kids[j] = body
@@ -154,12 +159,11 @@ proc translate*(t: MirTree, env: MirEnv): CgNode =
       inc i # consume the end node
       res
 
-    let n {.cursor.} = t[i]
     inc i # advance to the first child node
     case n.kind
     of mnkObjConstr:
       tree cnkObjConstr:
-        let field = lookupInType(n.typ, t[i].field.int)
+        let field = lookupInType(typ, t[i].field.int)
         inc i # advance to the arg node
         CgNode(kind: cnkBinding, info: unknownLineInfo,
                kids: @[CgNode(kind: cnkField, field: field),
@@ -184,24 +188,24 @@ proc translate*(t: MirTree, env: MirEnv): CgNode =
       inc i # skip the end node
       x
     of mnkNilLit:
-      CgNode(kind: cnkNilLit, info: unknownLineInfo, typ: n.typ)
+      CgNode(kind: cnkNilLit, info: unknownLineInfo, typ: typ)
     of mnkIntLit:
-      CgNode(kind: cnkIntLit, info: unknownLineInfo, typ: n.typ,
+      CgNode(kind: cnkIntLit, info: unknownLineInfo, typ: typ,
              intVal: env.getInt(n.number))
     of mnkUIntLit:
-      CgNode(kind: cnkUIntLit, info: unknownLineInfo, typ: n.typ,
+      CgNode(kind: cnkUIntLit, info: unknownLineInfo, typ: typ,
              intVal: env.getInt(n.number))
     of mnkFloatLit:
-      CgNode(kind: cnkFloatLit, info: unknownLineInfo, typ: n.typ,
+      CgNode(kind: cnkFloatLit, info: unknownLineInfo, typ: typ,
              floatVal: env.getFloat(n.number))
     of mnkStrLit:
-      CgNode(kind: cnkStrLit, info: unknownLineInfo, typ: n.typ,
+      CgNode(kind: cnkStrLit, info: unknownLineInfo, typ: typ,
              strVal: n.strVal)
     of mnkAstLit:
-      CgNode(kind: cnkAstLit, info: unknownLineInfo, typ: n.typ,
+      CgNode(kind: cnkAstLit, info: unknownLineInfo, typ: typ,
              astLit: env[n.ast])
     of mnkProcVal:
-      CgNode(kind: cnkProc, info: unknownLineInfo, prc: n.prc, typ: n.typ)
+      CgNode(kind: cnkProc, info: unknownLineInfo, prc: n.prc, typ: typ)
     of AllNodeKinds - ConstrTreeNodes + {mnkEnd, mnkField}:
       # 'end' nodes are skipped manually
       unreachable(n.kind)
diff --git a/compiler/backend/jsbackend.nim b/compiler/backend/jsbackend.nim
index 6c3cc7e1dbd..522639afb50 100644
--- a/compiler/backend/jsbackend.nim
+++ b/compiler/backend/jsbackend.nim
@@ -121,7 +121,7 @@ proc generateCode*(graph: ModuleGraph, mlist: sink ModuleList) =
   ## Entry point into the JS backend. Generates the code for all modules and
   ## writes it to the output file.
   let
-    globals = newGlobals()
+    globals = newGlobals(graph)
     bconf = BackendConfig(tconfig: TranslationConfig(magicsToKeep: NonMagics))
 
   var
diff --git a/compiler/backend/jsgen.nim b/compiler/backend/jsgen.nim
index 4b2f294f25e..e636ffe2688 100644
--- a/compiler/backend/jsgen.nim
+++ b/compiler/backend/jsgen.nim
@@ -264,9 +264,8 @@ template endBlock(p: PProc, frmt: FormatStr = "}$n", args: varargs[Rope]) =
   dec p.extraIndent
   lineF(p, frmt, args)
 
-proc newGlobals*(): PGlobals =
-  new(result)
-  result.typeInfoGenerated = initIntSet()
+proc newGlobals*(g: ModuleGraph): PGlobals =
+  PGlobals(env: initMirEnv(g))
 
 proc rdLoc(a: TCompRes): Rope {.inline.} =
   if a.typ != etyBaseIndex:
@@ -1522,7 +1521,7 @@ proc setupLocalLoc(p: PProc, id: LocalId, kind: TSymKind; name = "") =
   ## computing the storage flags and a non-empty `name` overrides the
   ## mangled name.
   var loc = Loc(name: mangleName(p.fullBody[id], id),
-                typ: p.fullBody[id].typ,
+                typ: p.env[p.fullBody[id].typ],
                 storage: storage(p.fullBody[id].flags, kind,
                                  id in p.addrTaken))
 
diff --git a/compiler/front/scripting.nim b/compiler/front/scripting.nim
index 08f09bd5919..51cd5e9969d 100644
--- a/compiler/front/scripting.nim
+++ b/compiler/front/scripting.nim
@@ -45,7 +45,7 @@ import
   ]
 
 from compiler/vm/vmlegacy import legacyReportsVmTracer
-from compiler/vm/vmjit import registerCallback
+from compiler/vm/vmjit import registerCallback, initJit
 
 # we support 'cmpIgnoreStyle' natively for efficiency:
 from std/strutils import cmpIgnoreStyle, contains
@@ -225,7 +225,7 @@ proc runNimScript*(cache: IdentCache; scriptName: AbsoluteFile;
   #  during `setupVM`
   # - NimScript has access to the macro/compile-time APIs
   registerAdditionalOps(vm, disallowDanger)
-  graph.vm = PEvalContext(vm: vm)
+  graph.vm = PVmCtx(context: vm)
 
   graph.compileSystemModule()
   discard graph.processModule(m, idgen, stream)
diff --git a/compiler/mir/datatables.nim b/compiler/mir/datatables.nim
index 5d5391e9a37..d3e2636a782 100644
--- a/compiler/mir/datatables.nim
+++ b/compiler/mir/datatables.nim
@@ -5,10 +5,6 @@ import
   std/[
     hashes
   ],
-  compiler/ast/[
-    ast_types,
-    types
-  ],
   compiler/mir/[
     mirtrees
   ],
@@ -55,9 +51,7 @@ func hashTree(tree: ConstrTree): Hash =
   for _, it in tree.pairs:
     result = result !& hash(it)
 
-  # only hash the kind of the type. This trades more collisions for faster
-  # hashing
-  result = result !& hash(tree[0].typ.kind)
+  result = result !& hash(tree[0].typ)
   result = !$(result)
 
 proc cmp(a, b: ConstrTree): bool =
@@ -85,7 +79,7 @@ proc cmp(a, b: ConstrTree): bool =
     of AllNodeKinds - ConstrTreeNodes:
       unreachable(a.kind)
 
-  if not a[0].typ.sameBackendType(b[0].typ) or a.len != b.len:
+  if a[0].typ != b[0].typ or a.len != b.len:
     # the (backend-)type is different -> not the same constant expressions
     return false
 
diff --git a/compiler/mir/injecthooks.nim b/compiler/mir/injecthooks.nim
index 7991c478450..5fd03f8db13 100644
--- a/compiler/mir/injecthooks.nim
+++ b/compiler/mir/injecthooks.nim
@@ -22,10 +22,10 @@ import
     mirchangesets,
     mirconstr,
     mirenv,
-    mirtrees
+    mirtrees,
+    mirtypes
   ],
   compiler/modules/[
-    magicsys,
     modulegraphs
   ],
   compiler/sem/[
@@ -115,8 +115,8 @@ proc isUsedForSink(tree: MirTree, stmt: NodePosition): bool =
 
     inc n
 
-proc reportDiagnostics(g: ModuleGraph, body: MirBody,
-                       owner: PSym, diags: var seq[LocalDiag]) =
+proc reportDiagnostics(g: ModuleGraph, types: TypeEnv, body: MirBody,
+                       owner: PSym, diags: seq[LocalDiag]) =
   ## Reports all diagnostics in `diags` as ``SemReport``s and clear the list
   for diag in diags.items:
     let ast = body.sourceFor(diag.pos)
@@ -124,7 +124,7 @@ proc reportDiagnostics(g: ModuleGraph, body: MirBody,
       case diag.kind
       of ldkUnavailableTypeBound:
         SemReport(kind: rsemUnavailableTypeBound,
-                  typ: body[diag.pos].typ,
+                  typ: types[body[diag.pos].typ],
                   str: AttachedOpToStr[diag.op],
                   ast: ast,
                   sym: owner)
@@ -151,17 +151,17 @@ template genCopy(bu: var MirBuilder, graph: ModuleGraph, env: var MirEnv,
       src
 
     if graph.config.selectedGC == gcOrc and
-       cyclicType(tree[dst].typ.skipTypes(skipAliases + {tyDistinct}), graph):
+       cyclicType(env[tree[dst].typ].skipTypes(skipAliases + {tyDistinct}),
+                  graph):
       # pass whether the copy can potentially introduce cycles as the third
       # parameter:
       let c = maybeCyclic and couldIntroduceCycle(tree, dest)
-      bu.emitByVal literal(mnkIntLit, env.getOrIncl(BiggestInt(c)),
-                           graph.getSysType(unknownLineInfo, tyBool))
+      bu.emitByVal literal(mnkIntLit, env.getOrIncl(BiggestInt(c)), BoolType)
 
 proc genDestroy*(bu: var MirBuilder, graph: ModuleGraph, env: var MirEnv,
                  target: Value) =
   ## Emits a destructor call with `target` as the argument.
-  let destr = getOp(graph, target.typ, attachedDestructor)
+  let destr = getOp(graph, env[target.typ], attachedDestructor)
   bu.buildVoidCall(env, destr):
     bu.emitByName(target, ekMutate)
 
@@ -179,14 +179,14 @@ proc injectHooks*(body: MirBody, graph: ModuleGraph, env: var MirEnv,
         stmt = tree.parent(i)
         typ  = tree[stmt, 0].typ
 
-      if not hasDestructor(typ):
+      if not hasDestructor(env[typ]):
         # nothing to insert
         continue
 
       let
         dest = tree.child(stmt, 0)
         src  = tree.child(i, 0)
-        op   = getOp(graph, typ, attachedAsgn)
+        op   = getOp(graph, env[typ], attachedAsgn)
 
       if sfError in op.flags:
         # emit an error if the hook is not available, but still continue
@@ -234,7 +234,7 @@ proc injectHooks*(body: MirBody, graph: ModuleGraph, env: var MirEnv,
         stmt = tree.parent(i)
         typ  = tree[stmt, 0].typ
 
-      if not hasDestructor(typ) or
+      if not hasDestructor(env[typ]) or
          tree[stmt].kind in {mnkDef, mnkDefUnpack, mnkInit}:
         # nothing to do if:
         # * the type has no hooks
@@ -244,7 +244,7 @@ proc injectHooks*(body: MirBody, graph: ModuleGraph, env: var MirEnv,
       let
         dest = tree.child(stmt, 0)
         src  = tree.child(i, 0)
-        op   = getOp(graph, typ, attachedSink)
+        op   = getOp(graph, env[typ], attachedSink)
 
       # note: the move analyzer has to make sure that the source operand
       # doesn't overlap with the destination, so no temporary for the source is
@@ -272,7 +272,7 @@ proc injectHooks*(body: MirBody, graph: ModuleGraph, env: var MirEnv,
           bu.use loc
 
     of mnkDestroy:
-      let destr = getOp(graph, tree[tree.operand(i)].typ, attachedDestructor)
+      let destr = getOp(graph, env[tree[tree.operand(i)].typ], attachedDestructor)
       changes.replaceMulti(tree, i, bu):
         bu.buildVoidCall(env, destr):
           # XXX: the by-name passing and usage of ``ekMutate`` is not really
@@ -288,7 +288,7 @@ proc injectHooks*(body: MirBody, graph: ModuleGraph, env: var MirEnv,
       discard "nothing to do"
 
   # turn the collected diagnostics into reports and report them:
-  reportDiagnostics(graph, body, owner, diags)
+  reportDiagnostics(graph, env.types, body, owner, diags)
 
 proc injectHooks*(body: var MirBody, graph: ModuleGraph, env: var MirEnv,
                   owner: PSym) =
diff --git a/compiler/mir/mirbodies.nim b/compiler/mir/mirbodies.nim
index a6cac04050d..1105b95b1ae 100644
--- a/compiler/mir/mirbodies.nim
+++ b/compiler/mir/mirbodies.nim
@@ -17,7 +17,7 @@ type
   Local* = object
     ## Static information about a local location ('let' or 'var'). Not modified
     ## after initialization.
-    typ*: PType
+    typ*: TypeId
       ## type of the local
     alignment*: uint32
       ## alignment of the location, measured in bytes. 0 means "use default"
diff --git a/compiler/mir/mirconstr.nim b/compiler/mir/mirconstr.nim
index 47eda209e64..bba849668f6 100644
--- a/compiler/mir/mirconstr.nim
+++ b/compiler/mir/mirconstr.nim
@@ -28,7 +28,7 @@ type
   Fragment* = object
     ## Identifies a fragment (usually a sub-tree) within the staging buffer.
     s: NodeSlice
-    typ*: PType
+    typ*: TypeId
 
   MirBuffer = object
     ## Accumulates in-progress MIR code and keeps track of additional state
@@ -61,7 +61,7 @@ type
     #      with changesets to work, but future refactorings should focus
     #      on making them hidden
 
-func typ*(val: Value): PType =
+func typ*(val: Value): TypeId =
   assert val.node.kind != mnkNone, "uninitialized"
   val.node.typ
 
@@ -72,36 +72,36 @@ func endNode*(k: MirNodeKind): MirNode {.inline.} =
   assert k in SubTreeNodes
   MirNode(kind: mnkEnd, start: k)
 
-func typeLit*(t: PType): Value =
+func typeLit*(t: TypeId): Value =
   Value(node: MirNode(kind: mnkType, typ: t))
 
 func literal*(kind: range[mnkIntLit..mnkFloatLit], n: NumberId,
-              typ: PType): Value =
+              typ: TypeId): Value =
   Value(node: MirNode(kind: kind, typ: typ, number: n))
 
-func literal*(str: StringId, typ: PType): Value =
+func literal*(str: StringId, typ: TypeId): Value =
   Value(node: MirNode(kind: mnkStrLit, typ: typ, strVal: str))
 
-func literal*(ast: AstId, typ: PType): Value =
+func literal*(ast: AstId, typ: TypeId): Value =
   Value(node: MirNode(kind: mnkAstLit, typ: typ, ast: ast))
 
-func temp*(typ: PType, id: LocalId): Value =
+func temp*(typ: TypeId, id: LocalId): Value =
   Value(node: MirNode(kind: mnkTemp, typ: typ, local: id))
 
-func alias*(typ: PType, id: LocalId): Value =
+func alias*(typ: TypeId, id: LocalId): Value =
   Value(node: MirNode(kind: mnkAlias, typ: typ, local: id))
 
-func toValue*(id: ConstId, typ: PType): Value =
+func toValue*(id: ConstId, typ: TypeId): Value =
   Value(node: MirNode(kind: mnkConst, typ: typ, cnst: id))
 
-func toValue*(id: GlobalId, typ: PType): Value =
+func toValue*(id: GlobalId, typ: TypeId): Value =
   Value(node: MirNode(kind: mnkGlobal, typ: typ, global: id))
 
-func toValue*(id: ProcedureId, typ: PType): Value =
+func toValue*(id: ProcedureId, typ: TypeId): Value =
   Value(node: MirNode(kind: mnkProcVal, typ: typ, prc: id))
 
 func toValue*(kind: range[mnkParam..mnkLocal], id: LocalId,
-              typ: PType): Value =
+              typ: TypeId): Value =
   Value(node: MirNode(kind: kind, typ: typ, local: id))
 
 # --------- MirBuffer interface ----------
@@ -196,7 +196,7 @@ template push*(bu: var MirBuilder, body: untyped): Fragment =
            typ: if start < bu.staging.len:
                   bu.staging[start].typ
                 else:
-                  nil)
+                  VoidType)
 
 func pop*(bu: var MirBuilder, f: Fragment) =
   ## Moves the expression/statement identified by `v` from the top of the
@@ -302,7 +302,7 @@ template scope*(bu: var MirBuilder, body: untyped) =
   bu.subTree MirNode(kind: mnkScope):
     body
 
-func allocTemp(bu: MirBuilder, t: PType; id: LocalId, alias: bool): Value =
+func allocTemp(bu: MirBuilder, t: TypeId; id: LocalId, alias: bool): Value =
   ## Allocates a new temporary or alias and returns it.
   let kind = if alias: mnkAlias
              else:     mnkTemp
@@ -310,7 +310,7 @@ func allocTemp(bu: MirBuilder, t: PType; id: LocalId, alias: bool): Value =
     result = Value(node: MirNode(kind: kind, typ: t, local: id),
                    info: someOpt bu.currentSourceId)
 
-template allocTemp*(bu: var MirBuilder, t: PType, alias = false): Value =
+template allocTemp*(bu: var MirBuilder, t: TypeId, alias = false): Value =
   # XXX: the only purpose of this is to work around a ``strictFuncs`` bug
   let id = bu.addLocal(Local(typ: t))
   allocTemp(bu, t, id, alias)
@@ -322,7 +322,7 @@ func use*(bu: var MirBuilder, val: sink Value) {.inline.} =
   else:
     bu.add val.node
 
-template wrapTemp*(bu: var MirBuilder, t: PType,
+template wrapTemp*(bu: var MirBuilder, t: TypeId,
                   body: untyped): Value =
   ## Emits a definition of a temporary with `body` as the initializer
   ## expression.
@@ -332,7 +332,7 @@ template wrapTemp*(bu: var MirBuilder, t: PType,
     body
   val
 
-template wrapAlias*(bu: var MirBuilder, t: PType, body: untyped): Value =
+template wrapAlias*(bu: var MirBuilder, t: TypeId, body: untyped): Value =
   ## Emits an ``mnkBind`` statement with `body` as the lvalue expression.
   ## Returns the name of the alias.
   let val = allocTemp(bu, t, true)
@@ -341,7 +341,7 @@ template wrapAlias*(bu: var MirBuilder, t: PType, body: untyped): Value =
     body
   val
 
-template wrapMutAlias*(bu: var MirBuilder, t: PType, body: untyped): Value =
+template wrapMutAlias*(bu: var MirBuilder, t: TypeId, body: untyped): Value =
   ## Emits a ``mnkBindMut`` statement with `body` as the lvalue expression.
   ## Returns the name of the alias.
   let val = allocTemp(bu, t, true)
@@ -350,13 +350,13 @@ template wrapMutAlias*(bu: var MirBuilder, t: PType, body: untyped): Value =
     body
   val
 
-template buildMagicCall*(bu: var MirBuilder, m: TMagic, t: PType,
+template buildMagicCall*(bu: var MirBuilder, m: TMagic, t: TypeId,
                          body: untyped) =
   bu.subTree MirNode(kind: mnkCall, typ: t):
     bu.add MirNode(kind: mnkMagic, magic: m)
     body
 
-template buildCall*(bu: var MirBuilder, prc: ProcedureId, t: PType,
+template buildCall*(bu: var MirBuilder, prc: ProcedureId, t: TypeId,
                     body: untyped) =
   ## Build and emits a call tree to the active buffer. `pt` is the type of the
   ## procedure.
diff --git a/compiler/mir/mirenv.nim b/compiler/mir/mirenv.nim
index 9cf1f43f09d..e5456fa3d4b 100644
--- a/compiler/mir/mirenv.nim
+++ b/compiler/mir/mirenv.nim
@@ -12,7 +12,11 @@ import
   ],
   compiler/mir/[
     datatables,
-    mirtrees
+    mirtrees,
+    mirtypes
+  ],
+  compiler/modules/[
+    modulegraphs
   ],
   compiler/ic/[
     bitabs
@@ -42,6 +46,8 @@ type
     globals*:    SymbolTable[GlobalId, PSym]
       ## includes both normal globals and threadvars
     procedures*: SymbolTable[ProcedureId, PSym]
+    types*: TypeEnv
+      ## the type environment
 
     numbers*: BiTable[BiggestInt]
       ## all numerical values referenced by the MIR, stored as bit patterns
@@ -102,6 +108,9 @@ func checkpoint*[I, T](tab: SymbolTable[I, T]): Checkpoint =
 
 # ------- MirEnv API --------
 
+proc initMirEnv*(g: ModuleGraph): MirEnv =
+  MirEnv(types: initTypeEnv(g))
+
 func `[]`*(env: MirEnv, id: ConstId): lent PSym {.inline.} =
   env.constants.data[id]
 
@@ -138,6 +147,9 @@ func getOrIncl*(env: var MirEnv, str: string): StringId {.inline.} =
   ## If not registered already, adds `str` to the environment.
   StringId env.strings.getOrIncl(str)
 
+template `[]`*(env: MirEnv, id: TypeId): PType =
+  env.types[id]
+
 func setData*(env: var MirEnv, id: ConstId, data: DataId) =
   ## Sets the body for the constant identified by `id`.
   synchronize(env.bodies, env.constants.data)
diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index 69a8415f7a4..1000586c2be 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -66,7 +66,6 @@ import
     ast,
     astalgo,
     astmsgs, # for generating the field error message
-    lineinfos,
     trees,
     types,
     wordrecg
@@ -77,6 +76,7 @@ import
     mirconstr,
     mirenv,
     mirtrees,
+    mirtypes,
     proto_mir,
     sourcemaps
   ],
@@ -219,15 +219,10 @@ func initDestination(v: sink Value, isFirst, sink: bool): Destination =
 
   Destination(isSome: true, val: v, flags: flags)
 
-proc typeOrVoid(g: ModuleGraph, t: PType): PType =
-  ## Returns `t` if it's not 'nil' - the ``void`` type otherwise
-  if t != nil: t
-  else:        g.getSysType(unknownLineInfo, tyVoid)
-
-proc typeOrVoid(c: TCtx, t: PType): PType {.inline.} =
-  ## Returns `t` if it's not 'nil' - the ``void`` type otherwise
-  # TODO: cache the void type
-  typeOrVoid(c.graph, t)
+proc typeToMir(c: var TCtx, t: PType): TypeId =
+  ## Turns `t` into a MIR type and returns the latter's ID.
+  if t.isNil: VoidType
+  else:       c.env.types.add(t)
 
 func nextLabel(c: var TCtx): LabelId =
   result = LabelId(c.numLabels)
@@ -257,8 +252,9 @@ template useSource(bu: var MirBuilder, sp: var SourceProvider,
 
 # -------------- Symbol translation --------------
 
-func localToMir(s: PSym): Local =
-  Local(typ: s.typ, flags: s.flags,
+func localToMir(c: var TCtx, s: PSym): Local =
+  Local(typ: c.env.types.add(s.typ),
+        flags: s.flags,
         isImmutable: s.kind in {skLet, skForVar},
         name: s.name,
         alignment:
@@ -268,8 +264,8 @@ func localToMir(s: PSym): Local =
             0
         )
 
-template paramToMir(s: PSym): Local =
-  localToMir(s)
+template paramToMir(c: var TCtx, s: PSym): Local =
+  localToMir(c, s)
 
 # -------------- builder/convenience routines -------------
 
@@ -310,41 +306,42 @@ func addLocal(c: var TCtx, s: PSym): LocalId =
   ## Translates `s` to its MIR representation, registers it with body, and
   ## establishes a mapping.
   assert s.id notin c.localsMap
-  result = c.addLocal(localToMir(s))
+  result = c.addLocal(localToMir(c, s))
   c.localsMap[s.id] = result
 
 proc empty(c: var TCtx, n: PNode): MirNode =
-  MirNode(kind: mnkNone, typ: n.typ)
+  MirNode(kind: mnkNone, typ: c.typeToMir(n.typ))
 
-func intLiteral(env: var MirEnv, val: BiggestInt, typ: PType): Value =
+func intLiteral(env: var MirEnv, val: BiggestInt, typ: TypeId): Value =
   literal(mnkIntLit, env.getOrIncl(val), typ)
 
-func uintLiteral(env: var MirEnv, val: BiggestUInt, typ: PType): Value =
+func uintLiteral(env: var MirEnv, val: BiggestUInt, typ: TypeId): Value =
   literal(mnkUIntLit, env.getOrIncl(val), typ)
 
-func floatLiteral(env: var MirEnv, val: BiggestFloat, typ: PType): Value =
+func floatLiteral(env: var MirEnv, val: BiggestFloat, typ: TypeId): Value =
   literal(mnkFloatLit, env.getOrIncl(val), typ)
 
 func astLiteral(env: var MirEnv, val: PNode, typ: PType): Value =
-  literal(env.asts.add(val), typ)
+  literal(env.asts.add(val), env.types.add(typ))
 
 proc toIntLiteral(env: var MirEnv, val: Int128, typ: PType): Value =
   ## Interprets `val` based on `typ`.
   if isUnsigned(typ):
-    uintLiteral(env, val.toUInt, typ)
+    uintLiteral(env, val.toUInt, env.types.add(typ))
   else:
-    intLiteral(env, val.toInt, typ)
+    intLiteral(env, val.toInt, env.types.add(typ))
 
 proc toIntLiteral(env: var MirEnv, n: PNode): Value =
   ## Translates an integer value (represented by `n`) to its MIR
   ## counterpart.
   assert n.kind in nkIntLiterals
+  let typ = env.types.add(n.typ)
   # use the type for deciding what whether it's a signed or unsigned value
   case n.typ.skipTypes(abstractRange + {tyEnum}).kind
   of tyInt..tyInt64, tyBool:
-    intLiteral(env, n.intVal, n.typ)
+    intLiteral(env, n.intVal, typ)
   of tyUInt..tyUInt64, tyChar, tyPtr, tyPointer, tyProc:
-    uintLiteral(env, cast[BiggestUInt](n.intVal), n.typ)
+    uintLiteral(env, cast[BiggestUInt](n.intVal), typ)
   else:
     unreachable()
 
@@ -363,28 +360,29 @@ proc toFloatLiteral(env: var MirEnv, n: PNode): Value =
   else:
     unreachable()
 
-  floatLiteral(env, val, n.typ)
+  floatLiteral(env, val, env.types.add(n.typ))
 
-func strLiteral(env: var MirEnv, str: string, typ: PType): Value =
+func strLiteral(env: var MirEnv, str: string, typ: TypeId): Value =
   literal(env.getOrIncl(str), typ)
 
 func nameNode(c: var TCtx, s: PSym): MirNode =
+  let t = c.typeToMir(s.typ)
   case s.kind
   of skTemp:
     # temporaries are always locals, even if marked with the ``sfGlobal``
     # flag
-    MirNode(kind: mnkLocal, typ: s.typ, local: c.localsMap[s.id])
+    MirNode(kind: mnkLocal, typ: t, local: c.localsMap[s.id])
   of skConst:
-    MirNode(kind: mnkConst, typ: s.typ, cnst: c.env.constants.add(s))
+    MirNode(kind: mnkConst, typ: t, cnst: c.env.constants.add(s))
   of skParam:
-    MirNode(kind: mnkParam, typ: s.typ, local: LocalId(1 + s.position))
+    MirNode(kind: mnkParam, typ: t, local: LocalId(1 + s.position))
   of skResult:
-    MirNode(kind: mnkLocal, typ: s.typ, local: resultId)
+    MirNode(kind: mnkLocal, typ: t, local: resultId)
   of skVar, skLet, skForVar:
     if sfGlobal in s.flags:
-      MirNode(kind: mnkGlobal, typ: s.typ, global: c.env.globals.add(s))
+      MirNode(kind: mnkGlobal, typ: t, global: c.env.globals.add(s))
     else:
-      MirNode(kind: mnkLocal, typ: s.typ, local: c.localsMap[s.id])
+      MirNode(kind: mnkLocal, typ: t, local: c.localsMap[s.id])
   else:
     unreachable(s.kind)
 
@@ -392,7 +390,7 @@ func genLocation(c: var TCtx, n: PNode): Value =
   let f = c.builder.push: c.builder.add(nameNode(c, n.sym))
   c.builder.popSingle(f)
 
-template allocTemp(c: var TCtx, typ: PType; alias=false): Value =
+template allocTemp(c: var TCtx, typ: TypeId; alias=false): Value =
   ## Allocates a new ID for a temporary and returns the name.
   c.builder.allocTemp(typ, alias)
 
@@ -411,10 +409,10 @@ proc genx(c: var TCtx, n: PNode; consume: bool = false) =
   let e = exprToPmir(c, n, consume, false)
   genx(c, e, e.high)
 
-func getTemp(c: var TCtx, typ: PType): Value =
+func getTemp(c: var TCtx, typ: TypeId): Value =
   ## Allocates a new temporary and emits a definition for it into the
   ## final buffer.
-  assert typ != nil
+  assert typ != VoidType
   result = c.allocTemp(typ)
   withFront c.builder:
     c.subTree mnkDef:
@@ -424,16 +422,16 @@ func getTemp(c: var TCtx, typ: PType): Value =
 template buildStmt(c: var TCtx, k: MirNodeKind, body: untyped) =
   c.builder.buildStmt(k, body)
 
-template buildMagicCall(c: var TCtx, m: TMagic, t: PType, body: untyped) =
+template buildMagicCall(c: var TCtx, m: TMagic, t: TypeId, body: untyped) =
   c.builder.buildMagicCall(m, t, body)
 
-template buildCheckedMagicCall(c: var TCtx, m: TMagic, t: PType,
+template buildCheckedMagicCall(c: var TCtx, m: TMagic, t: TypeId,
                                body: untyped) =
   c.subTree MirNode(kind: mnkCheckedCall, typ: t):
     c.add MirNode(kind: mnkMagic, magic: m)
     body
 
-template buildDefectMagicCall(c: var TCtx, m: TMagic, t: PType,
+template buildDefectMagicCall(c: var TCtx, m: TMagic, t: TypeId,
                               body: untyped) =
   ## Builds and emits a call to the `m` magic with return type `t`. The call
   ## is only marked as potentially raising if panics are not enabled.
@@ -466,7 +464,7 @@ proc toValue(c: var TCtx, e: PMirExpr, i: int, def: MirNodeKind): Value =
     result = c.builder.popSingle(f)
   else:
     # needs a temporary
-    result = c.allocTemp(e[i].typ, def in {mnkBind, mnkBindMut})
+    result = c.allocTemp(c.typeToMir(e[i].typ), def in {mnkBind, mnkBindMut})
     withFront c.builder:
       c.subTree def:
         c.use result
@@ -512,20 +510,18 @@ proc genOperand(c: var TCtx, n: PNode) =
   wantValue(e)
   genx(c, e, e.high)
 
-proc genOp(c: var TCtx, k: MirNodeKind, t: PType, n: PNode) =
-  assert t != nil
+proc genOp(c: var TCtx, k: MirNodeKind, t: TypeId, n: PNode) =
   c.subTree MirNode(kind: k, typ: t):
     genOperand(c, n)
 
-template buildOp(c: var TCtx, k: MirNodeKind, t: PType, body: untyped) =
-  assert t != nil
+template buildOp(c: var TCtx, k: MirNodeKind, t: TypeId, body: untyped) =
   c.subTree MirNode(kind: k, typ: t):
     body
 
-template wrapTemp(c: var TCtx, t: PType, body: untyped): Value =
+template wrapTemp(c: var TCtx, t: TypeId, body: untyped): Value =
   ## Assigns the expression emitted by `body` to a temporary and
   ## returns the name of the latter.
-  assert t != nil
+  assert t != VoidType
   let res = c.allocTemp(t)
   c.buildStmt mnkDef:
     c.use res
@@ -533,14 +529,14 @@ template wrapTemp(c: var TCtx, t: PType, body: untyped): Value =
 
   res
 
-template wrapAndUse(c: var TCtx, t: PType, body: untyped) =
+template wrapAndUse(c: var TCtx, t: TypeId, body: untyped) =
   ## Assigns the expression emitted by `body` to a temporary
   ## and immediately emits a use thereof.
   let tmp = c.wrapTemp(t):
     body
   c.use tmp
 
-template buildTree(c: var TCtx, k: MirNodeKind, t: PType, body: untyped) =
+template buildTree(c: var TCtx, k: MirNodeKind, t: TypeId, body: untyped) =
   c.subTree MirNode(kind: k, typ: t):
     body
 
@@ -569,8 +565,8 @@ proc genAndOr(c: var TCtx, n: PNode, dest: Destination) =
   # condition:
   var v = dest.val
   if n[0].sym.magic == mOr:
-    v = c.wrapTemp n.typ:
-      c.buildMagicCall mNot, n.typ:
+    v = c.wrapTemp BoolType:
+      c.buildMagicCall mNot, BoolType:
         c.emitByVal v
 
   c.subTree mnkIf:
@@ -585,19 +581,19 @@ proc genFieldCheck(c: var TCtx, access: Value, call: PNode, inverted: bool,
     conf = c.graph.config
     discr = call[2].sym
   c.buildStmt mnkVoid:
-    c.buildDefectMagicCall mChckField, typeOrVoid(c, nil):
+    c.buildDefectMagicCall mChckField, VoidType:
       # set operand:
       c.emitByVal c.genRd(call[1])
       # discriminator value operand:
       c.subTree mnkArg:
-        c.subTree MirNode(kind: mnkPathNamed, typ: discr.typ,
+        c.subTree MirNode(kind: mnkPathNamed, typ: c.typeToMir(discr.typ),
                           field: discr.position.int32):
           c.use access
       # inverted flag:
-      c.emitByVal intLiteral(c.env, ord(inverted), call.typ)
+      c.emitByVal intLiteral(c.env, ord(inverted), BoolType)
       # error message operand:
       c.emitByVal strLiteral(c.env, genFieldDefect(conf, field, discr),
-                             c.graph.getSysType(call.info, tyString))
+                             StringType)
 
 proc genCheckedVariantAccess(c: var TCtx, variant: Value, name: PIdent,
                              check: PNode): PSym =
@@ -632,7 +628,7 @@ proc genTypeExpr(c: var TCtx, n: PNode): Value =
   of nkSym:
     case n.sym.kind
     of skType:
-      typeLit(n.sym.typ)
+      typeLit c.typeToMir(n.sym.typ)
     of skVar, skLet, skForVar, skTemp, skParam:
       # a first-class type value stored in a location
       genLocation(c, n)
@@ -640,12 +636,12 @@ proc genTypeExpr(c: var TCtx, n: PNode): Value =
       unreachable()
   of nkBracketExpr:
     # the type description of a generic type, e.g. ``seq[int]``
-    typeLit(n.typ)
+    typeLit c.typeToMir(n.typ)
   of nkTupleTy, nkStaticTy, nkRefTy, nkPtrTy, nkVarTy, nkDistinctTy, nkProcTy,
      nkIteratorTy, nkSharedTy, nkTupleConstr:
-    typeLit(n.typ)
+    typeLit c.typeToMir(n.typ)
   of nkTypeOfExpr, nkType:
-    typeLit(n.typ)
+    typeLit c.typeToMir(n.typ)
   else:
     unreachable("not a type expression")
 
@@ -732,7 +728,7 @@ proc genArgs(c: var TCtx, n: PNode) =
       if n[i].typ.kind == tyTypeDesc:
         c.emitByVal genTypeExpr(c, n[i])
       else:
-        c.emitByVal typeLit(n[i].typ)
+        c.emitByVal typeLit(c.typeToMir(n[i].typ))
     elif t.isCompileTimeOnly:
       # don't translate arguments to compile-time-only parameters. To ease the
       # translation to ``CgNode``, we don't omit them completely but only
@@ -773,7 +769,7 @@ proc genCall(c: var TCtx, n: PNode) =
   if tfNoSideEffect notin fntyp.flags:
     effects.incl geMutateGlobal
 
-  c.subTree MirNode(kind: kind, typ: typeOrVoid(c, fntyp[0]),
+  c.subTree MirNode(kind: kind, typ: c.typeToMir(fntyp[0]),
                     effects: effects):
     genCallee(c, n[0])
     genArgs(c, n)
@@ -788,7 +784,7 @@ proc genMacroCallArgs(c: var TCtx, n: PNode, kind: TSymKind, fntyp: PType) =
     genCallee(c, n[1])
   of skTemplate:
     # for late template invocations, the callee template is an argument
-    c.emitByVal astLiteral(c.env, n[1], n[1].typ)
+    c.emitByVal literal(c.env.asts.add(n[1]), VoidType)
   else:
     unreachable(kind)
 
@@ -829,7 +825,7 @@ proc genInSetOp(c: var TCtx, n: PNode) =
       x  = n[2]
       elemTyp = x.typ.skipTypes(abstractRange)
       leOp = getMagicLeForType(elemTyp) # less-equal op
-      res = getTemp(c, n.typ) # the temporary to write the result to
+      res = getTemp(c, BoolType) # the temporary to write the result to
 
     # the evaluation order is reversed here: the second operand comes
     # first
@@ -840,22 +836,22 @@ proc genInSetOp(c: var TCtx, n: PNode) =
 
     c.buildStmt mnkIf:
       # condition: ``a <= x:``
-      c.wrapAndUse(n.typ):
-        c.buildMagicCall leOp, n.typ:
+      c.wrapAndUse(BoolType):
+        c.buildMagicCall leOp, BoolType:
           c.emitByVal a
           c.emitByVal val
       # the outer body:
       c.subTree mnkStmtList:
         # condition: ``x <= b:``
         c.subTree mnkIf:
-          c.wrapAndUse(n.typ):
-            c.buildMagicCall leOp, n.typ:
+          c.wrapAndUse(BoolType):
+            c.buildMagicCall leOp, BoolType:
               c.emitByVal val
               c.emitByVal b
           c.subTree mnkStmtList:
             var sv: Value
             if se.kind == nkCurly and not isDeepConstExpr(se):
-              sv = c.allocTemp(se.typ)
+              sv = c.allocTemp(c.typeToMir(se.typ))
               c.subTree mnkDef:
                 c.use sv
                 genSetConstr(c, se)
@@ -864,7 +860,7 @@ proc genInSetOp(c: var TCtx, n: PNode) =
 
             c.subTree mnkInit:
               c.use res
-              c.buildMagicCall mInSet, n.typ:
+              c.buildMagicCall mInSet, BoolType:
                 c.emitByVal sv
                 c.emitByVal val
 
@@ -887,21 +883,22 @@ proc genMagic(c: var TCtx, n: PNode; m: TMagic) =
   template arg(n: PNode) =
     c.emitOperandTree n, false
 
+  let rtyp = c.typeToMir(n.typ) ## call's return type
   case m
   of mAnd, mOr:
-    let tmp = getTemp(c, n.typ)
+    let tmp = getTemp(c, rtyp)
     withFront c.builder:
       genAndOr(c, n, Destination(isSome: true, val: tmp, flags: {dfOwns}))
     c.use tmp
   of mDefault:
     # use the canonical form:
-    c.buildMagicCall mDefault, n.typ:
+    c.buildMagicCall mDefault, rtyp:
       discard
   of mNew:
     # ``new`` has 2 variants. The standard one with zero arguments, and the
     # unsafe version that takes a ``size`` argument
     assert n.len == 1 or n.len == 2
-    c.buildMagicCall m, typeOrVoid(c, n.typ):
+    c.buildMagicCall m, rtyp:
       if n.len == 2:
         # the size argument
         arg n[1]
@@ -909,13 +906,13 @@ proc genMagic(c: var TCtx, n: PNode; m: TMagic) =
   of mWasMoved:
     # ``wasMoved`` has an effect that is not encoded by the parameter's type
     # (it kills the location), so we need to manually translate it
-    c.buildMagicCall m, typeOrVoid(c, n.typ):
+    c.buildMagicCall m, VoidType:
       c.emitByName ekKill, genLvalueOperand(c, n[1])
   of mConStrStr:
     # the `mConStrStr` magic is very special. Nested calls to it are flattened
     # into a single call in ``transf``. It can't be passed on to ``genCall``
     # since the number of arguments doesn't match with the number of parameters
-    c.buildMagicCall m, n.typ:
+    c.buildMagicCall m, rtyp:
       for i in 1..<n.len:
         arg n[i]
   of mInSet:
@@ -924,16 +921,16 @@ proc genMagic(c: var TCtx, n: PNode; m: TMagic) =
     # forward the wrapped arguments to the call; don't emit the intermediate array
     let x = n[1].skipConv
     assert x.kind == nkBracket
-    c.buildCheckedMagicCall m, typeOrVoid(c, n.typ):
+    c.buildCheckedMagicCall m, rtyp:
       # for the convenience of later transformations, the type of the would-be
       # array is passed along as the first argument
       if x.len > 0:
-        c.emitByVal typeLit(x.typ)
+        c.emitByVal typeLit(c.typeToMir(x.typ))
       for it in x.items:
         arg it
   of mOffsetOf:
     # an offsetOf call that has to be evaluated by the backend
-    c.buildMagicCall mOffsetOf, n.typ:
+    c.buildMagicCall mOffsetOf, rtyp:
       c.subTree mnkName:
         # prevent all checks and make sure that the original lvalue
         # expression reaches the code generators
@@ -952,35 +949,36 @@ proc genMagic(c: var TCtx, n: PNode; m: TMagic) =
     if optOverflowCheck in c.userOptions:
       const Map = [mAddI: mAddI, mSubI, mMulI, mDivI, mModI,
                    mSucc: mAddI, mPred: mSubI]
-      c.buildDefectMagicCall Map[m], n.typ:
+      c.buildDefectMagicCall Map[m], rtyp:
         arg n[1]
         arg n[2]
     else:
       const Map = [mAddI: mnkAdd, mSubI: mnkSub,
                    mMulI: mnkMul, mDivI: mnkDiv, mModI: mnkModI,
                    mSucc: mnkAdd, mPred: mnkSub]
-      c.buildTree Map[m], n.typ:
+      c.buildTree Map[m], rtyp:
         genArgExpression(c, n[1], sink=false)
         genArgExpression(c, n[2], sink=false)
 
   of mUnaryMinusI, mUnaryMinusI64:
     # negation can cause overflows too
     if optOverflowCheck in c.userOptions:
-      c.buildDefectMagicCall m, n.typ:
+      c.buildDefectMagicCall m, rtyp:
         arg n[1]
     else:
-      c.genOp(mnkNeg, n.typ, n[1])
+      c.genOp(mnkNeg, rtyp, n[1])
 
   of mInc, mDec:
     # ``inc a, b`` -> ``a = a + b``
     let
       typ = n[1].typ
+      rtyp = typeToMir(c, typ)
       dest = genAlias(c, n[1], true)
     c.buildStmt mnkAsgn:
       c.use dest
       if isUnsigned(typ):
         const magic = [mInc: mAddU, mDec: mSubU]
-        c.buildMagicCall magic[m], typ:
+        c.buildMagicCall magic[m], rtyp:
           c.emitByVal dest
           arg n[2]
       else:
@@ -1002,8 +1000,8 @@ proc genMagic(c: var TCtx, n: PNode; m: TMagic) =
            typ.skipTypes(abstractInst).kind in {tyRange, tyEnum}:
           # needs an additional range check in order to ensure that the value
           # is in range
-          let val = c.wrapTemp(typ): op(c, dest, n, m)
-          c.buildDefectMagicCall mChckRange, typ:
+          let val = c.wrapTemp(rtyp): op(c, dest, n, m)
+          c.buildDefectMagicCall mChckRange, rtyp:
             c.emitByVal val
             c.emitByVal toIntLiteral(c.env, firstOrd(c.graph.config, typ), typ)
             c.emitByVal toIntLiteral(c.env, lastOrd(c.graph.config, typ), typ)
@@ -1015,7 +1013,7 @@ proc genMagic(c: var TCtx, n: PNode; m: TMagic) =
     # and panics are disabled, the call must be a checked call
     if optOverflowCheck in n[0].sym.options and
        optPanics notin c.graph.config.globalOptions:
-      c.buildTree mnkCheckedCall, n.typ:
+      c.buildTree mnkCheckedCall, rtyp:
         c.genCallee(n[0])
         arg n[1]
     else:
@@ -1023,52 +1021,52 @@ proc genMagic(c: var TCtx, n: PNode; m: TMagic) =
 
   # float arithmetic operations:
   of mAddF64, mSubF64, mMulF64, mDivF64:
-    proc op(c: var TCtx, m: TMagic, a, b: PNode) =
+    proc op(c: var TCtx, m: TMagic, a, b: PNode, rtyp: TypeId) {.nimcall.} =
       if optInfCheck in c.userOptions:
         # needs an overflow check
-        c.buildDefectMagicCall m, n.typ:
+        c.buildDefectMagicCall m, rtyp:
           arg a
           arg b
       else:
         # the unchecked version can be used
         const Map = [mAddF64: mnkAdd, mSubF64: mnkSub,
                      mMulF64: mnkMul, mDivF64: mnkDiv]
-        c.buildTree Map[m], n.typ:
+        c.buildTree Map[m], rtyp:
           c.genArgExpression(a, sink=false)
           c.genArgExpression(b, sink=false)
 
     if optNaNCheck in c.userOptions:
-      let tmp = c.wrapTemp n.typ:
-        op(c, m, n[1], n[2])
+      let tmp = c.wrapTemp rtyp:
+        op(c, m, n[1], n[2], rtyp)
 
       c.buildStmt mnkVoid:
-        c.buildDefectMagicCall mChckNaN, typeOrVoid(c, nil):
+        c.buildDefectMagicCall mChckNaN, VoidType:
           c.emitByVal tmp
       c.use tmp
     else:
-      op(c, m, n[1], n[2])
+      op(c, m, n[1], n[2], rtyp)
   of mUnaryMinusF64:
-    c.genOp mnkNeg, n.typ, n[1]
+    c.genOp mnkNeg, rtyp, n[1]
 
   # magics that use incomplete symbols (most of them are generated by
   # ``liftdestructors``):
   of mDestroy:
     # ``mDestroy`` magic calls might be incomplete symbols, so we have to
     # translate them manually
-    c.buildMagicCall m, typeOrVoid(c, n.typ):
+    c.buildMagicCall m, rtyp:
       c.emitByName ekMutate, genLvalueOperand(c, n[1])
   of mNewSeq:
     # XXX: the first parameter is actually an ``out`` parameter -- the
     #      ``ekReassign`` effect could be used
     if n[0].typ == nil:
-      c.buildMagicCall m, typeOrVoid(c, n.typ):
+      c.buildMagicCall m, rtyp:
         c.emitByName ekMutate, genLvalueOperand(c, n[1])
         arg n[2]
     else:
       genCall(c, n)
   of mSetLengthStr, mCopyInternal:
     if n[0].typ == nil:
-      c.buildMagicCall m, typeOrVoid(c, n.typ):
+      c.buildMagicCall m, rtyp:
         c.emitByName ekMutate, genLvalueOperand(c, n[1])
         arg n[2]
     else:
@@ -1076,7 +1074,7 @@ proc genMagic(c: var TCtx, n: PNode; m: TMagic) =
   of mNot, mLtI, mLengthSeq, mLengthStr, mSamePayload:
     if n[0].typ == nil:
       # simple translation. None of the arguments need to be passed by lvalue
-      c.buildMagicCall m, n.typ:
+      c.buildMagicCall m, rtyp:
         for i in 1..<n.len:
           arg n[i]
 
@@ -1087,14 +1085,14 @@ proc genMagic(c: var TCtx, n: PNode; m: TMagic) =
     # calls where ``x`` is of an imported type with unknown alignment reach
     # here. The code-generators only care about the types in both cases, so
     # that's what we emit
-    c.buildMagicCall m, n.typ:
+    c.buildMagicCall m, rtyp:
       # skip the surrounding typedesc
-      c.emitByVal typeLit(n[1].typ.skipTypes({tyTypeDesc}))
+      c.emitByVal typeLit(c.typeToMir(n[1].typ.skipTypes({tyTypeDesc})))
   of mGetTypeInfoV2:
     if n[0].typ == nil:
       # the compiler-generated version always uses a type as the argument
-      c.buildMagicCall m, n.typ:
-        c.emitByVal typeLit(n[1].typ)
+      c.buildMagicCall m, rtyp:
+        c.emitByVal typeLit(c.typeToMir(n[1].typ))
     else:
       # only the compiler-generated version of the magic has a type parameter.
       # The normal one doesn't (see ``cyclebreaker.getDynamicTypeInfo``), so we
@@ -1110,13 +1108,13 @@ proc genMagic(c: var TCtx, n: PNode; m: TMagic) =
     of skTemplate:
       # a ``getAst`` call taking a template call expression. The arguments
       # need special handling, but the shape stays as is
-      c.buildMagicCall m, n.typ:
+      c.buildMagicCall m, rtyp:
         genMacroCallArgs(c, n, skTemplate, callee.sym.typ)
     of skMacro:
       # rewrite ``getAst(macro(a, b, c))`` -> ``macro(a, b, c)``
       # treat a macro call as potentially raising and as modifying global
       # data. While not wrong, it is pessimistic
-      c.subTree MirNode(kind: mnkCheckedCall, typ: n.typ,
+      c.subTree MirNode(kind: mnkCheckedCall, typ: rtyp,
                         effects: {geMutateGlobal}):
         # we can use the internal signature
         genMacroCallArgs(c, n, skMacro, callee.sym.internal)
@@ -1126,7 +1124,7 @@ proc genMagic(c: var TCtx, n: PNode; m: TMagic) =
   of mSwap:
     # turn calls to magic procedures that don't require symbols into MIR
     # magic calls
-    c.buildMagicCall m, n.typ:
+    c.buildMagicCall m, rtyp:
       genArgs(c, n)
   else:
     # no special transformation for the other magics:
@@ -1139,7 +1137,7 @@ proc genCallOrMagic(c: var TCtx, n: PNode) =
     genCall(c, n)
 
 proc genSetConstr(c: var TCtx, n: PNode) =
-  c.buildTree mnkSetConstr, n.typ:
+  c.buildTree mnkSetConstr, c.typeToMir(n.typ):
     for it in n.items:
       if it.kind == nkRange:
         # watch out! the operands don't have to be literal values
@@ -1150,42 +1148,33 @@ proc genSetConstr(c: var TCtx, n: PNode) =
         c.genArgExpression(it, sink=false)
 
 proc genArrayConstr(c: var TCtx, n: PNode, isConsume: bool) =
-  c.buildTree mnkArrayConstr, n.typ:
+  c.buildTree mnkArrayConstr, c.typeToMir(n.typ):
     for it in n.items:
       c.emitOperandTree it, isConsume
 
 proc genSeqConstr(c: var TCtx, n: PNode) =
-  c.buildTree mnkSeqConstr, n.typ:
+  c.buildTree mnkSeqConstr, c.typeToMir(n.typ):
     for it in n.items:
       c.emitOperandTree it, true
 
 proc genTupleConstr(c: var TCtx, n: PNode, isConsume: bool) =
   assert n.typ.skipTypes(abstractVarRange-{tyTypeDesc}).kind == tyTuple
-  c.buildTree mnkTupleConstr, n.typ:
+  c.buildTree mnkTupleConstr, c.typeToMir(n.typ):
     for it in n.items:
       c.emitOperandTree skipColon(it), isConsume
 
 proc genClosureConstr(c: var TCtx, n: PNode, isConsume: bool) =
-  c.buildTree mnkClosureConstr, n.typ:
+  c.buildTree mnkClosureConstr, c.typeToMir(n.typ):
     c.emitOperandTree n[0].skipConv, false # the procedural value
     # transf wraps the procedure operand in a conversion that we don't
     # need
 
-    c.subTree (if isConsume: mnkConsume else: mnkArg): # the environment
-      if n[1].kind == nkNilLit:
-        # it can happen that a ``nkNilLit`` has no type (i.e. its typ is nil) -
-        # we ensure that the nil literal has the correct type
-        # TODO: prevent a ``nkNilLit`` with no type information from being
-        #       created instead
-        c.add MirNode(kind: mnkNilLit,
-                      typ: c.graph.getSysType(n[1].info, tyNil))
-      else:
-        genArgExpression(c, n[1], isConsume)
+    c.emitOperandTree n[1], isConsume # the environment
 
 proc genObjConstr(c: var TCtx, n: PNode, isConsume: bool) =
   let isRef = n.typ.skipTypes(abstractInst).kind == tyRef
 
-  c.subTree MirNode(kind: mnkObjConstr, typ: n.typ, len: n.len-1):
+  c.subTree MirNode(kind: mnkObjConstr, typ: c.typeToMir(n.typ), len: n.len-1):
     for i in 1..<n.len:
       let it = n[i]
       let field = lookupFieldAgain(n.typ.skipTypes(abstractInst), it[0].sym)
@@ -1214,14 +1203,14 @@ proc genRaise(c: var TCtx, n: PNode) =
       typ = skipTypes(n[0].typ, abstractPtrs)
       cp = c.graph.getCompilerProc("prepareException")
     c.buildStmt mnkVoid:
-      c.buildTree mnkCall, typeOrVoid(c, nil):
+      c.buildTree mnkCall, VoidType:
         c.add procNode(c.env.procedures.add(cp))
         c.subTree mnkArg:
           # lvalue conversion to the base ``Exception`` type:
-          c.buildTree mnkPathConv, cp.typ[1]:
+          c.buildTree mnkPathConv, c.typeToMir(cp.typ[1]):
             c.use tmp
         c.emitByVal strLiteral(c.env, typ.sym.name.s,
-                               c.graph.getSysType(n.info, tyCstring))
+                               CstringType)
 
     # emit the raise statement:
     c.buildStmt mnkRaise:
@@ -1343,7 +1332,7 @@ proc genLocDef(c: var TCtx, n: PNode, val: PNode) =
       # it to the type's default value.
       c.buildStmt mnkInit:
         c.add nameNode(c, s)
-        c.buildMagicCall mDefault, s.typ:
+        c.buildMagicCall mDefault, c.typeToMir(s.typ):
           discard
     else:
       # the definition doesn't imply default intialization
@@ -1407,7 +1396,7 @@ proc genVarTuple(c: var TCtx, n: PNode) =
 
   else:
     # generate the definition for the temporary:
-    let val = c.allocTemp(initExpr.typ)
+    let val = c.allocTemp(c.typeToMir(initExpr.typ))
     c.buildStmt mnkDefUnpack:
       c.use val
       # ensure that the temporary owns the tuple value:
@@ -1415,7 +1404,9 @@ proc genVarTuple(c: var TCtx, n: PNode) =
 
     # generate the unpack logic:
     for i in 0..<numDefs:
-      let lhs = n[i]
+      let
+        lhs = n[i]
+        typ = c.typeToMir(lhs.typ)
 
       if lhs.kind == nkSym:
         genLocDef(c, lhs, c.graph.emptyNode)
@@ -1427,8 +1418,8 @@ proc genVarTuple(c: var TCtx, n: PNode) =
         # definition above), and it's only used for unpacking; it can always be
         # moved out of. The temporary tuple is not destroyed, so no
         # destructive move is required
-        c.buildTree mnkMove, lhs.typ:
-          c.subTree MirNode(kind: mnkPathPos, typ: lhs.typ,
+        c.buildTree mnkMove, typ:
+          c.subTree MirNode(kind: mnkPathPos, typ: typ,
                             position: i.uint32):
             c.use val
 
@@ -1453,16 +1444,17 @@ proc genVarSection(c: var TCtx, n: PNode) =
           # the default value can be assigned in-place
           c.buildStmt mnkInit:
             genOperand(c, a[0])
-            c.buildMagicCall mDefault, a[0].typ:
+            c.buildMagicCall mDefault, c.typeToMir(a[0].typ):
               discard
         else:
           # a 'move' modifier is required for the assignment to later be
           # rewritten
+          let typ = c.typeToMir(a[0].typ)
           c.buildStmt mnkAsgn:
             genOperand(c, a[0])
-            c.buildTree mnkMove, a[0].typ:
-              c.wrapAndUse a[0].typ:
-                c.buildMagicCall mDefault, a[0].typ:
+            c.buildTree mnkMove, typ:
+              c.wrapAndUse typ:
+                c.buildMagicCall mDefault, typ:
                   discard
       else:
         unreachable()
@@ -1632,13 +1624,13 @@ proc genExceptBranch(c: var TCtx, n: PNode, dest: Destination) =
     for _, tn in branchLabels(n):
       case tn.kind
       of nkType:
-        c.add MirNode(kind: mnkType, typ: tn.typ)
+        c.add MirNode(kind: mnkType, typ: c.typeToMir(tn.typ))
       of nkInfix:
         # ``T as a`` doesn't get transformed to just ``T`` if ``T`` is the
         # type of an imported exception -- the local's name is used at the
         # MIR level
         let id = c.addLocal(tn[2].sym)
-        c.add MirNode(kind: mnkLocal, typ: tn[2].typ, local: id)
+        c.add MirNode(kind: mnkLocal, typ: c.typeToMir(tn[2].typ), local: id)
       else:
         unreachable()
 
@@ -1717,7 +1709,7 @@ proc toConstant(c: var TCtx, n: PNode): Value =
   ## Creates an anonymous constant from the constant expression `n`
   ## and returns the ``Value`` for it.
   let con = toConstId c.env.data.getOrPut(constDataToMir(c.env, n))
-  toValue(con, n.typ)
+  toValue(con, c.typeToMir(n.typ))
 
 proc genx(c: var TCtx, e: PMirExpr, i: int) =
   ## Translates the proto-MIR expression to MIR code and emits it into the
@@ -1738,19 +1730,20 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
       if isMutable: mnkToMutSlice else: mnkToSlice
     else: unreachable()
 
+  let typ = c.typeToMir(n.typ)
   case n.kind
   of pirProc:
-    c.use toValue(c.env.procedures.add(n.sym), n.sym.typ)
+    c.use toValue(c.env.procedures.add(n.sym), typ)
   of pirLiteral:
     case n.orig.kind
     of nkNilLit:
-      c.add MirNode(kind: mnkNilLit, typ: n.typ)
+      c.add MirNode(kind: mnkNilLit, typ: typ)
     of nkIntLiterals:
       c.use toIntLiteral(c.env, n.orig)
     of nkFloatLiterals:
       c.use toFloatLiteral(c.env, n.orig)
     of nkStrLiterals:
-      c.use strLiteral(c.env, n.orig.strVal, n.typ)
+      c.use strLiteral(c.env, n.orig.strVal, typ)
     of nkNimNodeLit:
       c.use astLiteral(c.env, n.orig[0], n.typ)
     else:
@@ -1758,28 +1751,28 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
   of pirLocal, pirGlobal, pirParam, pirConst:
     c.add nameNode(c, n.sym)
   of pirDeref:
-    c.buildOp mnkDeref, n.typ:
+    c.buildOp mnkDeref, typ:
       c.use toValue(c, e, i - 1)
   of pirViewDeref:
-    c.buildOp mnkDerefView, n.typ:
+    c.buildOp mnkDerefView, typ:
       c.use toValue(c, e, i - 1)
   of pirTupleAccess:
-    c.subTree MirNode(kind: mnkPathPos, typ: n.typ, position: n.pos):
+    c.subTree MirNode(kind: mnkPathPos, typ: typ, position: n.pos):
       recurse()
   of pirFieldAccess:
-    c.subTree MirNode(kind: mnkPathNamed, typ: n.typ,
+    c.subTree MirNode(kind: mnkPathNamed, typ: typ,
                       field: n.field.position.int32):
       recurse()
   of pirArrayAccess, pirSeqAccess:
-    c.buildOp mnkPathArray, n.typ:
+    c.buildOp mnkPathArray, typ:
       recurse()
       c.use toValue(c, e, n.index)
   of pirVariantAccess:
-    c.subTree MirNode(kind: mnkPathVariant, typ: n.typ,
+    c.subTree MirNode(kind: mnkPathVariant, typ: typ,
                       field: n.field.position.int32):
       recurse()
   of pirLvalueConv:
-    c.buildOp mnkPathConv, n.typ:
+    c.buildOp mnkPathConv, typ:
       recurse()
   of pirCheckedArrayAccess, pirCheckedSeqAccess:
     let
@@ -1787,11 +1780,11 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
       idx = toValue(c, e, n.index)
 
     c.buildStmt mnkVoid:
-      c.buildDefectMagicCall mChckIndex, typeOrVoid(c, nil):
+      c.buildDefectMagicCall mChckIndex, VoidType:
         c.emitByVal arr
         c.emitByVal idx
 
-    c.buildOp mnkPathArray, n.typ:
+    c.buildOp mnkPathArray, typ:
       c.use arr
       c.use idx
   of pirCheckedVariantAccess:
@@ -1799,48 +1792,47 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
       variant = toValue(c, e, i - 1)
       discr = genCheckedVariantAccess(c, variant, n.orig[0][1].sym.name,
                                       n.orig[n.nodeIndex])
-    c.subTree MirNode(kind: mnkPathVariant, typ: n.typ,
+    c.subTree MirNode(kind: mnkPathVariant, typ: typ,
                       field: discr.position.int32):
       c.use variant
   of pirCheckedObjConv:
     let
       val = toValue(c, e, i - 1)
-      boolType = c.graph.getSysType(n.orig.info, tyBool)
 
     c.buildStmt mnkIf:
       # the ``x != nil`` condtion:
-      c.wrapAndUse(boolType):
-        c.buildMagicCall mNot, boolType:
+      c.wrapAndUse(BoolType):
+        c.buildMagicCall mNot, BoolType:
           c.subTree mnkArg:
-            c.wrapAndUse(boolType):
-              c.buildMagicCall mIsNil, boolType:
+            c.wrapAndUse(BoolType):
+              c.buildMagicCall mIsNil, BoolType:
                 c.emitByVal val
       # the check:
       c.subTree mnkVoid:
-        c.buildDefectMagicCall mChckObj, typeOrVoid(c, nil):
+        c.buildDefectMagicCall mChckObj, VoidType:
           c.emitByVal val
-          c.emitByVal typeLit(n.check)
+          c.emitByVal typeLit(c.typeToMir(n.check))
 
-    c.buildOp mnkPathConv, n.typ:
+    c.buildOp mnkPathConv, typ:
       c.use val
 
   of pirAddr:
-    c.buildOp mnkAddr, n.typ:
+    c.buildOp mnkAddr, typ:
       recurse()
   of pirView:
-    c.buildOp viewOp(mnkView, n.typ), n.typ:
+    c.buildOp viewOp(mnkView, n.typ), typ:
       recurse()
   of pirCast:
-    c.buildOp mnkCast, n.typ:
+    c.buildOp mnkCast, typ:
       recurse()
   of pirConv:
-    c.buildOp mnkConv, n.typ:
+    c.buildOp mnkConv, typ:
       recurse()
   of pirStdConv:
-    c.buildOp mnkStdConv, n.typ:
+    c.buildOp mnkStdConv, typ:
       recurse()
   of pirToSlice:
-    c.buildOp viewOp(mnkToSlice, n.typ), n.typ:
+    c.buildOp viewOp(mnkToSlice, n.typ), typ:
       recurse()
   of pirToSubSlice:
     # the array operand is a PMIR expression already, but the operands
@@ -1855,32 +1847,32 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
         lo = genRd(c, a)
         hi = genRd(c, b)
       c.buildStmt mnkVoid:
-        c.buildDefectMagicCall mChckBounds, typeOrVoid(c, nil):
+        c.buildDefectMagicCall mChckBounds, VoidType:
           c.emitByVal arr
           c.emitByVal lo
           c.emitByVal hi
 
-      c.buildTree op, n.typ:
+      c.buildTree op, typ:
         c.use arr
         c.use lo
         c.use hi
     else:
-      c.buildTree op, n.typ:
+      c.buildTree op, typ:
         recurse()
         genArgExpression(c, a, sink=false)
         genArgExpression(c, b, sink=false)
   of pirCall:
     genCallOrMagic(c, n.orig)
   of pirChckRange:
-    c.buildDefectMagicCall mChckRange, n.typ:
+    c.buildDefectMagicCall mChckRange, typ:
       c.emitOperandTree n.orig[0], false
       c.emitOperandTree n.orig[1], false
       c.emitOperandTree n.orig[2], false
   of pirStringToCString:
-    c.buildMagicCall mStrToCStr, n.typ:
+    c.buildMagicCall mStrToCStr, typ:
       c.emitOperandTree n.orig[0], false
   of pirCStringToString:
-    c.buildMagicCall mCStrToStr, n.typ:
+    c.buildMagicCall mCStrToStr, typ:
       c.emitOperandTree n.orig[0], false
   of pirArrayConstr:
     genArrayConstr(c, n.orig, n.owning)
@@ -1911,7 +1903,7 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
     # attempting to generate the code for a complex expression without a
     # destination specified -> assign the value resulting from it to a
     # temporary
-    let tmp = getTemp(c, n.typ)
+    let tmp = getTemp(c, typ)
 
     withFront c.builder:
       genComplexExpr(c, n.orig):
@@ -1919,30 +1911,30 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
 
     c.use tmp
   of pirCopy:
-    c.buildOp mnkCopy, n.typ:
+    c.buildOp mnkCopy, typ:
       recurse()
   of pirMove:
-    c.buildOp mnkMove, n.typ:
+    c.buildOp mnkMove, typ:
       recurse()
   of pirSink, pirDestructiveMove:
     # a destructive move is currently not translated into a move + wasMoved,
     # but rather into a sink, which is then, if necessary, later turned into
     # a destructive move
-    c.buildOp mnkSink, n.typ:
+    c.buildOp mnkSink, typ:
       recurse()
   of pirMat, pirMatCursor:
     let f = c.builder.push: recurse()
     # only materialize a temporary if the expression is not already a
     # temporary introduced by the PMIR-to-MIR translation
     if c.builder.staging[f.pos].kind != mnkTemp:
-      let tmp = c.allocTemp(n.typ)
+      let tmp = c.allocTemp(typ)
       withFront c.builder:
         c.subTree (if n.kind == pirMat: mnkDef else: mnkDefCursor):
           c.use tmp
           c.builder.pop(f)
       c.use tmp
   of pirMatLvalue:
-    let tmp = c.allocTemp(n.typ, true)
+    let tmp = c.allocTemp(typ, true)
     # make sure to create an alias that supports assignment, if requested
     c.buildStmt (if e[i-1].keep == kMutLvalue: mnkBindMut else: mnkBind):
       c.use tmp
@@ -2006,7 +1998,7 @@ proc gen(c: var TCtx, n: PNode) =
       c.buildStmt mnkSwitch:
         # the 'switch' operations expects a variant access as the first
         # operand
-        c.subTree MirNode(kind: mnkPathVariant, typ: dest[^2].typ,
+        c.subTree MirNode(kind: mnkPathVariant, typ: c.typeToMir(dest[^2].typ),
                           field: dest[^1].field.position.int32):
           genx(c, dest, dest.len - 2)
 
@@ -2107,7 +2099,8 @@ proc generateAssignment*(graph: ModuleGraph, env: var MirEnv,
   ## Translates an `nkIdentDefs` AST into MIR and emits the result into
   ## `builder`'s currently selected buffer.
   assert n.kind == nkIdentDefs and n.len == 3
-  var c = TCtx(context: skUnknown, graph: graph, config: config)
+  var c = TCtx(context: skUnknown, graph: graph, config: config,
+               env: move env)
   # treat the code as top-level code so that no 'def' is generated for
   # assignments to globals
   c.scopeDepth = 1
@@ -2115,11 +2108,11 @@ proc generateAssignment*(graph: ModuleGraph, env: var MirEnv,
   template swapState() =
     swap(c.sp.map, source)
     swap(c.builder, builder)
-    swap(c.env, env)
 
   swapState()
   genLocInit(c, n[0], n[2])
   swapState()
+  env = move c.env # move back
 
 proc generateCode*(graph: ModuleGraph, env: var MirEnv,
                    config: TranslationConfig, n: PNode,
@@ -2127,13 +2120,12 @@ proc generateCode*(graph: ModuleGraph, env: var MirEnv,
   ## Generates MIR code that is semantically equivalent to the expression or
   ## statement `n`, appending the resulting code and the corresponding origin
   ## information to `code` and `source`, respectively.
-  var c = TCtx(context: skUnknown, graph: graph, config: config)
+  var c = TCtx(context: skUnknown, graph: graph, config: config, env: move env)
   c.scopeDepth = 2 # assume that this is not top-level code
 
   template swapState() =
     swap(c.sp.map, source)
     swap(c.builder, builder)
-    swap(c.env, env)
 
   # for the duration of ``generateCode`` we move the state into ``TCtx``
   swapState()
@@ -2150,6 +2142,7 @@ proc generateCode*(graph: ModuleGraph, env: var MirEnv,
 
   # move the state back into the output parameters:
   swapState()
+  env = move c.env
 
 proc addParams(c: var TCtx, prc: PSym, signature: PType) =
   ## Translates the result variable and the parameters (taken from `signature`)
@@ -2163,16 +2156,16 @@ proc addParams(c: var TCtx, prc: PSym, signature: PType) =
     # not present
     add Local()
   else:
-    add localToMir(prc.ast[resultPos].sym)
+    add c.localToMir(prc.ast[resultPos].sym)
 
   # parameters:
   let params = signature.n
   for i in 1..<params.len:
-    add paramToMir(params[i].sym)
+    add c.paramToMir(params[i].sym)
 
   if signature.callConv == ccClosure:
     # environment parameter
-    add paramToMir(prc.ast[paramsPos][^1].sym)
+    add c.paramToMir(prc.ast[paramsPos][^1].sym)
 
 proc generateCode*(graph: ModuleGraph, env: var MirEnv, owner: PSym,
                    config: TranslationConfig,  body: PNode): MirBody =
@@ -2189,11 +2182,9 @@ proc generateCode*(graph: ModuleGraph, env: var MirEnv, owner: PSym,
   #assert nfTransf in body.flags, "transformed AST is expected as input"
 
   var c = TCtx(context: owner.kind, graph: graph, config: config,
-               userOptions: owner.options)
+               userOptions: owner.options, env: move env)
   c.sp.active = (body, c.sp.map.add(body))
 
-  swap(c.env, env)
-
   c.scopeDepth = 1
   c.add MirNode(kind: mnkScope)
   if sfNeverRaises in owner.flags:
@@ -2234,13 +2225,13 @@ proc generateCode*(graph: ModuleGraph, env: var MirEnv, owner: PSym,
       c.subTree mnkBranch:
         c.subTree mnkVoid:
           let p = c.graph.getCompilerProc("nimUnhandledException")
-          c.builder.buildCall c.env.procedures.add(p), typeOrVoid(c, p.typ[0]):
+          c.builder.buildCall c.env.procedures.add(p), VoidType:
             discard
     c.add endNode(mnkTry)
 
   c.add endNode(mnkScope)
 
-  swap(c.env, env) # swap back
+  env = c.env
 
   # move the buffers into the result body
   let (code, locals) = finish(move c.builder, default(Store[LocalId, Local]))
@@ -2251,14 +2242,15 @@ proc exprToMir*(graph: ModuleGraph, env: var MirEnv,
   ## Only meant to be used by `vmjit <#vmjit>`_. Produces a MIR body for a
   ## standalone expression. The result of the expression is assigned to the
   ## special local with ID 0.
-  var c = TCtx(context: skUnknown, graph: graph, config: config)
+  var c = TCtx(context: skUnknown, graph: graph, config: config, env: move env)
   c.sp.active = (e, c.sp.map.add(e))
-  swap(c.env, env)
 
-  let res = c.addLocal(Local(typ: e.typ)) # the result variable
+  let
+    rtyp = c.typeToMir(e.typ)
+    res = c.addLocal(Local(typ: rtyp)) # the result variable
   c.scope:
     c.buildStmt mnkDef:
-      c.use toValue(mnkLocal, res, e.typ)
+      c.use toValue(mnkLocal, res, rtyp)
       if e.typ.kind == tyTypeDesc:
         # FIXME: this shouldn't happen, but type expressions are sometimes
         #        evaluated with the VM, such as a ``typeof(T.x)`` appearing as
@@ -2271,7 +2263,7 @@ proc exprToMir*(graph: ModuleGraph, env: var MirEnv,
       else:
         c.genAsgnSource(e, {dfOwns, dfEmpty})
 
-  swap(c.env, env)
+  env = move c.env
 
   let (code, locals) = finish(move c.builder, default(Store[LocalId, Local]))
   MirBody(locals: locals, source: move c.sp.map, code: code)
@@ -2280,12 +2272,15 @@ proc constDataToMir*(env: var MirEnv, n: PNode): MirTree =
   ## Translates the construction expression AST `n` representing some
   ## constant data to its corresponding MIR representation.
   proc constToMirAux(bu: var MirBuilder, env: var MirEnv, n: PNode) =
+    let typ =
+      if n.typ.isNil: VoidType
+      else:           env.types.add(n.typ)
     case n.kind
     of nkObjConstr:
       # no normalization/canonicalization takes place here, meaning that
       # ``Obj(a: 0, b: 1)`` and ``Obj(b: 1, a: 0)`` will result in two data
       # table entries, even though the values they represent are equivalent
-      bu.subTree MirNode(kind: mnkObjConstr, typ: n.typ, len: n.len-1):
+      bu.subTree MirNode(kind: mnkObjConstr, typ: typ, len: n.len-1):
         for i in 1..<n.len:
           bu.add MirNode(kind: mnkField, field: n[i][0].sym.position.int32)
           bu.subTree mnkArg:
@@ -2293,7 +2288,7 @@ proc constDataToMir*(env: var MirEnv, n: PNode): MirTree =
     of nkCurly:
       # similar to object construction, no normalization means that ``{1, 2}``
       # and ``{2, 1}`` results in two data table entries
-      bu.subTree MirNode(kind: mnkSetConstr, typ: n.typ, len: n.len):
+      bu.subTree MirNode(kind: mnkSetConstr, typ: typ, len: n.len):
         for it in n.items:
           constToMirAux(bu, env, it)
     of nkBracket, nkTupleConstr, nkClosure:
@@ -2305,7 +2300,7 @@ proc constDataToMir*(env: var MirEnv, n: PNode): MirTree =
         of tyProc:                  mnkClosureConstr
         else:                       unreachable()
 
-      bu.subTree MirNode(kind: kind, typ: n.typ, len: n.len):
+      bu.subTree MirNode(kind: kind, typ: typ, len: n.len):
         for it in n.items:
           bu.subTree mnkArg:
             constToMirAux(bu, env, it.skipColon)
@@ -2314,9 +2309,9 @@ proc constDataToMir*(env: var MirEnv, n: PNode): MirTree =
       # must either be another constant or a procedural value
       case n.sym.kind
       of skProc, skFunc, skConverter, skIterator:
-        bu.use toValue(env.procedures.add(n.sym), n.typ)
+        bu.use toValue(env.procedures.add(n.sym), typ)
       of skConst:
-        bu.use toValue(env.constants.add(n.sym), n.sym.typ)
+        bu.use toValue(env.constants.add(n.sym), typ)
       else:
         unreachable()
     of nkRange:
@@ -2324,20 +2319,20 @@ proc constDataToMir*(env: var MirEnv, n: PNode): MirTree =
         constToMirAux(bu, env, n[0])
         constToMirAux(bu, env, n[1])
     of nkNilLit:
-      bu.add MirNode(kind: mnkNilLit, typ: n.typ)
+      bu.add MirNode(kind: mnkNilLit, typ: typ)
     of nkIntLiterals:
       bu.use toIntLiteral(env, n)
     of nkFloatLiterals:
       bu.use toFloatLiteral(env, n)
     of nkStrLiterals:
-      bu.use strLiteral(env, n.strVal, n.typ)
+      bu.use strLiteral(env, n.strVal, typ)
     of nkHiddenStdConv, nkHiddenSubConv:
       # doesn't translate to a MIR node itself, but the type overrides
       # that of the sub-expression
       let top = bu.staging.len
       constToMirAux(bu, env, n[1])
       # patch the type:
-      bu.staging[top].typ = n.typ
+      bu.staging[top].typ = typ
     else:
       unreachable(n.kind)
 
diff --git a/compiler/mir/mirpasses.nim b/compiler/mir/mirpasses.nim
index 3c978e9e715..3e4d9a5d62d 100644
--- a/compiler/mir/mirpasses.nim
+++ b/compiler/mir/mirpasses.nim
@@ -22,6 +22,7 @@ import
     mirchangesets,
     mirconstr,
     mirtrees,
+    mirtypes,
     sourcemaps
   ],
   compiler/modules/[
@@ -102,7 +103,7 @@ proc overlapsConservative(tree: MirTree, a, b: Path, typA, typB: PType): bool =
   # use path-based analysis:
   result = overlaps(tree, a, b) != no
 
-proc preventRvo(tree: MirTree, changes: var Changeset) =
+proc preventRvo(tree: MirTree, types: TypeEnv, changes: var Changeset) =
   ## Injects intermediate temporaries for assignments where the source is an
   ## RVO-using call rvalue and the destination potentially aliases with a
   ## location accessible witin the call through one of the arguments.
@@ -122,7 +123,7 @@ proc preventRvo(tree: MirTree, changes: var Changeset) =
   for i in search(tree, {mnkAsgn}):
     let source = tree.operand(i, 1)
     if tree[source].kind notin CallKinds or tree[source, 0].kind == mnkMagic or
-       not eligibleForRvo(tree[source].typ):
+       not eligibleForRvo(types[tree[source].typ]):
       # the return-value optimization is not used
       continue
 
@@ -137,7 +138,7 @@ proc preventRvo(tree: MirTree, changes: var Changeset) =
           # special handling for openArrays: they are also able to observe the
           # result location
           if tree[it].kind == mnkTemp and
-             tree[it].typ.skipTypes(abstractVar).kind == tyOpenArray:
+             types[tree[it].typ].skipTypes(abstractVar).kind == tyOpenArray:
             # find the lvalue expression (if any) that the slice was created
             # from and use that for the overlap analysis
             let def = tree.child(findDef(tree, NodePosition it), 1)
@@ -154,7 +155,8 @@ proc preventRvo(tree: MirTree, changes: var Changeset) =
 
       if check and overlapsConservative(tree, path,
                                         computePath(tree, NodePosition arg),
-                                        tree[dest].typ, tree[arg].typ):
+                                        types[tree[dest].typ],
+                                        types[tree[arg].typ]):
         needsTemp = true
         break
 
@@ -194,7 +196,8 @@ proc lowerSwap(tree: MirTree, changes: var Changeset) =
       bu.asgnMove a, b
       bu.asgnMove b, temp
 
-proc eliminateTemporaries(tree: MirTree, changes: var Changeset) =
+proc eliminateTemporaries(tree: MirTree, types: TypeEnv,
+                          changes: var Changeset) =
   ## Where safe (i.e., observable program behaviour does not change), elides
   ## temporaries in a backend-agnostice way. This is an optimization.
   ##
@@ -256,9 +259,10 @@ proc eliminateTemporaries(tree: MirTree, changes: var Changeset) =
 
   template overlaps(a: Path, typ: PType, b: OpValue): bool =
     let x = NodePosition b
-    overlapsConservative(tree, a, computePath(tree, x), typ, tree[x].typ)
+    overlapsConservative(tree, a, computePath(tree, x), typ, types[tree[x].typ])
 
-  proc findUse(tree: MirTree, dfg: DataFlowGraph, p: Path, typ: PType,
+  proc findUse(tree: MirTree, types: TypeEnv, dfg: DataFlowGraph,
+               p: Path, typ: PType,
                start: InstrPos, e: LocalId): NodePosition {.nimcall.} =
     ## Conservative data-flow analysis that computes whether the `p` might be
     ## modified. If there are no modifications of `p` between `start`
@@ -305,8 +309,8 @@ proc eliminateTemporaries(tree: MirTree, changes: var Changeset) =
         n   = NodePosition n
         def = tree.parent(n)
         p   = computePath(tree, tree.child(def, 1))
-        typ = tree[n].typ
-        pos = findUse(tree, dfg, p, typ, i + 1, tree[n].local)
+        typ = types[tree[n].typ]
+        pos = findUse(tree, types, dfg, p, typ, i + 1, tree[n].local)
 
       if pos == NodePosition(-1):
         # the copy is necessary
@@ -367,7 +371,7 @@ proc extractStringLiterals(tree: MirTree, env: var MirEnv,
     changes.replaceMulti(tree, i, bu):
       bu.use toValue(c, tree[i].typ)
 
-proc injectResultInit(tree: MirTree, resultTyp: PType, changes: var Changeset) =
+proc injectResultInit(tree: MirTree, resultTyp: TypeId, changes: var Changeset) =
   ## Injects a default-initialization for the result variable, if deemed
   ## necessary by data-flow analysis.
   ##
@@ -427,13 +431,12 @@ proc injectProfilerCalls(tree: MirTree, graph: ModuleGraph, env: var MirEnv,
   ## * at the beginning of a procedure's body
   ## * at the end of a loop's body
   let
-    voidType = graph.getSysType(unknownLineInfo, tyVoid)
     prcId = env.procedures.add(graph.getCompilerProc("nimProfile"))
 
   # insert the entry call within the outermost scope:
   changes.insert(tree, tree.child(NodePosition 0, 0), NodePosition 0, bu):
     bu.subTree mnkVoid:
-      bu.buildCall prcId, voidType:
+      bu.buildCall prcId, VoidType:
         discard "no arguments"
 
   for i in search(tree, {mnkEnd}):
@@ -441,7 +444,7 @@ proc injectProfilerCalls(tree: MirTree, graph: ModuleGraph, env: var MirEnv,
       # insert the call before the end node:
       changes.insert(tree, i - 1, i, bu):
         bu.subTree mnkVoid:
-          bu.buildCall prcId, voidType:
+          bu.buildCall prcId, VoidType:
             discard "no arguments"
 
 proc applyPasses*(body: var MirBody, prc: PSym, env: var MirEnv,
@@ -459,10 +462,10 @@ proc applyPasses*(body: var MirBody, prc: PSym, env: var MirEnv,
     batch:
       # only the C code generator employs the return-value optimization (=RVO)
       # at the moment
-      preventRvo(body.code, c)
+      preventRvo(body.code, env.types, c)
 
   batch:
-    if target == targetC and body[resultId].typ != nil and
+    if target == targetC and body[resultId].typ != VoidType and
        (sfNoInit notin body[resultId].flags):
       # the procedure has a result variable and initialization of it is
       # allowed
@@ -482,4 +485,4 @@ proc applyPasses*(body: var MirBody, prc: PSym, env: var MirEnv,
 
   # eliminate temporaries after all other passes
   batch:
-    eliminateTemporaries(body.code, c)
+    eliminateTemporaries(body.code, env.types, c)
diff --git a/compiler/mir/mirtrees.nim b/compiler/mir/mirtrees.nim
index 0b44d015827..1eab6ece408 100644
--- a/compiler/mir/mirtrees.nim
+++ b/compiler/mir/mirtrees.nim
@@ -35,10 +35,8 @@ type
   DataId* = distinct uint32
     ## Identifies a complete constant expression
 
-  TypeInstance {.used.} = distinct uint32
-    ## Refers to an existing type instance
-  TypeId {.used.} = distinct uint32
-    ## The ID of a type instance or nil
+  TypeId* = distinct uint32
+    ## Identifies a type
 
   SourceId* = distinct range[0'u32 .. high(uint32)-1]
     ## The ID of a source-mapping that's stored separately from the MIR nodes.
@@ -274,7 +272,7 @@ type
     geMutateGlobal ## the operation mutates global state
 
   MirNode* = object
-    typ*: PType ## non-nil for all expressions
+    typ*: TypeId ## valid for all expressions, including all calls
     info*: SourceId
       ## non-critical meta-data associated with the node (e.g., origin
       ## information)
@@ -402,6 +400,7 @@ func `==`*(a, b: DataId): bool {.borrow.}
 func `==`*(a, b: NumberId): bool {.borrow.}
 func `==`*(a, b: StringId): bool {.borrow.}
 func `==`*(a, b: AstId): bool {.borrow.}
+func `==`*(a, b: TypeId): bool {.borrow.}
 
 func isAnon*(id: ConstId): bool =
   ## Returns whether `id` represents an anonymous constant.
diff --git a/compiler/mir/mirtypes.nim b/compiler/mir/mirtypes.nim
new file mode 100644
index 00000000000..acbb11a58c6
--- /dev/null
+++ b/compiler/mir/mirtypes.nim
@@ -0,0 +1,100 @@
+## Implements the type IR for the MIR phase (not yet), plus the
+## `TypeEnv <#TypeEnv>`_, which stores the data for all types.
+##
+## All types are addressed via ``TypeId``, with the built-in types using
+## static IDs.
+
+import
+  std/[
+    hashes,
+    tables
+  ],
+  compiler/ast/[
+    ast_types,
+    lineinfos
+  ],
+  compiler/modules/[
+    modulegraphs,
+    magicsys
+  ],
+  compiler/mir/[
+    mirtrees,
+    typemaps
+  ],
+  compiler/utils/[
+    containers
+  ]
+
+type
+  TypeEnv* {.requiresInit.} = object
+    ## Stores the data associated with types. Has no valid default value, and
+    ## must be explicitly initialized first (see ``initTypeEnv``).
+    map: TypeTable[TypeId]
+      ## maps the hash of a type. Since the hash is not guaranteed to be
+      ## unique, hash collisions are possible!
+      # XXX: ^^ the collision needs to be addressed at some point. A proper,
+      #      non-sighash-based comparison needs to be used
+    types: Store[TypeId, PType] ## the ``PType`` stored for each ``TypeId``
+
+const
+  VoidType*    = TypeId 0 # IDs must match the order in ``initTypeEnv``
+  BoolType*    = TypeId 1
+  CharType*    = TypeId 2
+  Int8Type*    = TypeId 3
+  Int16Type*   = TypeId 4
+  Int32Type*   = TypeId 5
+  Int64Type*   = TypeId 6
+  UInt8Type*   = TypeId 7
+  UInt16Type*  = TypeId 8
+  UInt32Type*  = TypeId 9
+  UInt64Type*  = TypeId 10
+  Float32Type* = TypeId 11
+  Float64Type* = TypeId 12
+  StringType*  = TypeId 13
+  CstringType* = TypeId 14
+  PointerType* = TypeId 15 # ``initTypeEnv`` numbers further types after this
+
+proc initTypeEnv*(graph: ModuleGraph): TypeEnv =
+  ## Returns a type environment with all built-in types already registered.
+  result = TypeEnv(map: default(TypeTable[TypeId]),
+                   types: default(Store[TypeId, PType]))
+
+  template add(kind: TTypeKind, expect: TypeId) =
+    let
+      typ = graph.getSysType(unknownLineInfo, kind)
+      id  = result.types.add(typ)
+    assert id == expect # the static IDs rely on the registration order
+    # the type needs to be mapped too, so that the public ``add`` finds it
+    result.map[typ] = id
+
+  add(tyVoid, VoidType)
+  add(tyBool, BoolType)
+  add(tyChar, CharType)
+  add(tyInt8, Int8Type)
+  add(tyInt16, Int16Type)
+  add(tyInt32, Int32Type)
+  add(tyInt64, Int64Type)
+  add(tyUInt8, UInt8Type)
+  add(tyUInt16, UInt16Type)
+  add(tyUInt32, UInt32Type)
+  add(tyUInt64, UInt64Type)
+  add(tyFloat32, Float32Type)
+  add(tyFloat64, Float64Type)
+  add(tyString, StringType)
+  add(tyCstring, CstringType)
+  add(tyPointer, PointerType)
+
+  # also register the built-in unspecified-width types. This prevents int/float
+  # literal types from being added to the environment
+  add(tyInt,   TypeId(ord(PointerType) + 1))
+  add(tyFloat, TypeId(ord(PointerType) + 2))
+
+proc add*(env: var TypeEnv, t: PType): TypeId =
+  ## Returns the ID `t` is registered with in `env`, registering the type
+  ## first if it's missing. Basic structural type unification is performed.
+  let fresh = env.types.nextId()
+  result = env.map.mgetOrPut(t, fresh)
+  if result == fresh: result = env.types.add(t)
+
+func `[]`*(env: TypeEnv, id: TypeId): lent PType {.inline.} =
+  result = env.types[id]
diff --git a/compiler/mir/typemaps.nim b/compiler/mir/typemaps.nim
new file mode 100644
index 00000000000..ce57f670f5d
--- /dev/null
+++ b/compiler/mir/typemaps.nim
@@ -0,0 +1,188 @@
+## Implements a Table-like type for mapping a ``PType`` to some value. The
+## ``PType`` keys undergo basic canonicalization, meaning that two
+## different - in terms of reference equality - ``PType`` instances can
+## represent the same key.
+##
+## The canonicalization makes sure to not ignore type information relevant to
+## the mid-end and code generation stages.
+
+import
+  std/[
+    hashes,
+    tables
+  ],
+  compiler/ast/[
+    ast_types,
+    ast_query
+  ],
+  compiler/utils/[
+    idioms
+  ]
+
+type
+  Type = distinct PType
+    # a distinct type so that a custom hash and equality operator (both
+    # based on the canonicalized type) can be attached
+  TypeTable*[T] = object
+    inner: Table[Type, T] # keyed by the ``Type`` wrapper, not by ``PType``
+
+func safeId(n: PNode): NodeId {.inline.} =
+  ## The ID of `n`, or -1 if `n` is nil.
+  if n.isNil: NodeId(-1) else: n.id
+
+func cmp(a, b: PType): bool
+
+func cmpElements(a, b: PType): bool =
+  ## Compares the elements of `a` and `b` pairwise. A differing number of
+  ## elements counts as unequal.
+  if a.len == b.len:
+    for i in 0..<a.len:
+      if not cmp(a[i], b[i]):
+        return false
+
+    result = true
+
+func cmpProc(a, b: PType): bool =
+  ## Compares the return type and parameters of procedure types `a` and `b`.
+  if a.len != b.len:
+    return false
+  # a nil return type slot means 'void', so both slots must be nil, or both
+  # must be present and equal
+  let (retA, retB) = (a[0], b[0])
+  if retA.isNil != retB.isNil or not (retA.isNil or cmp(retA, retB)):
+    return false
+
+  for i in 1..<a.len:
+    if not cmp(a[i], b[i]): return false
+  result = true
+
+func cmp(a, b: PNode): bool =
+  ## Compares two literal nodes. Floats are compared by their bit patterns.
+  if a.kind != b.kind: return false
+  result =
+    case a.kind
+    of nkFloatLiterals:
+      cast[BiggestInt](a.floatVal) == cast[BiggestInt](b.floatVal)
+    of nkIntLiterals:
+      a.intVal == b.intVal
+    else: unreachable()
+
+func cmp(a, b: PType): bool =
+  ## Returns whether `a` and `b` are equal for the purpose of table lookups.
+  ## Generic types are handled too, as they can be part of ``tyTypeDesc``s.
+  if a.id == b.id: # quick check: same type instance?
+    # FIXME: user type-classes are sometimes improperly instantiated,
+    #        producing different types that share the same ID.
+    #        ``concepts/tcomparable.nim`` is a test where removing the extra
+    #        condition would cause a failure
+    a.kind notin tyUserTypeClasses
+  elif a.kind != b.kind or a.sym != b.sym:
+    false
+  elif a.sym != nil and a.kind == tyObject and a.sym == b.sym:
+    # note: only object types have proper symbols at the moment. For all other
+    # types, instantiations of a generic invocation all use the symbol of the
+    # generic type
+    true
+  else:
+    case a.kind
+    of tyVoid, tyBool, tyChar, tyPointer, tyNil, tyInt..tyInt64,
+       tyUInt..tyUInt64, tyFloat..tyFloat64, tyString, tyCstring, tyEmpty,
+       tyAnything:
+      true
+    of tySet, tySequence, tyOpenArray, tyVarargs, tyUncheckedArray, tyPtr,
+       tyRef, tyLent, tyVar, tyAlias, tyOrdinal, tySink, tyTypeDesc, tyNot:
+      # simple structural-like types that are equal if their element types are
+      cmp(a[^1], b[^1])
+    of tyArray:
+      cmp(a[0], b[0]) and cmp(a[1], b[1])
+    of tyRange:
+      # only the range description matters
+      cmp(a.n[0], b.n[0]) and cmp(a.n[1], b.n[1])
+    of tyTuple:
+      # named and unnamed tuple distinction matters
+      safeId(a.n) == safeId(b.n) and cmpElements(a, b)
+    of tyProc:
+      # also consider the flags
+      a.flags == b.flags and a.callConv == b.callConv and cmpProc(a, b)
+    of tyAnd, tyOr:
+      cmp(a[0], b[0]) and cmp(a[1], b[1]) # operands are compared pairwise
+    of tyBuiltInTypeClass:
+      a[0].kind == b[0].kind
+    of tyObject, tyDistinct, tyEnum, tyGenericInst, tyStatic,
+       tyUserTypeClasses, tyCompositeTypeClass, tyInferred:
+      # ids are not the same, so it must be a different type
+      # XXX: ideally, ``tyStatic`` would not be supported here, but ``mirgen``
+      #      does add those types
+      # FIXME: ``tyInferred`` reaches here, but shouldn't. Needs further
+      #        investigation.
+      false
+    else:
+      unreachable()
+
+func hash(n: PNode): Hash =
+  ## Hashes a literal node. Floats are hashed by their bit pattern, the same
+  ## representation ``cmp`` compares them by.
+  result =
+    case n.kind
+    of nkFloatLiterals: hash(cast[BiggestInt](n.floatVal))
+    of nkIntLiterals:   hash(n.intVal)
+    else:               unreachable(n.kind)
+
+func hash(t: PType): Hash =
+  ## Hash matching ``cmp``: ``hash(a) == hash(b)`` must hold if ``cmp(a, b)``
+  if t.sym != nil:
+    # for types with symbols, only the symbol matters
+    result = !$(hash(true) !& hash(t.sym.id))
+  else:
+    result = hash(false) !& hash(t.kind)
+    case t.kind
+    of tyVoid, tyBool, tyChar, tyPointer, tyNil, tyInt..tyInt64, tyEmpty,
+       tyUInt..tyUInt64, tyFloat..tyFloat64, tyString, tyCstring, tyAnything:
+      discard "leaf type"
+    of tySet, tySequence, tyOpenArray, tyVarargs, tyUncheckedArray, tyPtr,
+       tyRef, tyLent, tyVar, tyTypeDesc, tyAlias, tyOrdinal, tySink, tyNot:
+      result = result !& hash(t[^1]) # the element ``cmp`` looks at
+    of tyArray:
+      result = result !& hash(t[0]) !& hash(t[1])
+    of tyTuple:
+      # only hash the number of elements and the ID of the record node
+      result = result !& hash(t.len) !& hash(safeId t.n)
+    of tyRange:
+      result = result !& hash(t.n[0]) !& hash(t.n[1])
+    of tyProc:
+      # only hash the number of parameters
+      result = result !& hash(t.flags) !& hash(t.callConv) !& hash(t.len)
+    of tyAnd, tyOr:
+      result = result !& hash(t[0]) !& hash(t[1])
+    of tyBuiltInTypeClass:
+      result = result !& hash(t[0].kind)
+    of tyObject, tyDistinct, tyEnum, tyGenericInst, tyStatic,
+       tyUserTypeClasses, tyCompositeTypeClass, tyInferred:
+      result = result !& hash(t.id)
+    else:
+      unreachable()
+
+    result = !$(result)
+
+# note: hash and the equality procedure need to be exported for symbol
+# binding in ``Table`` routines to work properly
+
+func `==`*(a, b: Type): bool {.inline.} =
+  ## Implementation detail that has to be exported -- do not use directly.
+  result = cmp(PType(a), PType(b))
+
+func hash*(x: Type): Hash {.inline.} =
+  ## Implementation detail that has to be exported -- do not use directly.
+  result = hash(x.PType)
+
+proc `[]`*[T](t: TypeTable[T], key: PType): lent T {.inline.} =
+  ## Returns the item that `key` maps to.
+  result = t.inner[Type(key)]
+
+proc `[]=`*[T](t: var TypeTable[T], key: PType, val: sink T) {.inline.} =
+  ## Sets the item that `key` maps to to `val`.
+  `[]=`(t.inner, Type(key), val)
+
+proc mgetOrPut*[T](t: var TypeTable[T], key: PType, val: T): var T =
+  ## Returns the item for `key`, first adding `val` for it if there's none.
+  t.inner.mgetOrPut(Type(key), val)
diff --git a/compiler/mir/utils.nim b/compiler/mir/utils.nim
index 7c19220796d..5d60fae5a9f 100644
--- a/compiler/mir/utils.nim
+++ b/compiler/mir/utils.nim
@@ -19,7 +19,8 @@ import
   compiler/mir/[
     mirbodies,
     mirenv,
-    mirtrees
+    mirtrees,
+    mirtypes
   ]
 
 func `$`(n: MirNode): string =
@@ -71,9 +72,9 @@ func `$`(n: MirNode): string =
     result.add " len: "
     result.add $n.len
 
-  if n.typ != nil:
+  if n.typ != VoidType:
     result.add " typ: "
-    result.add $n.typ.kind
+    result.addInt n.typ.uint32
 
 proc treeRepr*(tree: MirTree, pos = NodePosition(0)): string =
   ## Renders the node or sub-tree at `pos` to a string in a tree-layout-
@@ -155,6 +156,14 @@ func addName[I](result: var string, id: I, open: string, c: RenderCtx) =
   else:
     result.add c.env[][id].name.s
 
+proc typeToStr(result: var string, t: TypeId, env: ptr MirEnv) =
+  ## Appends the rendered type, or ``<T{id}>`` if no environment is available.
+  if env != nil: result.add typeToString(env.types[t])
+  else:
+    result.add "<T"
+    result.addInt t.uint32
+    result.add ">"
+
 func addLocalName(result: var string, id: LocalId, open: string,
                   c: RenderCtx) =
   if c.body.isNil:
@@ -218,17 +227,17 @@ proc singleToStr(n: MirNode, result: var string, c: RenderCtx) =
     if c.env.isNil:
       idToStr(result, n.number, "<Int: ")
     else:
-      result.addTypedNumber(c.env[].getInt(n.number), n.typ)
+      result.addTypedNumber(c.env[].getInt(n.number), c.env[][n.typ])
   of mnkUIntLit:
     if c.env.isNil:
       idToStr(result, n.number, "<UInt: ")
     else:
-      result.addTypedNumber(c.env[].getInt(n.number), n.typ)
+      result.addTypedNumber(c.env[].getInt(n.number), c.env[][n.typ])
   of mnkFloatLit:
     if c.env.isNil:
       idToStr(result, n.number, "<Float: ")
     else:
-      result.addTypedNumber(c.env[].getInt(n.number), n.typ)
+      result.addTypedNumber(c.env[].getInt(n.number), c.env[][n.typ])
   of mnkStrLit:
     if c.env.isNil:
       result.add "<Str: "
@@ -242,7 +251,7 @@ proc singleToStr(n: MirNode, result: var string, c: RenderCtx) =
     result.add "<Ast>"
   of mnkType:
     result.add "type("
-    result.add $n.typ
+    typeToStr(result, n.typ, c.env)
     result.add ")"
   of AllNodeKinds - Atoms - mnkProc:
     result.add "<error: " & $n.kind & ">"
@@ -253,6 +262,13 @@ proc singleToStr(tree: MirTree, i: var int, result: var string, c: RenderCtx) =
 template singleToStr() =
   singleToStr(treeParam(), i, result, c)
 
+proc fieldToStr(field: int32, typ: TypeId, result: var string, c: RenderCtx) =
+  ## Appends the field's name, or ``Field`` plus the raw field number if no
+  ## environment is available for looking up the type.
+  if c.env != nil:
+    result.add lookupInType(c.env[][typ], field.int).name.s
+  else: result.add "Field"; result.addInt field
+
 template valueToStr() =
   mixin valueToStr
   valueToStr(treeParam(), i, result, c)
@@ -281,12 +297,12 @@ proc valueToStr(nodes: MirTree, i: var int, result: var string, c: RenderCtx) =
       let typ = nodes[i].typ # type of the object operand
       valueToStr()
       result.add "."
-      result.add lookupInType(typ, n.field).name.s
+      fieldToStr(n.field, typ, result, c)
   of mnkPathConv:
     tree "":
       valueToStr()
       result.add ".("
-      result.add typeToString(n.typ)
+      typeToStr(result, n.typ, c.env)
       result.add ")"
   of mnkDeref, mnkDerefView:
     tree "":
@@ -401,8 +417,7 @@ proc exprToStr(nodes: MirTree, i: var int, result: var string, c: RenderCtx) =
     let typ = nodes[i].typ
     tree "(":
       commaSeparated:
-        let field = lookupInType(typ, next(nodes, i).field.int)
-        result.add field.name.s & ": "
+        fieldToStr(next(nodes, i).field, typ, result, c)
         argToStr()
       result.add ")"
   of mnkCall:
@@ -454,7 +469,7 @@ proc renderNameWithType(tree: MirTree, i: var int, result: var string,
   let n {.cursor.} = next(tree, i)
   singleToStr(n, result, c)
   result.add ": "
-  result.add typeToString(n.typ)
+  typeToStr(result, n.typ, c.env)
 
 proc renderList(tree: MirTree, i: var int, indent: int, result: var string,
                 c: RenderCtx)
@@ -583,7 +598,7 @@ proc stmtToStr(nodes: MirTree, i: var int, indent: int, result: var string,
   of mnkVoid:
     # drop the 'discard' prefix if the expression is a void expression
     let lead =
-      if nodes[i].typ.kind == tyVoid: ""
+      if nodes[i].typ == VoidType: ""
       else: "discard "
     tree lead:
       exprToStr()
diff --git a/compiler/sem/injectdestructors.nim b/compiler/sem/injectdestructors.nim
index ca44b7803e6..e33517292d2 100644
--- a/compiler/sem/injectdestructors.nim
+++ b/compiler/sem/injectdestructors.nim
@@ -87,6 +87,7 @@ import
   compiler/mir/[
     analysis,
     mirbodies,
+    mirtypes,
     mirchangesets,
     mirconstr,
     mirenv,
@@ -201,10 +202,6 @@ func findScope(entities: EntityDict, name: EntityName, at: InstrPos,
   else:
     exists = false
 
-
-proc getVoidType(g: ModuleGraph): PType {.inline.} =
-  g.getSysType(unknownLineInfo, tyVoid)
-
 func isNamed(tree: MirTree, val: OpValue): bool =
   ## Returns whether `val` is the projection of a named location (or refers to
   ## the named location itself).
@@ -243,7 +240,7 @@ iterator nodesWithScope(tree: MirTree): (NodePosition, lent MirNode, Slice[NodeP
 
   #result.pos = p
 
-func initEntityDict(tree: MirTree, dfg: DataFlowGraph): EntityDict =
+func initEntityDict(tree: MirTree, dfg: DataFlowGraph, env: MirEnv): EntityDict =
   ## Collects the names of all analysable locations relevant to destructor
   ## injection and the move analyser. This includes: locals, temporaries, sink
   ## parameters and, with some restrictions, globals.
@@ -255,20 +252,7 @@ func initEntityDict(tree: MirTree, dfg: DataFlowGraph): EntityDict =
     case n.kind
     of mnkDef, mnkDefUnpack:
       let entity = tree[getDefEntity(tree, i)]
-
-      let t =
-        case entity.kind
-        of mnkParam:
-          assert isSinkTypeForParam(entity.typ)
-          entity.typ
-        of mnkLocal:
-          entity.typ
-        of mnkTemp, mnkGlobal:
-          entity.typ
-        else:
-          unreachable()
-
-      if hasDestructor(t):
+      if hasDestructor(env[entity.typ]):
         result.mgetOrPut(toName(entity), @[]).add:
           # don't include the data-flow operations preceding the def
           EntityInfo(def: i, scope: subgraphFor(dfg, i .. scope.b))
@@ -299,7 +283,7 @@ func computeOwnership(tree: MirTree, cfg: DataFlowGraph, entities: EntityDict,
     unreachable()
 
 func collapseSink(tree: MirTree, cfg: var DataFlowGraph,
-                  entities: EntityDict): Moves =
+                  entities: EntityDict, env: TypeEnv): Moves =
   ## Computes for every ``mnkSink`` node what operation (copy or move) it has
   ## to collapse to, returning a set with the operands of all sinks that are
   ## collapsed into moves.
@@ -314,7 +298,7 @@ func collapseSink(tree: MirTree, cfg: var DataFlowGraph,
   for i, op, opr in cfg.instructions:
     if op == opUse and tree[tree.parent(NodePosition opr)].kind == mnkSink:
       # it's the DFG instruction for a sink
-      if hasDestructor(tree[opr].typ) and
+      if hasDestructor(env[tree[opr].typ]) and
          computeOwnership(tree, cfg, entities,
                           computePath(tree, NodePosition opr), i + 1):
         update.add i
@@ -502,12 +486,12 @@ template buildVoidCall*(bu: var MirBuilder, env: var MirEnv, p: PSym,
                        body: untyped) =
   let prc = p # prevent multi evaluation
   bu.subTree mnkVoid:
-    bu.buildCall env.procedures.add(prc), getVoidType(graph):
+    bu.buildCall env.procedures.add(prc), VoidType:
       body
 
 proc genWasMoved(bu: var MirBuilder, graph: ModuleGraph, target: Value) =
   bu.subTree MirNode(kind: mnkVoid):
-    bu.buildMagicCall mWasMoved, getVoidType(graph):
+    bu.buildMagicCall mWasMoved, VoidType:
       bu.emitByName(target, ekKill)
 
 func destructiveMoveOperands(bu: var MirBuilder, tree: MirTree,
@@ -636,14 +620,14 @@ proc consumeArg(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
         genWasMoved(bu, ctx.graph, v)
 
 proc rewriteAssignments(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
-                        c: var Changeset) =
+                        env: TypeEnv, c: var Changeset) =
   ## Rewrites assignments to locations into calls to either the ``=copy``
   ## or ``=sink`` hook (see ``expandAsgn`` for more details).
   ##
   ## Also injects the necessary location reset logic for lvalues passed to
   ## 'consume' argument sinks.
   for i, opc, val in ctx.cfg.instructions:
-    if opc == opConsume and hasDestructor(tree[val].typ):
+    if opc == opConsume and hasDestructor(env[tree[val].typ]):
       # disarm the destructors for locations of which the value is consumed
       # but that are reassigned or destroyed after
       let parent = tree.parent(NodePosition val)
@@ -758,8 +742,8 @@ proc lowerBranchSwitch(bu: var MirBuilder, body: MirTree, graph: ModuleGraph,
   let
     target = body.operand(stmt, 0)
     objType = body[target].typ
-    field = lookupInType(objType, body[target].field.int)
-    typ = field.typ
+    field = lookupInType(env[objType], body[target].field.int)
+    typ = env.types.add(field.typ)
 
   assert body[target].kind == mnkPathVariant
   # the source expression must either be an rvalue, or there must be a
@@ -775,7 +759,7 @@ proc lowerBranchSwitch(bu: var MirBuilder, body: MirTree, graph: ModuleGraph,
       bu.emitFrom(body, body.child(stmt, 1))
 
   # check if the object contains fields requiring destruction:
-  if hasDestructor(objType):
+  if hasDestructor(env[objType]):
     # XXX: we are only interested in if the *record-case* contains fields
     #      requiring destruction, not the whole *object*. If none of the
     #      branches requires destruction, but the enclosing object does,
@@ -792,25 +776,22 @@ proc lowerBranchSwitch(bu: var MirBuilder, body: MirTree, graph: ModuleGraph,
     #      Depending on how it's implemented, this approach has issues with
     #      field alignment, however.
     let branchDestructor = produceDestructorForDiscriminator(
-                            graph, objType,
+                            graph, env[objType],
                             field,
                             unknownLineInfo, idgen
                            )
 
-    let
-      boolTyp = graph.getSysType(unknownLineInfo, tyBool)
-
     # XXX: comparing the discrimant values here means that the branch is
     #      destroyed even if the branch doesn't change. This differs from
     #      the VM's behaviour. There, the branch is only reset if it's
     #      actually changed
-    var val = bu.wrapTemp(boolTyp):
-      bu.buildMagicCall(getMagicEqForType(typ), boolTyp):
+    var val = bu.wrapTemp BoolType:
+      bu.buildMagicCall(getMagicEqForType(field.typ), BoolType):
         bu.emitByVal a
         bu.emitByVal b
 
-    val = bu.wrapTemp(boolTyp):
-      bu.buildMagicCall mNot, boolTyp:
+    val = bu.wrapTemp BoolType:
+      bu.buildMagicCall mNot, BoolType:
          bu.emitByVal val
 
     var src = body.child(NodePosition target, 0)
@@ -883,8 +864,8 @@ proc injectDestructorCalls*(g: ModuleGraph, idgen: IdGenerator,
       actx = AnalyseCtx(graph: g, cfg: computeDfg(body.code))
 
     let
-      entities = initEntityDict(body.code, actx.cfg)
-      moves = collapseSink(body.code, actx.cfg, entities)
+      entities = initEntityDict(body.code, actx.cfg, env)
+      moves = collapseSink(body.code, actx.cfg, entities, env.types)
 
     let destructors = computeDestructors(body.code, actx.cfg, entities)
 
@@ -893,7 +874,7 @@ proc injectDestructorCalls*(g: ModuleGraph, idgen: IdGenerator,
       AnalysisResults(moves: cursor(moves),
                       entities: cursor(entities),
                       destroy: cursor(destructors)),
-      changes)
+      env.types, changes)
 
     injectDestructors(body.code, g, destructors, env, changes)
 
diff --git a/compiler/vm/compilerbridge.nim b/compiler/vm/compilerbridge.nim
index 249f7113029..a6e50f661e5 100644
--- a/compiler/vm/compilerbridge.nim
+++ b/compiler/vm/compilerbridge.nim
@@ -95,13 +95,22 @@ type
   ExecutionResult* = Result[PNode, ExecErrorReport]
 
   PEvalContext* = ref EvalContext
-  EvalContext* = object of TPassContext
+  EvalContext* {.final.} = object of RootObj
     ## All state required to on-demand translate AST to VM bytecode and execute
     ## it. An ``EvalContext`` instance makes up everything that is required
     ## for running code at compile-time.
     vm*: TCtx
     jit*: JitState
 
+  PVmCtx* = ref object of RootObj
+    ## Wrapper type intended for storing only a VM instance (without a JIT
+    ## environment) in the module graph.
+    context*: TCtx
+
+  PEvalPassContext = ref object of PPassContext
+    ## Pass context for the evaluation pass.
+    graph: ModuleGraph
+    module: PSym
     oldErrorCount: int
 
 # prevent a default `$` implementation from being generated
@@ -460,7 +469,12 @@ proc setupGlobalCtx*(module: PSym; graph: ModuleGraph; idgen: IdGenerator) =
     ctx.flags = {cgfAllowMeta}
     registerAdditionalOps(ctx, disallowDangerous)
 
-    graph.vm = PEvalContext(vm: ctx)
+    graph.vm = PEvalContext(vm: ctx, jit: initJit(graph))
+  elif graph.vm of PVmCtx:
+    # take the VM instance provided by the wrapper and create a proper
+    # evaluation context from it
+    let ctx = move PVmCtx(graph.vm).context
+    graph.vm = PEvalContext(vm: ctx, jit: initJit(graph))
   else:
     let c = PEvalContext(graph.vm)
     refresh(c.vm, module, idgen)
@@ -691,26 +705,39 @@ proc setGlobalValue*(c: var EvalContext; s: PSym, val: PNode) =
 ## the ``nimeval`` interface
 
 proc myOpen(graph: ModuleGraph; module: PSym; idgen: IdGenerator): PPassContext {.nosinks.} =
-  #var c = newEvalContext(module, emRepl)
-  #c.features = {allowCast, allowInfiniteLoops}
-  #pushStackFrame(c, newStackFrame())
-
-  # XXX produce a new 'globals' environment here:
-  setupGlobalCtx(module, graph, idgen)
-  result = PEvalContext graph.vm
+  result = PEvalPassContext(idgen: idgen, graph: graph, module: module)
+
+proc isDecl(n: PNode): bool =
+  ## Returns whether `n` is purely declarative: imports, comments, and type,
+  ## constant, or routine definitions (or statement lists of only those).
+  const declKinds = {nkEmpty, nkTypeSection, nkConstSection, nkImportStmt,
+                     nkImportAs, nkImportExceptStmt, nkFromStmt,
+                     nkCommentStmt} + routineDefs
+  if n.kind == nkStmtList:
+    # a statement list is declarative only if all its statements are
+    for it in n.items:
+      if not isDecl(it): return false
+    result = true
+  else:
+    result = n.kind in declKinds
 
 proc myProcess(c: PPassContext, n: PNode): PNode =
-  let c = PEvalContext(c)
-  # don't eval errornous code:
-  if c.oldErrorCount == c.vm.config.errorCounter and not n.isError:
-    let r = evalStmt(c.jit, c.vm, n)
-    reportIfError(c.vm.config, r)
+  let c = PEvalPassContext(c)
+  # don't eval erroneous code. Also skip declarative nodes, as those represent
+  # type definitions required for bootstrapping the basic type environment
+  if c.oldErrorCount == c.graph.config.errorCounter and not n.isError and
+     not isDecl(n):
+    setupGlobalCtx(c.module, c.graph, c.idgen)
+    let eval = PEvalContext(c.graph.vm)
+
+    let r = evalStmt(eval.jit, eval.vm, n)
+    reportIfError(c.graph.config, r)
     # TODO: use the node returned by evalStmt as the result and don't report
     #       the error here
     result = newNodeI(nkEmpty, n.info)
   else:
     result = n
-  c.oldErrorCount = c.vm.config.errorCounter
+  c.oldErrorCount = c.graph.config.errorCounter
 
 proc myClose(graph: ModuleGraph; c: PPassContext, n: PNode): PNode =
   result = myProcess(c, n)
diff --git a/compiler/vm/nimeval.nim b/compiler/vm/nimeval.nim
index 69057e52390..3588777a4a9 100644
--- a/compiler/vm/nimeval.nim
+++ b/compiler/vm/nimeval.nim
@@ -174,7 +174,7 @@ proc createInterpreter*(
     # Register basic system operations and parts of stdlib modules
     for o in basicOps():
       vm.registerCallback(o.pattern, o.prc)
-  graph.vm = PEvalContext(vm: vm)
+  graph.vm = PVmCtx(context: vm)
   graph.compileSystemModule()
   result = Interpreter(mainModule: m, graph: graph, scriptName: scriptName, idgen: idgen)
 
@@ -219,7 +219,7 @@ proc runRepl*(
   var idgen = idGeneratorFromModule(m)
 
   if supportNimscript:
-    graph.vm = PEvalContext(vm: setupVM(m, cache, "stdin", graph, idgen))
+    graph.vm = PVmCtx(context: setupVM(m, cache, "stdin", graph, idgen))
 
   graph.compileSystemModule()
   processModule(graph, m, idgen, llStreamOpenStdIn(r))
diff --git a/compiler/vm/packed_env.nim b/compiler/vm/packed_env.nim
index d861e6ff736..f05c632a4f6 100644
--- a/compiler/vm/packed_env.nim
+++ b/compiler/vm/packed_env.nim
@@ -32,7 +32,8 @@ import
     rodfiles
   ],
   compiler/mir/[
-    mirtrees
+    mirtrees,
+    mirtypes
   ],
   compiler/utils/[
     idioms,
@@ -193,6 +194,11 @@ type
     ## Contextual state needed for turning data `PNode`-trees into
     ## `PackedDataNode` trees and storing them into the packed environment
     config*: ConfigRef
+    types*: ptr TypeEnv
+      # HACK: some parts of constant data encoding need read-only access to
+      #       the type environment, so a pointer to the environment is stored
+      #       here to prevent excessive parameter passing. No access to the
+      #       type environment should be required
     i: int ## the index in `PackedEnv.nodes` where the next item is to be stored
 
 const
@@ -298,7 +304,7 @@ func storeDiscrData(enc: var DataEncoder, e: var PackedEnv, s: PSym, v: Int128)
 proc storeFieldsData(enc: var DataEncoder, e: var PackedEnv,
                      t: MirTree, n: NodePosition) =
   let
-    typ = t[n].typ
+    typ = enc.types[][t[n].typ]
     count = t[n].len
   enc.put e, PackedDataNode(kind: pdkObj, pos: count.uint32)
   e.nodes.growBy(count * 2) # make space for the content
@@ -347,7 +353,7 @@ proc storeSetData(enc: var DataEncoder, e: var PackedEnv,
                   t: MirTree, n: NodePosition) =
   let
     count = t[n].len
-    typ = t[n].typ
+    typ = enc.types[][t[n].typ]
   enc.put e, PackedDataNode(kind: pdkSet, pos: count.uint32 * 2)
   e.nodes.growBy(count * 2) # make space for the content
 
@@ -373,7 +379,7 @@ func storeDataNode(enc: var DataEncoder, e: var PackedEnv,
                    t: MirTree, n: NodePosition) =
   case t[n].kind
   of mnkNilLit:
-    if t[n].typ.skipTypes(abstractInst).callConv == ccClosure:
+    if enc.types[][t[n].typ].skipTypes(abstractInst).callConv == ccClosure:
       # XXX: some unexpanded `nil` closure literals reach here, so we have
       #      to expand them here. This needs to happen earlier
       enc.put e, PackedDataNode(kind: pdkObj, pos: 2)
diff --git a/compiler/vm/vmbackend.nim b/compiler/vm/vmbackend.nim
index b74ed810cce..5b965368a66 100644
--- a/compiler/vm/vmbackend.nim
+++ b/compiler/vm/vmbackend.nim
@@ -31,7 +31,8 @@ import
     mirbodies,
     mirenv,
     mirgen,
-    mirtrees
+    mirtrees,
+    mirtypes
   ],
   compiler/modules/[
     modulegraphs,
@@ -235,7 +236,7 @@ proc storeData(enc: var PackedEncoder, dst: var PackedEnv,
                config: ConfigRef,
                consts: seq[(PVmType, DataId)], env: MirEnv) =
   ## Packs all constant data (`consts`) and stores it into `dst`.
-  var denc = DataEncoder(config: config)
+  var denc = DataEncoder(config: config, types: addr env.types)
   denc.startEncoding(dst)
 
   mapList(dst.cconsts, consts, it):
@@ -265,8 +266,7 @@ proc generateCode*(g: ModuleGraph, mlist: sink ModuleList) =
                                 magicsToKeep: MagicsToKeep))
 
   var c =
-    GenCtx(graph: g,
-           gen: CodeGenCtx(config: g.config, graph: g, mode: emStandalone))
+    GenCtx(graph: g, gen: initCodeGen(g))
 
   c.gen.typeInfoCache.init()
   c.gen.typeInfoCache.initRootRef(g.config, g.getCompilerProc("RootObj").typ)
@@ -300,7 +300,7 @@ proc generateCode*(g: ModuleGraph, mlist: sink ModuleList) =
   # produce a list with the type of each constant:
   var consts = newSeq[(PVmType, DataId)](c.gen.env.data.len)
   for i, data in c.gen.env.data.pairs:
-    let typ = c.gen.typeInfoCache.lookup(conf, data[0].typ)
+    let typ = c.gen.typeInfoCache.lookup(conf, c.gen.env[data[0].typ])
     consts[ord(i)] = (get(typ), i)
 
   env.typeInfoCache = move c.gen.typeInfoCache
diff --git a/compiler/vm/vmgen.nim b/compiler/vm/vmgen.nim
index 6100ed15980..f33cb4dd837 100644
--- a/compiler/vm/vmgen.nim
+++ b/compiler/vm/vmgen.nim
@@ -52,7 +52,8 @@ import
   ],
   compiler/mir/[
     mirenv,
-    mirtrees
+    mirtrees,
+    mirtypes
   ],
   compiler/front/[
     msgs,
@@ -180,7 +181,6 @@ type
     # immutable input parameters:
     graph*: ModuleGraph
     config*: ConfigRef
-    mode*: TEvalMode
     features*: TSandboxFlags
     module*: PSym
 
@@ -217,6 +217,9 @@ const
   noDest = TDest(-1)
   slotSomeTemp* = slotTempUnknown
 
+proc initCodeGen*(g: ModuleGraph): CodeGenCtx =
+  result = CodeGenCtx(config: g.config, graph: g, env: initMirEnv(g))
+
 proc getOrCreate*(c: var TCtx, typ: PType;
                   noClosure = false): PVmType {.inline.} =
   var cl: GenClosure
@@ -1083,7 +1086,7 @@ proc writeBackResult(c: var TCtx, info: CgNode) =
   ## If the result value fits into a register but is not stored in one
   ## (because it has its address taken, etc.), emits the code for storing it
   ## back into a register. `info` is only used to provide line information.
-  let typ = c.prc.body[resultId].typ
+  let typ = c.env[c.prc.body[resultId].typ]
   if not isEmptyType(typ) and fitsRegister(typ) and not isDirectView(typ) and
      c.prc[resultId].isIndirect:
       # a write-back is required. Load the value into temporary register and
@@ -1244,10 +1247,10 @@ proc genRegLoad(c: var TCtx, n: CgNode, dest, src: TRegister) {.inline.} =
 proc genFieldCheck(c: var TCtx; n: CgNode)
 proc genSym(c: var TCtx, n: CgNode, dest: var TDest, load = true)
 
-func usesRegister(p: BProc, s: LocalId): bool =
+func usesRegister(c: TCtx, s: LocalId): bool =
   ## Returns whether the location identified by `s` is backed by a register
   ## (that is, whether the value is stored in a register directly)
-  fitsRegister(p.body[s].typ) and not p[s].isIndirect
+  fitsRegister(c.env[c.prc.body[s].typ]) and not c.prc[s].isIndirect
 
 proc genNew(c: var TCtx; n: CgNode, dest: var TDest) =
   prepare(c, dest, n, n.typ)
@@ -1757,14 +1760,14 @@ func fitsRegister(t: PType): bool =
   st.kind in { tyBool, tyInt..tyUInt64, tyChar, tyPtr, tyPointer} or
     (st.sym != nil and st.sym.magic == mPNimrodNode) # NimNode goes into register too
 
-func usesRegister(p: BProc, n: CgNode): bool =
+func usesRegister(c: TCtx, n: CgNode): bool =
   ## Analyses and returns whether the value of the location named by l-value
   ## expression `n` is stored in a register instead of a memory location
   # XXX: instead of using a separate analysis, compute and return this as part
   #      of ``genLValue`` and
   case n.kind
   of cnkLocal:
-    usesRegister(p, n.local)
+    usesRegister(c, n.local)
   of cnkProc, cnkConst, cnkGlobal:
     false
   of cnkDeref, cnkDerefView, cnkFieldAccess, cnkArrayAccess, cnkTupleAccess,
@@ -1778,7 +1781,7 @@ proc genNoLoad(c: var TCtx, n: CgNode): tuple[reg: TRegister, isDirect: bool] =
   ## the result stores a handle or a value.
   var dest = noDest
   genLvalue(c, n, dest)
-  result = (TRegister(dest), usesRegister(c.prc, n))
+  result = (TRegister(dest), usesRegister(c, n))
 
 proc genMagic(c: var TCtx; n: CgNode; dest: var TDest; m: TMagic) =
   case m
@@ -2482,7 +2485,7 @@ proc genAsgnToLocal(c: var TCtx, le, ri: CgNode) =
       genToSlice(c, ri, dest, reified=false)
     else:
       gen(c, ri, dest)
-  elif usesRegister(c.prc, le.local):
+  elif usesRegister(c, le.local):
     gen(c, ri, dest)
   elif fitsRegister(le.typ):
     # the local is stored in-memory, a temporary register is needed
@@ -2638,7 +2641,7 @@ proc genSym(c: var TCtx; n: CgNode; dest: var TDest; load = true) =
     discard genType(c, n.typ) # make sure the type exists
     # somewhat hack-y, but the orchestrator later queries the type of the data
     # (which might be a different PType that maps to the same VM type)
-    discard genType(c, c.env[DataId pos][0].typ)
+    discard genType(c, c.env[c.env[DataId pos][0].typ])
   of cnkGlobal:
     # a global location
     let pos = useGlobal(c, n)
@@ -2655,7 +2658,7 @@ proc genSym(c: var TCtx; n: CgNode; dest: var TDest; load = true) =
   of cnkLocal:
       let local = c.prc[n.local].reg
       internalAssert(c.config, c.prc.regInfo[local].kind < slotSomeTemp)
-      if usesRegister(c.prc, n.local) or not load or not fitsRegister(n.typ):
+      if usesRegister(c, n.local) or not load or not fitsRegister(n.typ):
         if dest.isUnset:
           dest = local
         else:
@@ -2903,7 +2906,7 @@ proc genDef(c: var TCtx; a: CgNode) =
             # no initializer; only setup the register (and memory location,
             # if used)
             let reg = setSlot(c.prc, s)
-            let opc = if usesRegister(c.prc, s): opcLdNullReg
+            let opc = if usesRegister(c, s): opcLdNullReg
                       else: opcLdNull
 
             c.gABx(a, opc, reg, c.genType(typ))
@@ -2913,7 +2916,7 @@ proc genDef(c: var TCtx; a: CgNode) =
             # initialization is in progress:
             c.prc.regInfo[reg].kind = slotNoValue
             # XXX: checking for views here is wrong but necessary
-            if not usesRegister(c.prc, s) and not isDirectView(typ):
+            if not usesRegister(c, s) and not isDirectView(typ):
               # only setup a memory location if the local uses one
               c.gABx(a, opcLdNull, reg, c.genType(typ))
 
@@ -3205,7 +3208,7 @@ proc genStmt*(c: var TCtx; body: sink Body): Result[int, VmGenDiag] =
   except VmGenError as e:
     return typeof(result).err(move e.diag)
 
-  if not isEmptyType(c.prc.body[resultId].typ):
+  if c.prc.body[resultId].typ != VoidType:
     # the body has a result, emit a return
     c.gABC(n, opcRet, c.prc[resultId].reg)
 
@@ -3333,7 +3336,7 @@ proc genProcBody(c: var TCtx): int =
     # result register is setup at the start of macro evaluation
     # XXX: initializing the ``result`` of a macro should be handled through
     #      inserting the necessary code either in ``sem` or here
-    let rt = c.prc.body[resultId].typ
+    let rt = c.env[c.prc.body[resultId].typ]
     if not isEmptyType(rt) and fitsRegister(rt):
       # initialize the register holding the result
       if s.kind == skMacro:
@@ -3367,7 +3370,7 @@ proc genProcBody(c: var TCtx): int =
       # may pass it as a super type
       let env = TRegister(s.routineSignature.n.len)
       c.gABC(body, opcObjConv, env, env)
-      c.gABx(body, opcObjConv, 0, c.genType(c.prc.body[LocalId env].typ))
+      c.gABx(body, opcObjConv, 0, c.genType(c.env[c.prc.body[LocalId env].typ]))
 
     let eh = genSetEh(c, body.info)
     gen(c, body)
diff --git a/compiler/vm/vmjit.nim b/compiler/vm/vmjit.nim
index 5878ea57d67..506c9156c6d 100644
--- a/compiler/vm/vmjit.nim
+++ b/compiler/vm/vmjit.nim
@@ -36,9 +36,11 @@ import
     mirgen,
     mirpasses,
     mirtrees,
+    mirtypes
   ],
   compiler/modules/[
-    magicsys
+    magicsys,
+    modulegraphs
   ],
   compiler/sem/[
     transf
@@ -70,6 +72,10 @@ type
     gen: CodeGenCtx
       ## code generator state
 
+proc initJit*(graph: ModuleGraph): JitState =
+  ## Returns an initialized ``JitState`` instance.
+  JitState(gen: initCodeGen(graph))
+
 func env*(jit: JitState): lent MirEnv {.inline.} =
   ## The JIT code generator's MIR environment.
   jit.gen.env
@@ -93,7 +99,6 @@ func swapState(c: var TCtx, gen: var CodeGenCtx) =
   # input parameters:
   swap(graph)
   swap(config)
-  swap(mode)
   swap(features)
   swap(module)
   swap(callbackKeys)
@@ -126,7 +131,7 @@ proc updateEnvironment(c: var TCtx, env: var MirEnv, cp: EnvCheckpoint) =
   # constants
   for id, data in since(env.data, cp.data):
     let
-      typ = c.getOrCreate(data[0].typ)
+      typ = c.getOrCreate(env.types[data[0].typ])
       handle = c.allocator.allocConstantLocation(typ)
 
     initFromExpr(handle, data, env, c)
@@ -167,7 +172,7 @@ proc generateMirCode(c: var TCtx, env: var MirEnv, n: PNode;
 
     result = exprToMir(c.graph, env, selectOptions(c), n)
 
-proc generateIR(c: var TCtx, env: MirEnv, body: sink MirBody): Body =
+proc generateIR(c: var TCtx, env: var MirEnv, body: sink MirBody): Body =
   backends.generateIR(c.graph, c.idgen, env, c.module, body)
 
 proc setupRootRef(c: var TCtx) =
diff --git a/compiler/vm/vmserialize.nim b/compiler/vm/vmserialize.nim
index be51f79dcc7..cd40fd36a5a 100644
--- a/compiler/vm/vmserialize.nim
+++ b/compiler/vm/vmserialize.nim
@@ -87,7 +87,7 @@ proc initFromExpr(dest: LocHandle, tree: MirTree, n: var int, env: MirEnv,
     else:
       # allocate a managed heap location and fill it:
       let
-        t = c.getOrCreate(tree[n].typ)
+        t = c.getOrCreate(env[tree[n].typ])
         slot = c.heap.heapNew(c.allocator, t.targetType)
       recurse(c.heap.unsafeDeref(slot))
       deref(dest).refVal = slot
@@ -97,7 +97,7 @@ proc initFromExpr(dest: LocHandle, tree: MirTree, n: var int, env: MirEnv,
       toInt(val - first)
 
     let first =
-      if tree[n].len > 0: firstOrd(c.config, tree[n].typ)
+      if tree[n].len > 0: firstOrd(c.config, env[tree[n].typ])
       else:               Zero
     # XXX: ^^ ``set[empty]``-typed literals reach here, but they shouldn't. The
     #      len guard works around the issue
@@ -126,7 +126,7 @@ proc initFromExpr(dest: LocHandle, tree: MirTree, n: var int, env: MirEnv,
       iterTree(j):
         arg recurse(dest.getFieldHandle(j.FieldPosition))
     of mnkObjConstr:
-      let typ = tree[n].typ.skipTypes(abstractPtrs) ## the object's type
+      let typ = env[tree[n].typ].skipTypes(abstractPtrs) ## the object's type
       iterTree(i):
         let
           sym = lookupInType(typ, next().field)
diff --git a/tests/compiler/tdatatables.nim b/tests/compiler/tdatatables.nim
index f875c0a275e..cf72a869da1 100644
--- a/tests/compiler/tdatatables.nim
+++ b/tests/compiler/tdatatables.nim
@@ -4,17 +4,18 @@ discard """
 """
 
 import compiler/ast/ast
+import compiler/mir/mirtypes
 include compiler/mir/datatables
 
 # some placeholder types to assing to the nodes. For object types, a different
 # ID means that it's a different type
 let
-  t1 = PType(itemId: ItemId(item: 1), kind: tyObject, sons: @[PType nil])
-  t2 = PType(itemId: ItemId(item: 2), kind: tyObject, sons: @[PType nil])
-  t3 = PType(itemId: ItemId(item: 3), kind: tyObject, sons: @[PType nil])
+  t1 = Int8Type
+  t2 = Int16Type
+  t3 = Int32Type
 
 # node constructor
-template node(k: MirNodeKind, t: PType, field, val: untyped): MirNode =
+template node(k: MirNodeKind, t: TypeId, field, val: untyped): MirNode =
   MirNode(kind: k, typ: t, field: val)
 template node(k: MirNodeKind, field, val: untyped): MirNode =
   MirNode(kind: k, field: val)

From 14bb4d8281d9ed42d0fe2b253548ac33d669f1e8 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Thu, 18 Apr 2024 01:36:26 +0200
Subject: [PATCH 066/169] mir: shrink size of `MirNode` (#1279)

## Summary

Shrink the size of a `MirNode` from 24 byte (on a 64bit target) to 16
byte, reducing memory consumption and copying cost, as well as
increasing the number of nodes fitting in a cache line.

## Details

The `len` field was an `int`, resulting in the object's `case` section
having an alignment requirement and size of 8 bytes (for a 64bit target).
Since the `len` field is never negative, it's changed into a `uint32`
field. This also makes the size of a `MirNode` target-independent.
---
 compiler/mir/mirgen.nim   | 19 ++++++++++---------
 compiler/mir/mirtrees.nim |  2 +-
 2 files changed, 11 insertions(+), 10 deletions(-)

diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index 1000586c2be..0ad55e6de73 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -1174,7 +1174,8 @@ proc genClosureConstr(c: var TCtx, n: PNode, isConsume: bool) =
 proc genObjConstr(c: var TCtx, n: PNode, isConsume: bool) =
   let isRef = n.typ.skipTypes(abstractInst).kind == tyRef
 
-  c.subTree MirNode(kind: mnkObjConstr, typ: c.typeToMir(n.typ), len: n.len-1):
+  c.subTree MirNode(kind: mnkObjConstr, typ: c.typeToMir(n.typ),
+                    len: uint32(n.len-1)):
     for i in 1..<n.len:
       let it = n[i]
       let field = lookupFieldAgain(n.typ.skipTypes(abstractInst), it[0].sym)
@@ -1585,12 +1586,12 @@ proc genCase(c: var TCtx, n: PNode, dest: Destination) =
   assert isEmptyType(n.typ) == not dest.isSome
 
   let v = genUse(c, n[0])
-  c.add MirNode(kind: mnkCase, len: n.len - 1)
+  c.add MirNode(kind: mnkCase, len: uint32(n.len - 1))
   c.use v
 
   # iterate of/else branches:
   for (_, branch) in branches(n):
-    c.add MirNode(kind: mnkBranch, len: branch.len - 1)
+    c.add MirNode(kind: mnkBranch, len: uint32(branch.len - 1))
 
     case branch.kind
     of nkElse:
@@ -1619,7 +1620,7 @@ proc genExceptBranch(c: var TCtx, n: PNode, dest: Destination) =
   assert n.kind == nkExceptBranch
   c.builder.useSource(c.sp, n)
 
-  c.subTree MirNode(kind: mnkBranch, len: n.len - 1):
+  c.subTree MirNode(kind: mnkBranch, len: uint32(n.len - 1)):
     # emit the exception types the branch covers:
     for _, tn in branchLabels(n):
       case tn.kind
@@ -1643,7 +1644,7 @@ proc genTry(c: var TCtx, n: PNode, dest: Destination) =
     hasFinally = n.lastSon.kind == nkFinally
     hasExcept = n[1].kind == nkExceptBranch
 
-  c.add MirNode(kind: mnkTry, len: ord(hasFinally) + ord(hasExcept))
+  c.add MirNode(kind: mnkTry, len: uint32(ord(hasFinally) + ord(hasExcept)))
   c.scope:
     c.genBranch(n[0], dest)
 
@@ -1653,7 +1654,7 @@ proc genTry(c: var TCtx, n: PNode, dest: Destination) =
     ## the number of sub-nodes excluding ``nkFinally``
 
   if hasExcept:
-    c.subTree MirNode(kind: mnkExcept, len: len-1):
+    c.subTree MirNode(kind: mnkExcept, len: uint32(len-1)):
       for i in 1..<len:
         genExceptBranch(c, n[i], dest)
 
@@ -2280,7 +2281,7 @@ proc constDataToMir*(env: var MirEnv, n: PNode): MirTree =
       # no normalization/canonicalization takes place here, meaning that
       # ``Obj(a: 0, b: 1)`` and ``Obj(b: 1, a: 0)`` will result in two data
       # table entries, even though the values they represent are equivalent
-      bu.subTree MirNode(kind: mnkObjConstr, typ: typ, len: n.len-1):
+      bu.subTree MirNode(kind: mnkObjConstr, typ: typ, len: uint32(n.len-1)):
         for i in 1..<n.len:
           bu.add MirNode(kind: mnkField, field: n[i][0].sym.position.int32)
           bu.subTree mnkArg:
@@ -2288,7 +2289,7 @@ proc constDataToMir*(env: var MirEnv, n: PNode): MirTree =
     of nkCurly:
       # similar to object construction, no normalization means that ``{1, 2}``
       # and ``{2, 1}`` results in two data table entries
-      bu.subTree MirNode(kind: mnkSetConstr, typ: typ, len: n.len):
+      bu.subTree MirNode(kind: mnkSetConstr, typ: typ, len: uint32(n.len)):
         for it in n.items:
           constToMirAux(bu, env, it)
     of nkBracket, nkTupleConstr, nkClosure:
@@ -2300,7 +2301,7 @@ proc constDataToMir*(env: var MirEnv, n: PNode): MirTree =
         of tyProc:                  mnkClosureConstr
         else:                       unreachable()
 
-      bu.subTree MirNode(kind: kind, typ: typ, len: n.len):
+      bu.subTree MirNode(kind: kind, typ: typ, len: uint32(n.len)):
         for it in n.items:
           bu.subTree mnkArg:
             constToMirAux(bu, env, it.skipColon)
diff --git a/compiler/mir/mirtrees.nim b/compiler/mir/mirtrees.nim
index 1eab6ece408..94901baaf49 100644
--- a/compiler/mir/mirtrees.nim
+++ b/compiler/mir/mirtrees.nim
@@ -309,7 +309,7 @@ type
       effect*: EffectKind ## the effect that happens when the operator the
                           ## tagged value is passed to is executed
     else:
-      len*: int
+      len*: uint32
 
   MirTree* = seq[MirNode]
   MirNodeSeq* = seq[MirNode]

From 8c271397002373af0e173a388c8dac870bd6514e Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Thu, 18 Apr 2024 23:13:35 +0200
Subject: [PATCH 067/169] fix behaviour of closed-over locals in `and`/`or`
 expressions (#1278)

## Summary

Fix closed-over locals defined as part of `and`/`or` expressions not
having their default value when their defined-in sub-expression was
short-circuited.

## Details

Bindings part of `and`/`or` expressions were so far hoisted to the
start of their scope by the "unscoped def" handling in `cgirgen`, which
doesn't apply to lifted locals, since these don't have a `def` (they're
part of the environment object).

Performing the hoisting in `transf` makes sure the behaviour of closed-
over locals matches that of not closed-over ones, and it also removes
the reliance on `cgirgen`.

The hoisting works by scanning transformed `and`/`or` expressions for
bindings that are within the *same* scope as the `and`/`or` expression,
and moving them to the start of the `and`/`or` expression.

For example, `(let a = 0; x) or (let b = 0; y)` is transformed into
`(let a; let b; (a = 0; x) or (b = 0; y))`.

Lifted globals (`.global` and `.thread`) have to be accounted for by
the hoisting pass, since they have not been lifted yet at this point.
---
 compiler/sem/transf.nim                       | 77 +++++++++++++++++++
 .../lang_callable/closure/tclosure_issues.nim | 27 ++++++-
 2 files changed, 103 insertions(+), 1 deletion(-)

diff --git a/compiler/sem/transf.nim b/compiler/sem/transf.nim
index 0728f544adb..533f74baaf1 100644
--- a/compiler/sem/transf.nim
+++ b/compiler/sem/transf.nim
@@ -1032,6 +1032,81 @@ proc flattenTree(root: PNode): PNode =
   else:
     result = root
 
+proc transformAndOr(c: PTransf, n: PNode): PNode =
+  ## Transforms both operands and hoists all locals within them that are in
+  ## the outermost scope to the start of the and/or expression:
+  ##
+  ##   (let x = 0; a) or (var y; y = 1; b)
+  ##   # ->
+  ##   (let x; var y; (x = 0; a) or (y = 1; b))
+  ##
+  ## This makes sure that the bindings' lifetime is delimited by the `and`/`or`
+  ## expression's enclosing scope, even after lowering the expression.
+  proc hoist(c: PTransf, n: sink PNode, target: PNode): PNode {.nimcall.} =
+    # traverse all statements/expressions within the *same* scope
+    case n.kind
+    of nkVarSection, nkLetSection:
+      result = newTreeI(nkStmtList, n.info)
+
+      for it in n.items:
+        case it.kind
+        of nkIdentDefs:
+          if (it[0].kind == nkSym and (sfGlobal notin it[0].sym.flags or
+              it[0].sym.owner.kind notin routineKinds)) or
+             it[0].kind == nkDotExpr:
+            # local or module-level global. The initializer expression must be
+            # processed first, since locations defined therein start their
+            # lifetime earlier. That is, for ``var x = (var y = 0; y)`` the
+            # ``var y`` must be hoisted first
+            let src = hoist(c, move it[2], target)
+            target.add newTreeI(n.kind, it.info,
+              newTreeI(nkIdentDefs, it.info, it[0], c.graph.emptyNode,
+                        c.graph.emptyNode))
+            if src.kind != nkEmpty:
+              result.add newTreeI(nkAsgn, it.info, it[0], src)
+          else:
+            # a global defined within a procedure, leave as is
+            result.add newTreeI(n.kind, n.info, it)
+        of nkVarTuple:
+          # lower into assignments first, then process the result
+          let x = lowerTupleUnpacking(c.graph, it, c.idgen, getCurrOwner(c))
+          result.add hoist(c, x, target)
+        else:
+          unreachable()
+
+      if result.len == 0:
+        # all definitions were hoisted
+        result = c.graph.emptyNode
+
+    of nkHiddenAddr, nkHiddenDeref, nkAddr, nkDerefExpr, nkObjDownConv,
+        nkObjUpConv, nkStringToCString, nkCStringToString, nkCheckedFieldExpr:
+      result = n
+      result[0] = hoist(c, move result[0], target)
+    of nkCast, nkConv, nkHiddenStdConv, nkHiddenSubConv, nkPragmaBlock:
+      result = n
+      result[1] = hoist(c, move result[1], target)
+    of nkDotExpr, nkBracketExpr, nkCallKinds, nkBracket, nkTupleConstr,
+        nkChckRangeF, nkChckRange64, nkChckRange, nkStmtListExpr, nkStmtList:
+      result = n
+      for i in 0..<result.len:
+        result[i] = hoist(c, move result[i], target)
+    else:
+      # other expressions or statements are either declarative or open a
+      # new scope
+      result = n
+
+  if c.inlining > 0:
+    # hoisting already happened for inlined and/or expressions
+    result = transformSons(c, n)
+  else:
+    var hoisted = newTreeIT(nkStmtListExpr, n.info, n.typ)
+    result = hoist(c, transformSons(c, n), hoisted)
+
+    if hoisted.len > 0:
+      # append the transformed expression to the statement list:
+      hoisted.add result
+      result = hoisted
+
 proc transformCall(c: PTransf, n: PNode): PNode =
   var n = flattenTree(n)
   let op = getMergeOp(n)
@@ -1066,6 +1141,8 @@ proc transformCall(c: PTransf, n: PNode): PNode =
     result = transform(c, n[1])
   elif magic == mExpandToAst:
     result = transformExpandToAst(c, n)
+  elif magic in {mAnd, mOr}:
+    result = transformAndOr(c, n)
   else:
     let s = transformSons(c, n)
     # bugfix: check after 'transformSons' if it's still a method call:
diff --git a/tests/lang_callable/closure/tclosure_issues.nim b/tests/lang_callable/closure/tclosure_issues.nim
index a1f6d15e825..51a8770bb2d 100644
--- a/tests/lang_callable/closure/tclosure_issues.nim
+++ b/tests/lang_callable/closure/tclosure_issues.nim
@@ -121,4 +121,29 @@ block:
     doAssert typeof(inner) isnot "closure"
     inner()
 
-  test()
\ No newline at end of file
+  test()
+
+block closed_over_local_in_or_expression:
+  # regression test: closed-over locals defined in ``or`` expressions
+  # behaved differently compared to when not being closed over
+
+  proc test() =
+    var i = 0
+    var take = false
+    while i < 2: # run the body two times
+      if (let x = 1; take) or (let y = 2; not take):
+        proc inner() =
+          # close over `y`
+          discard y
+
+        inner()
+
+        if take:
+          doAssert y == 0
+        else:
+          doAssert y == 2
+
+      take = true # enable short-circuiting
+      inc i
+
+  test()

From afc4b825e1a56afdb9ea6ab333efdd3d599ecf8e Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Fri, 19 Apr 2024 02:04:16 +0200
Subject: [PATCH 068/169] lower `new` and `ref` construction with MIR pass
 (#1280)

## Summary

Perform the lowering of `new` and `ref` constructions with a MIR pass,
moving the logic out of the C code generator. This is progress towards
having the code generator operate on only a very small core language.

## Details

### MIR

* introduce the `mnkRefConstr` node; `mnkObjConstr` is now only used
  for object constructions. While both are the same syntactically,
  they're very different semantically, and distinguishing them in
  syntax makes analysis and lowering easier
* no new CGIR counterpart is added; `mnkRefConstr` is translated to
  `cnkObjConstr`, meaning that no code generator change is required
* `TypeEnv` now provides the integer type to use for size-like values
  via the `sizeType` procedure

### Lowering

The lowering is largely equivalent to the one previously performed by
`cgen`. That is:
* the standard `new` is turned into `nimNewObjUninit` + `default(T)`
* the unsafe `new`-with-size is turned into `nimNewObj` + `default(T)`
* a `ref` construction (e.g.: `var x = RefObj(...)`) is turned into
  `def x = nimNewObjUninit(...); x[] = Obj(...)`

Compared to the previous lowering in `cgen`, the difference is that both
the standard `new` and `ref` constructions now use the non-zeroing
`nimNewObjUninit`. In the case of the standard `new`, if the type has
embedded type fields, this eliminates an unnecessary `memset`, but
observable behaviour stays the same.

### C Code Generator

Handling of the `mNew` magic (`genNew`) and `ref` constructions
(implemented in `genObjConstr`) are both obsolete, and thus removed.
---
 compiler/backend/ccgexprs.nim |  77 ++----------------------
 compiler/backend/cgirgen.nim  |   2 +-
 compiler/backend/compat.nim   |   2 +-
 compiler/mir/datatables.nim   |   4 +-
 compiler/mir/mirgen.nim       |   9 ++-
 compiler/mir/mirpasses.nim    | 108 +++++++++++++++++++++++++++++++++-
 compiler/mir/mirtrees.nim     |  12 ++--
 compiler/mir/mirtypes.nim     |  22 ++++++-
 compiler/mir/utils.nim        |   2 +-
 compiler/sem/mirexec.nim      |   2 +-
 compiler/vm/packed_env.nim    |   2 +-
 compiler/vm/vmserialize.nim   |   2 +-
 doc/mir.rst                   |   5 +-
 13 files changed, 155 insertions(+), 94 deletions(-)

diff --git a/compiler/backend/ccgexprs.nim b/compiler/backend/ccgexprs.nim
index 55569fb331f..0a994368b22 100644
--- a/compiler/backend/ccgexprs.nim
+++ b/compiler/backend/ccgexprs.nim
@@ -870,39 +870,6 @@ proc genDefault(p: BProc; n: CgNode; d: var TLoc) =
     getTemp(p, n.typ, d)
   resetLoc(p, d)
 
-proc rawGenNew(p: BProc, a: var TLoc, sizeExpr: Rope; needsInit: bool; doInitObj = true) =
-  var sizeExpr = sizeExpr
-  let typ = a.t
-  var b: TLoc
-  initLoc(b, locExpr, a.lode, OnHeap)
-  let refType = typ.skipTypes(abstractInst)
-  assert refType.kind == tyRef
-  let bt = refType.lastSon
-  if sizeExpr == "":
-    sizeExpr = "sizeof($1)" % [getTypeDesc(p.module, bt)]
-
-  block:
-    if needsInit:
-      b.r = ropecg(p.module, "($1) #nimNewObj($2, NIM_ALIGNOF($3))",
-          [getTypeDesc(p.module, typ), sizeExpr, getTypeDesc(p.module, bt)])
-    else:
-      b.r = ropecg(p.module, "($1) #nimNewObjUninit($2, NIM_ALIGNOF($3))",
-          [getTypeDesc(p.module, typ), sizeExpr, getTypeDesc(p.module, bt)])
-    genAssignment(p, a, b)
-
-  if doInitObj:
-    # set the object type:
-    genObjectInit(p, cpsStmts, bt, a, constructRefObj)
-
-proc genNew(p: BProc, e: CgNode, a: var TLoc) =
-  # 'genNew' also handles 'unsafeNew':
-  if e.len == 2:
-    var se: TLoc
-    initLocExpr(p, e[1], se)
-    rawGenNew(p, a, se.rdLoc, needsInit = true)
-  else:
-    rawGenNew(p, a, "", needsInit = true)
-
 proc genNewSeqOfCap(p: BProc; e: CgNode; d: var TLoc) =
   let seqtype = skipTypes(e.typ, abstractVarRange)
   var a: TLoc
@@ -1034,13 +1001,7 @@ proc specializeInitObject(p: BProc, accessor: Rope, typ: PType,
     discard
 
 proc genObjConstr(p: BProc, e: CgNode, d: var TLoc) =
-  var t = e.typ.skipTypes(abstractInst)
-  let isRef = t.kind == tyRef
-
-  # a temporary was injected if in-place construction cannot be used,
-  # meaning that we can always construct in-place here (we still have
-  # to consider uninitialized and expression locs)
-  let useTemp = isRef or d.k == locNone
+  let t = e.typ.skipTypes(abstractInst)
 
   # if the object has a record-case, don't initialize type fields before but
   # after initializing discriminators. Otherwise, the type fields in the
@@ -1057,22 +1018,8 @@ proc genObjConstr(p: BProc, e: CgNode, d: var TLoc) =
 
     v
 
-  var tmp: TLoc
-  var r: Rope
-  if useTemp:
-    getTemp(p, t, tmp)
-    r = rdLoc(tmp)
-    if isRef:
-      rawGenNew(p, tmp, "",
-                needsInit = true,
-                doInitObj = not hasCase)
-      t = t.lastSon.skipTypes(abstractInst)
-      r = "(*$1)" % [r]
-    else:
-      constructLoc(p, tmp, doInitObj = not hasCase)
-  else:
-    resetLoc(p, d, doInitObj = not hasCase)
-    r = rdLoc(d)
+  resetLoc(p, d, doInitObj = not hasCase)
+  let r = rdLoc(d)
   discard getTypeDesc(p.module, t)
   let ty = getUniqueType(t)
   for it in e.items:
@@ -1082,29 +1029,16 @@ proc genObjConstr(p: BProc, e: CgNode, d: var TLoc) =
     ensureObjectFields(p.module, field, ty)
     tmp2.r.add(".")
     tmp2.r.add(p.fieldName(field))
-    if useTemp:
-      tmp2.k = locTemp
-      tmp2.storage = if isRef: OnHeap else: OnStack
-    else:
-      tmp2.k = d.k
-      tmp2.storage = if isRef: OnHeap else: d.storage
+    tmp2.k = d.k
+    tmp2.storage = d.storage
     tmp2.lode = it[1]
     expr(p, it[1], tmp2)
-  if useTemp:
-    if d.k == locNone:
-      d = tmp
-    else:
-      genAssignment(p, d, tmp)
 
   if hasCase:
     # initialize the object's type fields, if there are any
-
     # XXX: for some discriminators, the value is known at compile-time, so
     #      their switch-case stmt emitted by `specializeInitObject` could be
     #      elided
-    var r = rdLoc(d)
-    if isRef: r = "(*$1)" % [r]
-
     specializeInitObject(p, r, t, e.info)
 
 proc genSeqConstr(p: BProc, n: CgNode, d: var TLoc) =
@@ -1677,7 +1611,6 @@ proc genMagicExpr(p: BProc, e: CgNode, d: var TLoc, op: TMagic) =
   of mFinished: genBreakState(p, e, d)
   of mEnumToStr: genCall(p, e, d)
   of mOf: genOf(p, e, d)
-  of mNew: genNew(p, e, d)
   of mNewSeqOfCap: genNewSeqOfCap(p, e, d)
   of mSizeOf:
     let t = e[1].typ.skipTypes({tyTypeDesc})
diff --git a/compiler/backend/cgirgen.nim b/compiler/backend/cgirgen.nim
index 86c38ade5b2..892e3d7ebe4 100644
--- a/compiler/backend/cgirgen.nim
+++ b/compiler/backend/cgirgen.nim
@@ -1010,7 +1010,7 @@ proc exprToIr(tree: MirBody, cl: var TranslateCl,
   of mnkClosureConstr:
     treeOp cnkClosureConstr:
       res.add argToIr(tree, cl, cr)[1]
-  of mnkObjConstr:
+  of mnkObjConstr, mnkRefConstr:
     let typ = cl.map(n.typ)
     assert typ.skipTypes(abstractVarRange).kind in {tyObject, tyRef}
     treeOp cnkObjConstr:
diff --git a/compiler/backend/compat.nim b/compiler/backend/compat.nim
index 72e299ce21f..23539a05dce 100644
--- a/compiler/backend/compat.nim
+++ b/compiler/backend/compat.nim
@@ -161,7 +161,7 @@ proc translate*(t: MirTree, env: MirEnv): CgNode =
 
     inc i # advance to the first child node
     case n.kind
-    of mnkObjConstr:
+    of mnkObjConstr, mnkRefConstr:
       tree cnkObjConstr:
         let field = lookupInType(typ, t[i].field.int)
         inc i # advance to the arg node
diff --git a/compiler/mir/datatables.nim b/compiler/mir/datatables.nim
index d3e2636a782..af337cd7cd9 100644
--- a/compiler/mir/datatables.nim
+++ b/compiler/mir/datatables.nim
@@ -38,7 +38,7 @@ func hashTree(tree: ConstrTree): Hash =
     of mnkProcVal:
       result = result !& hash(n.prc.ord)
     of mnkSetConstr, mnkRange, mnkArrayConstr, mnkSeqConstr, mnkTupleConstr,
-       mnkClosureConstr, mnkObjConstr:
+       mnkClosureConstr, mnkObjConstr, mnkRefConstr:
       result = result !& hash(n.len)
     of mnkField:
       result = result !& hash(n.field)
@@ -70,7 +70,7 @@ proc cmp(a, b: ConstrTree): bool =
     of mnkProcVal:
       a.prc == b.prc
     of mnkSetConstr, mnkRange, mnkArrayConstr, mnkSeqConstr, mnkTupleConstr,
-       mnkClosureConstr, mnkObjConstr:
+       mnkClosureConstr, mnkObjConstr, mnkRefConstr:
       a.len == b.len
     of mnkField:
       a.field == b.field
diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index 0ad55e6de73..173a08e16da 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -1172,10 +1172,13 @@ proc genClosureConstr(c: var TCtx, n: PNode, isConsume: bool) =
     c.emitOperandTree n[1], isConsume # the environment
 
 proc genObjConstr(c: var TCtx, n: PNode, isConsume: bool) =
-  let isRef = n.typ.skipTypes(abstractInst).kind == tyRef
+  let
+    isRef = n.typ.skipTypes(abstractInst).kind == tyRef
+    kind: range[mnkObjConstr..mnkRefConstr] =
+      if isRef: mnkRefConstr
+      else:     mnkObjConstr
 
-  c.subTree MirNode(kind: mnkObjConstr, typ: c.typeToMir(n.typ),
-                    len: uint32(n.len-1)):
+  c.subTree MirNode(kind: kind, typ: c.typeToMir(n.typ), len: uint32(n.len-1)):
     for i in 1..<n.len:
       let it = n[i]
       let field = lookupFieldAgain(n.typ.skipTypes(abstractInst), it[0].sym)
diff --git a/compiler/mir/mirpasses.nim b/compiler/mir/mirpasses.nim
index 3e4d9a5d62d..ecbca601fb7 100644
--- a/compiler/mir/mirpasses.nim
+++ b/compiler/mir/mirpasses.nim
@@ -57,6 +57,11 @@ const
   LocSkip = abstractRange + tyUserTypeClasses
     ## types to skip to arrive at the underlying concrete value type
 
+template subTree(bu: var MirBuilder, k: MirNodeKind, t: TypeId,
+                 body: untyped) =
+  bu.subTree MirNode(kind: k, typ: t):
+    body
+
 iterator search(tree: MirTree, kinds: static set[MirNodeKind]): NodePosition =
   ## Returns in order of appearance the positions of all nodes matching the
   ## given `kinds`.
@@ -325,7 +330,12 @@ proc eliminateTemporaries(tree: MirTree, types: TypeEnv,
       of LvalueExprKinds:
         # usage in an lvalue expression -> the temporary can be elided
         elide = true
-      of RvalueExprKinds, mnkSetConstr:
+      of RvalueExprKinds:
+        elide = true
+      of mnkSetConstr, mnkRefConstr:
+        # constructions that are either not in-place (ref construction) or
+        # there's no relation between the operands and the result (set
+        # construction)
         elide = true
       of mnkArrayConstr, mnkSeqConstr, mnkTupleConstr, mnkClosureConstr,
          mnkObjConstr:
@@ -447,6 +457,99 @@ proc injectProfilerCalls(tree: MirTree, graph: ModuleGraph, env: var MirEnv,
           bu.buildCall prcId, VoidType:
             discard "no arguments"
 
+proc lowerNew(tree: MirTree, graph: ModuleGraph, env: var MirEnv,
+              changes: var Changeset) =
+  ## Lowers ``mNew`` magic calls and ref construction into runtime procedure
+  ## calls + initialization.
+  let
+    uninitNewProc = graph.getCompilerProc("nimNewObjUninit")
+    initNewProc   = graph.getCompilerProc("nimNewObj")
+
+  proc emitNew(bu: var MirBuilder, env: var MirEnv, typ, base: TypeId,
+               size: Value, prc: PSym): Value {.nimcall.} =
+    ## Emits:
+    ##   def _1 = alignof(arg type(typ))
+    ##   def _2 = nimNewObj|nimNewObjUninit(arg size, arg _1)
+    ##   def _3 = cast _2
+    let align = bu.wrapTemp(env.types.sizeType):
+      bu.buildMagicCall mAlignOf, env.types.sizeType:
+        bu.emitByVal typeLit(base)
+    let raw = bu.wrapTemp(PointerType):
+      bu.buildCall env.procedures.add(prc), PointerType:
+        bu.emitByVal size
+        bu.emitByVal align
+    result = bu.wrapTemp typ:
+      bu.subTree mnkCast, typ:
+        bu.use raw
+
+  for i, n in tree.pairs:
+    if n.kind == mnkRefConstr:
+      let
+        stmt = tree.parent(i)
+        typ  = tree[i].typ
+        base = env.types.add(env[typ].skipTypes(abstractInst).base)
+
+      var tmp: Value
+      changes.insert(tree, stmt, i, bu):
+        let size = bu.wrapTemp(env.types.sizeType):
+          bu.buildMagicCall mSizeOf, env.types.sizeType:
+            bu.emitByVal typeLit(base)
+
+        # the object construction will zero the memory, meaning that it's okay
+        # to use the uninit-new here
+        tmp = emitNew(bu, env, typ, base, size, uninitNewProc)
+
+        # create a normal object construction with the original arguments, and
+        # assign it to the location:
+        bu.subTree mnkInit:
+          bu.subTree mnkDeref, base:
+            bu.use tmp
+          bu.subTree mnkObjConstr, base:
+            for it in subNodes(tree, i):
+              bu.emitFrom(tree, it)
+
+      changes.replaceMulti(tree, i, bu):
+        bu.move tmp
+    elif n.kind == mnkMagic and n.magic == mNew:
+      # lower ``x = new()`` into:
+      #   def _1 = sizeof(arg type(T))
+      #   def _2 = alignof(arg type(T))
+      #   def _3 = nimNewObjUninit(arg _1, arg _2)
+      #   def _4 = cast _3
+      #   _4[] = default()
+      #   x = move _4
+      let
+        call = tree.parent(i)
+        stmt = tree.parent(call)
+        typ  = tree[call].typ
+        base = env.types.add(env[typ].skipTypes(abstractInst).base)
+
+      var tmp: Value
+      changes.insert(tree, stmt, call, bu):
+        if numArgs(tree, call) == 2:
+          # the unsafe new-with-size version
+          let size = bu.inline(tree, NodePosition tree.argument(call, 0))
+          # not the whole memory is necessarily initialized by the default
+          # assignment, so zero the whole region (``nimNewObj``)
+          tmp = emitNew(bu, env, typ, base, size, initNewProc)
+        else:
+          # the standard new version
+          let size = bu.wrapTemp(env.types.sizeType):
+            bu.buildMagicCall mSizeOf, env.types.sizeType:
+              bu.emitByVal typeLit(base)
+          tmp = emitNew(bu, env, typ, base, size, uninitNewProc)
+
+        # ``_4[] = default()``
+        bu.subTree mnkInit:
+          bu.subTree mnkDeref, base:
+            bu.use tmp
+          bu.buildMagicCall mDefault, base:
+            discard
+
+      changes.replaceMulti(tree, call, bu):
+        bu.move tmp
+
+
 proc applyPasses*(body: var MirBody, prc: PSym, env: var MirEnv,
                   graph: ModuleGraph, target: TargetBackend) =
   ## Applies all applicable MIR passes to the body (`tree` and `source`) of
@@ -477,6 +580,9 @@ proc applyPasses*(body: var MirBody, prc: PSym, env: var MirEnv,
       # requires the extraction for cstring literals
       extractStringLiterals(body.code, env, c)
 
+    if target == targetC:
+      lowerNew(body.code, graph, env, c)
+
   # instrument the body with profiler calls after all lowerings, but before
   # optimization
   if (sfPure notin prc.flags) and (optProfiler in prc.options):
diff --git a/compiler/mir/mirtrees.nim b/compiler/mir/mirtrees.nim
index 94901baaf49..18be9c1b946 100644
--- a/compiler/mir/mirtrees.nim
+++ b/compiler/mir/mirtrees.nim
@@ -185,9 +185,8 @@ type
     mnkSeqConstr  ## constructor for seq values
     mnkTupleConstr## constructor for tuple values
     mnkClosureConstr## constructor for closure values
-    mnkObjConstr  ## either allocate a new managed heap cell and returns a
-                  ## ``ref`` to it, or or constructs a new aggregate value
-                  ## with named fields
+    mnkObjConstr  ## constructor for object values
+    mnkRefConstr  ## allocates a new managed heap cell and initializes it
 
     mnkCopy   ## denotes the assignment as copying the source value
     mnkMove   ## denotes the assignment as moving the value. This does
@@ -359,7 +358,8 @@ const
 
   ConstrTreeNodes* = {mnkSetConstr, mnkRange, mnkArrayConstr, mnkSeqConstr,
                       mnkTupleConstr, mnkClosureConstr, mnkObjConstr,
-                      mnkProcVal, mnkArg, mnkField, mnkEnd} + LiteralDataNodes
+                      mnkRefConstr, mnkProcVal, mnkArg, mnkField,
+                      mnkEnd} + LiteralDataNodes
     ## Nodes that can appear in the MIR subset used for constant expressions.
 
   # --- semantics-focused sets:
@@ -385,8 +385,8 @@ const
                       mnkToMutSlice} + UnaryOps + BinaryOps + LiteralDataNodes
   ExprKinds* =       {mnkCall, mnkCheckedCall, mnkSetConstr, mnkArrayConstr,
                       mnkSeqConstr, mnkTupleConstr, mnkClosureConstr,
-                      mnkObjConstr} + LvalueExprKinds + RvalueExprKinds +
-                     ModifierNodes
+                      mnkObjConstr, mnkRefConstr} + LvalueExprKinds +
+                     RvalueExprKinds + ModifierNodes
 
   CallKinds* = {mnkCall, mnkCheckedCall}
 
diff --git a/compiler/mir/mirtypes.nim b/compiler/mir/mirtypes.nim
index acbb11a58c6..7b0f90879bf 100644
--- a/compiler/mir/mirtypes.nim
+++ b/compiler/mir/mirtypes.nim
@@ -13,6 +13,9 @@ import
     ast_types,
     lineinfos
   ],
+  compiler/front/[
+    options
+  ],
   compiler/modules/[
     modulegraphs,
     magicsys
@@ -22,7 +25,8 @@ import
     typemaps
   ],
   compiler/utils/[
-    containers
+    containers,
+    idioms
   ]
 
 type
@@ -35,6 +39,8 @@ type
       # XXX: ^^ the collision needs to be addressed at some point. A proper,
       #      non-sighash-based comparision needs to be used
     types: Store[TypeId, PType]
+    sizeType: TypeId
+      ## the target-dependent integer type to use for size values
 
 const
   VoidType*    = TypeId 0
@@ -57,7 +63,8 @@ const
 proc initTypeEnv*(graph: ModuleGraph): TypeEnv =
   ## Returns a fully initialized type environment instance.
   result = TypeEnv(map: default(TypeTable[TypeId]),
-                   types: default(Store[TypeId, PType]))
+                   types: default(Store[TypeId, PType]),
+                   sizeType: VoidType)
 
   template add(kind: TTypeKind, expect: TypeId) =
     let
@@ -89,6 +96,12 @@ proc initTypeEnv*(graph: ModuleGraph): TypeEnv =
   add(tyInt,   TypeId(ord(PointerType) + 1))
   add(tyFloat, TypeId(ord(PointerType) + 2))
 
+  result.sizeType =
+    case graph.config.target.intSize
+    of 1, 2, 4: Int32Type
+    of 8:       Int64Type
+    else:       unreachable()
+
 proc add*(env: var TypeEnv, t: PType): TypeId =
   ## If not registered yet, adds `t` to `env` and returns the ID to later
   ## look it up with. Basic structural type unification is performed.
@@ -98,3 +111,8 @@ proc add*(env: var TypeEnv, t: PType): TypeId =
 
 func `[]`*(env: TypeEnv, id: TypeId): lent PType {.inline.} =
   env.types[id]
+
+func sizeType*(env: TypeEnv): TypeId {.inline.} =
+  ## Returns the type to use for values representing some size. This is a
+  ## signed integer type of target-dependent bit-width.
+  env.sizeType
diff --git a/compiler/mir/utils.nim b/compiler/mir/utils.nim
index 5d60fae5a9f..b5fe4cb5b9a 100644
--- a/compiler/mir/utils.nim
+++ b/compiler/mir/utils.nim
@@ -413,7 +413,7 @@ proc exprToStr(nodes: MirTree, i: var int, result: var string, c: RenderCtx) =
       valueToStr()
       result.add " .. "
       valueToStr()
-  of mnkObjConstr:
+  of mnkObjConstr, mnkRefConstr:
     let typ = nodes[i].typ
     tree "(":
       commaSeparated:
diff --git a/compiler/sem/mirexec.nim b/compiler/sem/mirexec.nim
index 6d5d6f3bf4c..ad0162a7911 100644
--- a/compiler/sem/mirexec.nim
+++ b/compiler/sem/mirexec.nim
@@ -237,7 +237,7 @@ func emitForExpr(env: var ClosureEnv, tree: MirTree, at, source: NodePosition) =
 
   case tree[source].kind
   of mnkCall, mnkCheckedCall, mnkArrayConstr, mnkSeqConstr, mnkTupleConstr,
-     mnkClosureConstr, mnkObjConstr:
+     mnkClosureConstr, mnkObjConstr, mnkRefConstr:
     emitForArgs(env, tree, at, source)
   of mnkSetConstr:
     for it in subNodes(tree, source):
diff --git a/compiler/vm/packed_env.nim b/compiler/vm/packed_env.nim
index f05c632a4f6..a61045e3ce4 100644
--- a/compiler/vm/packed_env.nim
+++ b/compiler/vm/packed_env.nim
@@ -406,7 +406,7 @@ func storeDataNode(enc: var DataEncoder, e: var PackedEnv,
     enc.storeTupleData(e, t, n)
   of mnkSetConstr:
     enc.storeSetData(e, t, n)
-  of mnkObjConstr:
+  of mnkObjConstr, mnkRefConstr:
     enc.storeFieldsData(e, t, n)
   else:
     unreachable(t[n].kind)
diff --git a/compiler/vm/vmserialize.nim b/compiler/vm/vmserialize.nim
index cd40fd36a5a..7eaab915c4e 100644
--- a/compiler/vm/vmserialize.nim
+++ b/compiler/vm/vmserialize.nim
@@ -125,7 +125,7 @@ proc initFromExpr(dest: LocHandle, tree: MirTree, n: var int, env: MirEnv,
     of mnkTupleConstr, mnkClosureConstr:
       iterTree(j):
         arg recurse(dest.getFieldHandle(j.FieldPosition))
-    of mnkObjConstr:
+    of mnkObjConstr, mnkRefConstr:
       let typ = env[tree[n].typ].skipTypes(abstractPtrs) ## the object's type
       iterTree(i):
         let
diff --git a/doc/mir.rst b/doc/mir.rst
index bd992f41f58..84e8e2736d8 100644
--- a/doc/mir.rst
+++ b/doc/mir.rst
@@ -110,8 +110,8 @@ Semantics
          | SeqConstr CONSTR_ARG...
          | TupleConstr CONSTR_ARG...
          | ClosureConstr CONSTR_ARG...
-         | ObjConstr (<Field> CONSTR_ARG) ... # construct an `object` or
-                                         # `ref object`
+         | ObjConstr (<Field> CONSTR_ARG) ... # construct an `object`
+         | RefConstr (<Field> CONSTR_ARG) ... # construct a `ref object`
          | StdConv  VALUE                # number conversion or conversion
                                          # between cstring and string
          | Conv     VALUE                # same as `StdConv`. Only duplicate
@@ -403,3 +403,4 @@ ones).
           | TupleConstr ARG...
           | ClosureConstr ARG...
           | ObjConstr (<Field> ARG)...
+          | RefConstr (<Field> ARG)...

From 67be9887c9f64ba1004d2761a857ea65320363a2 Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Tue, 23 Apr 2024 00:37:34 +0000
Subject: [PATCH 069/169] build(deps): Bump
 JamesIves/github-pages-deploy-action from 4.5.0 to 4.6.0 (#1282)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bumps

[JamesIves/github-pages-deploy-action](https://github.com/jamesives/github-pages-deploy-action)
from 4.5.0 to 4.6.0.
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a

href="https://github.com/jamesives/github-pages-deploy-action/releases">JamesIves/github-pages-deploy-action's
releases</a>.</em></p>
<blockquote>
<h2>v4.6.0</h2>
<h2>What's Changed</h2>
<ul>
<li>Check for fatal on every line of stderr of the git command by <a
href="https://github.com/ben-z"><code>@​ben-z</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1551">JamesIves/github-pages-deploy-action#1551</a></li>
<li>Migrated to eslint v9</li>
<li>build(deps): bump github/codeql-action from 2 to 3 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1488">JamesIves/github-pages-deploy-action#1488</a></li>
<li>Bump <code>@​babel/traverse</code> from 7.8.3 to 7.23.2 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1460">JamesIves/github-pages-deploy-action#1460</a></li>
<li>build(deps-dev): bump eslint-plugin-jest from 27.2.3 to 27.6.0 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1469">JamesIves/github-pages-deploy-action#1469</a></li>
<li>build(deps-dev): bump <code>@​types/node</code> from 20.10.0 to
20.11.6 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1507">JamesIves/github-pages-deploy-action#1507</a></li>
<li>build(deps-dev): bump eslint-plugin-jest from 27.6.0 to 27.6.3 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1501">JamesIves/github-pages-deploy-action#1501</a></li>
<li>build(deps-dev): bump <code>@​types/node</code> from 20.11.6 to
20.11.13 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1513">JamesIves/github-pages-deploy-action#1513</a></li>
<li>build(deps): bump codecov/codecov-action from 3.1.4 to 3.1.6 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1512">JamesIves/github-pages-deploy-action#1512</a></li>
<li>Bump <code>@​actions/core</code> from 1.10.0 to 1.10.1 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1434">JamesIves/github-pages-deploy-action#1434</a></li>
<li>Bump codecov/codecov-action from 3.1.6 to 4.0.0 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1515">JamesIves/github-pages-deploy-action#1515</a></li>
<li>Bump <code>@​types/node</code> from 20.11.13 to 20.11.16 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1516">JamesIves/github-pages-deploy-action#1516</a></li>
<li>Bump codecov/codecov-action from 4.0.0 to 4.0.1 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1517">JamesIves/github-pages-deploy-action#1517</a></li>
<li>Bump <code>@​types/node</code> from 20.11.16 to 20.11.22 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1534">JamesIves/github-pages-deploy-action#1534</a></li>
<li>Bump <code>@​types/node</code> from 20.11.22 to 20.11.25 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1537">JamesIves/github-pages-deploy-action#1537</a></li>
<li>Bump codecov/codecov-action from 4.0.1 to 4.1.0 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1532">JamesIves/github-pages-deploy-action#1532</a></li>
<li>Bump eslint-plugin-jest from 27.6.3 to 27.9.0 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1526">JamesIves/github-pages-deploy-action#1526</a></li>
<li>Bump webfactory/ssh-agent from 0.8.0 to 0.9.0 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1520">JamesIves/github-pages-deploy-action#1520</a></li>
<li>Bump actions/checkout in README by <a
href="https://github.com/verhovsky"><code>@​verhovsky</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1523">JamesIves/github-pages-deploy-action#1523</a></li>
<li>Bump codecov/codecov-action from 4.1.0 to 4.1.1 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1547">JamesIves/github-pages-deploy-action#1547</a></li>
<li>Bump <code>@​types/node</code> from 20.11.25 to 20.11.30 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1545">JamesIves/github-pages-deploy-action#1545</a></li>
<li>Bump <code>@​types/node</code> from 20.11.30 to 20.12.2 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1550">JamesIves/github-pages-deploy-action#1550</a></li>
<li>Bump <code>@​types/node</code> from 20.12.2 to 20.12.3 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1552">JamesIves/github-pages-deploy-action#1552</a></li>
<li>Bump <code>@​types/node</code> from 20.12.3 to 20.12.6 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1557">JamesIves/github-pages-deploy-action#1557</a></li>
<li>Bump codecov/codecov-action from 4.1.1 to 4.3.0 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1559">JamesIves/github-pages-deploy-action#1559</a></li>
<li>Bump <code>@​types/node</code> from 20.12.6 to 20.12.7 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1558">JamesIves/github-pages-deploy-action#1558</a></li>
<li>Bump <code>@​actions/github</code> from 5.1.1 to 6.0.0 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1455">JamesIves/github-pages-deploy-action#1455</a></li>
<li>build(deps): bump actions/upload-artifact from 3 to 4 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1490">JamesIves/github-pages-deploy-action#1490</a></li>
<li>build(deps): bump actions/download-artifact from 3 to 4 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1489">JamesIves/github-pages-deploy-action#1489</a></li>
</ul>
<h2>New Contributors</h2>
<ul>
<li><a href="https://github.com/verhovsky"><code>@​verhovsky</code></a>
made their first contribution in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1523">JamesIves/github-pages-deploy-action#1523</a></li>
<li><a href="https://github.com/ben-z"><code>@​ben-z</code></a> made
their first contribution in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1551">JamesIves/github-pages-deploy-action#1551</a></li>
</ul>
<p><strong>Full Changelog</strong>: <a

href="https://github.com/JamesIves/github-pages-deploy-action/compare/v4.5.0...v4.6.0">https://github.com/JamesIves/github-pages-deploy-action/compare/v4.5.0...v4.6.0</a></p>
</blockquote>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a

href="https://github.com/JamesIves/github-pages-deploy-action/commit/ec9c88baef04b842ca6f0a132fd61c762aa6c1b0"><code>ec9c88b</code></a>
Merge branch 'releases/v4' of <a

href="https://github.com/JamesIves/github-pages-deplo">https://github.com/JamesIves/github-pages-deplo</a>...</li>
<li><a

href="https://github.com/JamesIves/github-pages-deploy-action/commit/e58e46c5c618013742423183f7149662d4fcc209"><code>e58e46c</code></a>
Delete .eslintrc.json</li>
<li><a

href="https://github.com/JamesIves/github-pages-deploy-action/commit/19d08120f6103caf2b5eb996daebf903fc8166fd"><code>19d0812</code></a>
Deploy Production Code for Commit
1008d185fbd2e25a24f2da400f5ad62db137c39d 🚀</li>
<li><a

href="https://github.com/JamesIves/github-pages-deploy-action/commit/1008d185fbd2e25a24f2da400f5ad62db137c39d"><code>1008d18</code></a>
Merge branch 'dev' into releases/v4</li>
<li><a

href="https://github.com/JamesIves/github-pages-deploy-action/commit/d60bb0b490844000f6a10edae89c221b7c6ecbd6"><code>d60bb0b</code></a>
Update sponsors.yml</li>
<li><a

href="https://github.com/JamesIves/github-pages-deploy-action/commit/69873ad9157bf0b4fb59bf0a3e1875e3e3526b78"><code>69873ad</code></a>
Update eslint.config.mjs</li>
<li><a

href="https://github.com/JamesIves/github-pages-deploy-action/commit/d37392594b7fb43ab272315dbbd59189e340607e"><code>d373925</code></a>
Update worktree.test.ts</li>
<li><a

href="https://github.com/JamesIves/github-pages-deploy-action/commit/9c1917a5628868a2ba383a50b85fc6fc9b685dbb"><code>9c1917a</code></a>
fix: migrate to ESLint 9</li>
<li><a

href="https://github.com/JamesIves/github-pages-deploy-action/commit/ea27152698ebe125eabc56f00fd66ac1d441a4ea"><code>ea27152</code></a>
Merge branch 'dev' of <a

href="https://github.com/JamesIves/github-pages-deploy-action">https://github.com/JamesIves/github-pages-deploy-action</a>...</li>
<li><a

href="https://github.com/JamesIves/github-pages-deploy-action/commit/6727ffe63cf10549e07f2c3551dbb350cc789141"><code>6727ffe</code></a>
chore: resolve formatting changes from newer prettier version</li>
<li>Additional commits viewable in <a

href="https://github.com/jamesives/github-pages-deploy-action/compare/v4.5.0...v4.6.0">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility

score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=JamesIves/github-pages-deploy-action&package-manager=github_actions&previous-version=4.5.0&new-version=4.6.0)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase` .

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 .github/workflows/publisher.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/publisher.yml b/.github/workflows/publisher.yml
index 6e60bbb202a..fb8c0790fb9 100644
--- a/.github/workflows/publisher.yml
+++ b/.github/workflows/publisher.yml
@@ -71,7 +71,7 @@ jobs:
           path: release-staging
 
       - name: Publish docs
-        uses: JamesIves/github-pages-deploy-action@v4.5.0
+        uses: JamesIves/github-pages-deploy-action@v4.6.0
         with:
           branch: gh-pages
           folder: doc/html

From fa85029c0cecd689807e66e3c746881c1e200381 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Tue, 23 Apr 2024 04:48:13 +0200
Subject: [PATCH 070/169] sem: proper error propagation for set construction
 (#1283)

## Summary

Refactor/fix set construction analysis such that:
* `nkRange` nodes are properly analyzed after macro expansion
* errors within set constructions are propagated properly

## Details

Only `semSetConstr` is modified:
* use `shallowCopy` instead of creating a new node (no sequence
  resizing, keeps the persistent node flags)
* always re-analyze `nkRange` nodes (they were previously never typed)
* guard against ill-formed `nkRange` AST (could previously crash the
  compiler)
* don't modify the input AST
* replace `localReport` with using `nkError`
* propagate `nkError`
---
 compiler/sem/semexprs.nim                  | 80 +++++++++++++---------
 tests/lang_exprs/tset_construction_ast.nim | 14 ++++
 2 files changed, 63 insertions(+), 31 deletions(-)
 create mode 100644 tests/lang_exprs/tset_construction_ast.nim

diff --git a/compiler/sem/semexprs.nim b/compiler/sem/semexprs.nim
index 0c51fe54b89..5c74f0625ad 100644
--- a/compiler/sem/semexprs.nim
+++ b/compiler/sem/semexprs.nim
@@ -2980,55 +2980,73 @@ proc semWhen(c: PContext, n: PNode, semCheck = true): PNode =
     result.typ = typ
 
 proc semSetConstr(c: PContext, n: PNode): PNode =
-  result = newNodeI(nkCurly, n.info)
+  ## Analyses and types a set construction expression (``nkCurly``). Produces
+  ## a typed expression, or an error.
+  result = shallowCopy(n)
   result.typ = newTypeS(tySet, c)
   result.typ.flags.incl tfIsConstructor
   if n.len == 0:
     rawAddSon(result.typ, newTypeS(tyEmpty, c))
   else:
+    var
+      typ: PType = nil
+      diag: PAstDiag ## the error diagnostic, if an error occurred
+
     # only semantic checking for all elements, later type checking:
-    var typ: PType = nil
-    for i in 0..<n.len:
-      if isRange(n[i]):
-        checkSonsLen(n[i], 3, c.config)
-        n[i][1] = semExprWithType(c, n[i][1])
-        n[i][2] = semExprWithType(c, n[i][2])
-        if typ == nil:
-          typ = skipTypes(n[i][1].typ,
-                          {tyGenericInst, tyVar, tyLent, tyOrdinal, tyAlias, tySink})
-        n[i].typ = n[i][2].typ # range node needs type too
+    for i, it in n.pairs:
+      var elem: PType
+      if isRange(it):
+        checkSonsLen(it, 3, c.config)
+        result[i] =
+          newTreeI(nkRange, it.info,
+                   semExprWithType(c, it[1]),
+                   semExprWithType(c, it[2]))
+        elem = result[i][0].typ
       elif n[i].kind == nkRange:
-        # already semchecked
-        if typ == nil:
-          typ = skipTypes(n[i][0].typ,
-                          {tyGenericInst, tyVar, tyLent, tyOrdinal, tyAlias, tySink})
+        checkSonsLen(n[i], 2, c.config)
+        result[i] =
+          newTreeI(nkRange, it.info,
+                   semExprWithType(c, it[0]),
+                   semExprWithType(c, it[1]))
+        elem = result[i][0].typ
       else:
-        n[i] = semExprWithType(c, n[i])
-        if typ == nil:
-          typ = skipTypes(n[i].typ, {tyGenericInst, tyVar, tyLent, tyOrdinal, tyAlias, tySink})
+        result[i] = semExprWithType(c, n[i])
+        elem = result[i].typ
+
+      if typ.isNil:
+        typ = skipTypes(elem, {tyGenericInst, tyOrdinal, tyAlias, tySink})
+
     if not isOrdinalType(typ, allowEnumWithHoles=true):
-      localReport(c.config, n, reportSem rsemExpectedOrdinal)
+      if typ.kind != tyError:
+        diag = PAstDiag(kind: adSemExpectedOrdinal, nonOrdTyp: typ)
       typ = makeRangeType(c, 0, MaxSetElements - 1, n.info)
 
     elif lengthOrd(c.config, typ) > MaxSetElements:
       typ = makeRangeType(c, 0, MaxSetElements - 1, n.info)
 
     addSonSkipIntLit(result.typ, typ, c.idgen)
-    for i in 0..<n.len:
-      var m: PNode
-      let info = n[i].info
-      if isRange(n[i]):
-        m = newNodeI(nkRange, info)
-        m.add fitNode(c, typ, n[i][1], info)
-        m.add fitNode(c, typ, n[i][2], info)
-
-      elif n[i].kind == nkRange:
-        m = n[i] # already semchecked
 
+    var hasError = false
+    template handleError(n: PNode): PNode =
+      let x = n
+      hasError = hasError or x.kind == nkError
+      x
+
+    # second pass: type checking and error detection
+    for i in 0..<result.len:
+      let info = result[i].info
+      case result[i].kind
+      of nkRange:
+        result[i][0] = handleError fitNode(c, typ, result[i][0], info)
+        result[i][1] = handleError fitNode(c, typ, result[i][1], info)
       else:
-        m = fitNode(c, typ, n[i], info)
+        result[i] = handleError fitNode(c, typ, result[i], info)
 
-      result.add m
+    # wrap with the appropriate error (or none)
+    if diag != nil:
+      result = c.config.newError(result, diag)
+    elif hasError:
+      result = c.config.wrapError(result)
 
 proc semTableConstr(c: PContext, n: PNode): PNode =
   # we simply transform ``{key: value, key2, key3: value}`` to
diff --git a/tests/lang_exprs/tset_construction_ast.nim b/tests/lang_exprs/tset_construction_ast.nim
new file mode 100644
index 00000000000..4e4833840bc
--- /dev/null
+++ b/tests/lang_exprs/tset_construction_ast.nim
@@ -0,0 +1,14 @@
+discard """
+  description: '''
+    Ensure that valid `nkRange` AST in a set construction emitted by a macro
+    is correctly semantically analysed
+  '''
+  targets: native
+"""
+
+import std/macros
+
+macro m(): untyped =
+  result = nnkCurly.newTree(nnkRange.newTree(newLit(1'u8), newLit(3'u8)))
+
+doAssert m() == {1'u8, 2'u8, 3'u8}

From 12ed7517d1120f1a15d33b896803b8421bd33c65 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Wed, 24 Apr 2024 21:27:32 +0200
Subject: [PATCH 071/169] cgen: don't emit excessive string constants (#1285)

## Summary

For the C backend, don't emit excessive, duplicate string constants
for field checks when compiling with `--declaredlocs:off` (the
default).

## Details

The code generator handling for field checks unconditionally emitted
raw strings, resulting in a separate string constant being emitted for
each field check appearing in the code. This is unnecessary when the
error message string value stays as is, bloating the produced C code.

If the error message string does not need to be modified (i.e., when
`--declaredlocs` is disabled), the cache-using overload of
`genStringLiteral` is now used.
---
 compiler/backend/ccgexprs.nim | 13 +++++++------
 1 file changed, 7 insertions(+), 6 deletions(-)

diff --git a/compiler/backend/ccgexprs.nim b/compiler/backend/ccgexprs.nim
index 0a994368b22..aa495980c9b 100644
--- a/compiler/backend/ccgexprs.nim
+++ b/compiler/backend/ccgexprs.nim
@@ -578,18 +578,19 @@ proc genFieldCheck(p: BProc, e: CgNode) =
     initLocExpr(p, e[1], u)
     initLocExpr(p, e[2], v)
     genInExprAux(p, e, u, v, test)
-    var msg = ""
+    var strLit: Rope
     if optDeclaredLocs in p.config.globalOptions:
       # xxx this should be controlled by a separate flag, and
       # used for other similar defects so that location information is shown
       # even without the expensive `--stacktrace`; binary size could be optimized
       # by encoding the file names separately from `file(line:col)`, essentially
       # passing around `TLineInfo` + the set of files in the project.
-      msg.add toFileLineCol(p.config, e.info) & " "
-    msg.add getString(p, e[4])
-    # don't commit the string to the string table, as it's likely to be
-    # unique and never used again
-    let strLit = genStringLiteral(p.module, msg)
+      let msg = toFileLineCol(p.config, e.info) & " " & getString(p, e[4])
+      # don't commit the string to the string table, as it's likely to be
+      # unique and never used again
+      strLit = genStringLiteral(p.module, msg)
+    else:
+      strLit = genStringLiteral(p.module, e[4])
 
     ## discriminant check
     template fun(code) = linefmt(p, cpsStmts, code, [rdLoc(test)])

From 421ab5a9669c4d95fc13876c53fd20d6b1c94d86 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Wed, 24 Apr 2024 21:33:09 +0200
Subject: [PATCH 072/169] sem: clean up `case` analysis and fix edge cases
 (#1284)

## Summary

Clean up, improve, and fix `case` analysis. Errors are properly
propagated, input AST is no longer modified, and multiple bugs are
fixed:
* `nkRange` nodes in `nkOfBranch` AST in macro output are properly
  analyzed
* converters are correctly taken into account for branch labels
  (previously resulted in a compiler crash)
* empty set, array, and seq values in otherwise non-empty `of` branches
  no longer result in spurious "not all cases are covered" errors

## Details

Both the `case` statements and `case`-object declarations are affected.
For the range syntax analysis (`semBranchRange`):
* evaluating the expression happens *after* fitting, so that converter
  calls are accounted for (they previously stayed, crashing the
  compiler later on)
* the `localReport`s are replaced with diagnostics; two new diagnostics
  corresponding to the previously used reports are added
* errors are wrapped properly
* "cannot be string range" errors now take precedence over
  "empty range" errors
* the operand type is passed directly as a parameter, instead of
  indirectly via the case statement AST

For the `of` branch analysis (`semCaseBranch`):
* `semConstExpr` (which uses `localReport`) is replaced with
  `semExprWithType` + `evalConstExpr`
* the input AST is no longer modified
* empty set, array, and seq values no longer erroneously count
  towards the number of values that need to be covered
* `nkRange` nodes are always (re-)analyzed
* only the selector's type is passed as the parameter, checking for
  duplicates moves to the callsite

The `case` statement analysis (`semCase`) is changed to not modify
input AST. For wrapping the `nkCaseStmt` in an error, the AST is
scanned for errors afterwards.
---
 compiler/ast/ast_types.nim                    |   4 +
 compiler/front/cli_reporter.nim               |   2 +
 compiler/front/msgs.nim                       |   2 +
 compiler/sem/sem.nim                          |   1 -
 compiler/sem/semstmts.nim                     |  76 ++++----
 compiler/sem/semtypes.nim                     | 167 ++++++++++--------
 .../casestmt/tbranch_with_empty_set.nim       |  22 +++
 .../casestmt/tlabel_considers_converter.nim   |  30 ++++
 8 files changed, 199 insertions(+), 105 deletions(-)
 create mode 100644 tests/lang_stmts/casestmt/tbranch_with_empty_set.nim
 create mode 100644 tests/lang_stmts/casestmt/tlabel_considers_converter.nim

diff --git a/compiler/ast/ast_types.nim b/compiler/ast/ast_types.nim
index 429afb3a4ba..d271d0fba8f 100644
--- a/compiler/ast/ast_types.nim
+++ b/compiler/ast/ast_types.nim
@@ -1159,6 +1159,8 @@ type
     adSemDefNameSym   ## when creating a sym node from `nkIdentKinds`
     # semtypes
     adSemTypeExpected
+    adSemStringRangeNotAllowed
+    adSemRangeIsEmpty
     # semtempl
     adSemIllformedAst
     adSemIllformedAstExpectedPragmaOrIdent
@@ -1336,6 +1338,8 @@ type
         adSemCallInCompilesContextNotAProcOrField,
         adSemExpressionHasNoType,
         adSemTypeExpected,
+        adSemStringRangeNotAllowed,
+        adSemRangeIsEmpty,
         adSemIllformedAst,
         adSemIllformedAstExpectedPragmaOrIdent,
         adSemInvalidExpression,
diff --git a/compiler/front/cli_reporter.nim b/compiler/front/cli_reporter.nim
index 647658542f9..43d110df1a4 100644
--- a/compiler/front/cli_reporter.nim
+++ b/compiler/front/cli_reporter.nim
@@ -3225,6 +3225,8 @@ func astDiagToLegacyReport(conf: ConfigRef, diag: PAstDiag): Report {.inline.} =
       adSemCallInCompilesContextNotAProcOrField,
       adSemExpressionHasNoType,
       adSemTypeExpected,
+      adSemStringRangeNotAllowed,
+      adSemRangeIsEmpty,
       adSemIllformedAst,
       adSemInvalidExpression,
       adSemExpectedNonemptyPattern,
diff --git a/compiler/front/msgs.nim b/compiler/front/msgs.nim
index 735abc46a94..01a3540303a 100644
--- a/compiler/front/msgs.nim
+++ b/compiler/front/msgs.nim
@@ -501,6 +501,8 @@ func astDiagToLegacyReportKind*(
   of adSemCalleeHasAnError: rsemCalleeHasAnError
   of adSemExpressionHasNoType: rsemExpressionHasNoType
   of adSemTypeExpected: rsemTypeExpected
+  of adSemStringRangeNotAllowed: rsemStringRangeNotAllowed
+  of adSemRangeIsEmpty: rsemRangeIsEmpty
   of adSemIllformedAst: rsemIllformedAst
   of adSemIllformedAstExpectedPragmaOrIdent: rsemIllformedAst
   of adSemIllformedAstExpectedOneOf: rsemIllformedAst
diff --git a/compiler/sem/sem.nim b/compiler/sem/sem.nim
index 84ba9bfc3bd..381526fdea4 100644
--- a/compiler/sem/sem.nim
+++ b/compiler/sem/sem.nim
@@ -616,7 +616,6 @@ proc evalConstExpr(c: PContext, n: PNode): PNode =
   ## Tries to turn the expression `n` into AST that represents a concrete
   ## value. If this fails, an `nkError` node is returned
   addInNimDebugUtils(c.config, "evalConstExpr", n, result)
-  assert not n.isError
 
   # this happens when the overloadableEnums is enabled. We short-circuit
   # evaluation in this case, as neither ``vmgen`` nor ``semfold`` know what to
diff --git a/compiler/sem/semstmts.nim b/compiler/sem/semstmts.nim
index f027b528573..ae74be1efa4 100644
--- a/compiler/sem/semstmts.nim
+++ b/compiler/sem/semstmts.nim
@@ -1641,16 +1641,16 @@ proc semFor(c: PContext, n: PNode; flags: TExprFlags): PNode =
   closeScope(c)
 
 proc semCase(c: PContext, n: PNode; flags: TExprFlags): PNode =
-  result = n
   checkMinSonsLen(n, 2, c.config)
+  result = copyNodeWithKids(n)
   openScope(c)
-  pushCaseContext(c, n)
-  n[0] = semExprWithType(c, n[0])
+  result[0] = semExprWithType(c, n[0]) # selector operand
+  let selector = result[0].typ
   var chckCovered = false
   var covered: Int128 = toInt128(0)
   var typ = commonTypeBegin
   var hasElse = false
-  let caseTyp = skipTypes(n[0].typ, abstractVar-{tyTypeDesc})
+  let caseTyp = skipTypes(selector, abstractInst-{tyTypeDesc})
   const shouldChckCovered = {tyInt..tyInt64, tyChar, tyEnum, tyUInt..tyUInt64, tyBool}
   case caseTyp.kind
   of shouldChckCovered:
@@ -1659,76 +1659,90 @@ proc semCase(c: PContext, n: PNode; flags: TExprFlags): PNode =
     if skipTypes(caseTyp[0], abstractInst).kind in shouldChckCovered:
       chckCovered = true
   of tyFloat..tyFloat64, tyString:
-    # xxx: possible case statement macro bug, as it'll be skipped here
-    discard
+    discard "not all possible values have to be covered"
   else:
-    popCaseContext(c)
     closeScope(c)
-    result[0] = c.config.newError(n[0],
+    result[0] = c.config.newError(result[0],
                           PAstDiag(kind: adSemSelectorMustBeOfCertainTypes))
+    result = c.config.wrapError(result)
     return
+
+  pushCaseContext(c, result) # push the in-progress case context
   for i in 1..<n.len:
     setCaseContextIdx(c, i)
-    var x = n[i]
+    let x = n[i]
     when defined(nimsuggest):
       if c.config.ideCmd == ideSug and c.config.m.trackPos == x.info and caseTyp.kind == tyEnum:
         suggestEnum(c, x, caseTyp)
     case x.kind
     of nkOfBranch:
-      checkMinSonsLen(x, 2, c.config)
-      semCaseBranch(c, n, x, i, covered)
-      var last = x.len-1
-      x[last] = semExprBranchScope(c, x[last])
-      typ = commonType(c, typ, x[last])
+      let branch = semCaseBranch(c, selector, x, covered)
+      result[i] = branch
+      checkBranchForOverlap(c, result, i, result[i].len - 1)
+      # the branch node might be inspected from within the body, so make sure
+      # it is syntactically valid prior to the analysis
+      branch.add c.graph.emptyNode
+      branch[^1] = semExprBranchScope(c, x[^1])
     of nkElifBranch:
       chckCovered = false
       checkSonsLen(x, 2, c.config)
       openScope(c)
-      x[0] = forceBool(c, semExprWithType(c, x[0]))
-      x[1] = semExprBranch(c, x[1])
-      typ = commonType(c, typ, x[1])
+      let branch = shallowCopy(x)
+      branch[0] = forceBool(c, semExprWithType(c, x[0]))
+      branch[1] = semExprBranch(c, x[1])
       closeScope(c)
+      result[i] = branch
     of nkElse:
       checkSonsLen(x, 1, c.config)
-      x[0] = semExprBranchScope(c, x[0])
-      typ = commonType(c, typ, x[0])
-      if (chckCovered and covered == toCover(c, n[0].typ)) or hasElse:
+      let branch = shallowCopy(x)
+      branch[0] = semExprBranchScope(c, x[0])
+      result[i] = branch
+      if (chckCovered and covered == toCover(c, selector)) or hasElse:
         localReport(c.config, x.info, SemReport(kind: rsemUnreachableElse))
       hasElse = true
       chckCovered = false
     else:
       semReportIllformedAst(c.config, x, {nkElse, nkElifBranch, nkOfBranch})
 
+    # update the expression type:
+    typ = commonType(c, typ, result[i][^1])
+
   if chckCovered:
-    if covered == toCover(c, n[0].typ):
+    if covered == toCover(c, selector):
       hasElse = true
-    elif n[0].typ.skipTypes(abstractRange).kind in {tyEnum, tyChar}:
-      localReport(c.config, n, SemReport(
+    elif selector.skipTypes(abstractRange).kind in {tyEnum, tyChar}:
+      localReport(c.config, result, SemReport(
         kind: rsemMissingCaseBranches,
-        nodes: formatMissingBranches(c, n)))
+        nodes: formatMissingBranches(c, result)))
 
     else:
-      localReport(c.config, n, reportSem rsemMissingCaseBranches)
+      localReport(c.config, result, reportSem rsemMissingCaseBranches)
 
   popCaseContext(c)
   closeScope(c)
   if isEmptyType(typ) or typ.kind in {tyNil, tyUntyped} or
       (not hasElse and efInTypeof notin flags):
-    for i in 1..<n.len:
-      n[i][^1] = discardCheck(c, n[i][^1], flags)
-      if n[i][^1].isError:
-        return wrapError(c.config, n)
+    for _, it in branches(result):
+      it[^1] = discardCheck(c, it[^1], flags)
+
     # propagate any enforced VoidContext:
     if typ == c.enforceVoidContext:
       result.typ = c.enforceVoidContext
   else:
-    for i in 1..<n.len:
-      var it = n[i]
+    for i, it in branches(result):
       let j = it.len-1
       if not endsInNoReturn(it[j]):
         it[j] = fitNode(c, typ, it[j], it[j].info)
+
     result.typ = typ
 
+  # wrap in an error, if necessary:
+  for _, b in branches(result):
+    # check a single layer, everything else had error propagated already
+    for it in b.items:
+      if it.kind == nkError:
+        return c.config.wrapError(result)
+
 proc semRaise(c: PContext, n: PNode): PNode =
   checkSonsLen(n, 1, c.config)
   result = shallowCopy(n)
diff --git a/compiler/sem/semtypes.nim b/compiler/sem/semtypes.nim
index 091d9c54fbd..ac82a2dc5b5 100644
--- a/compiler/sem/semtypes.nim
+++ b/compiler/sem/semtypes.nim
@@ -737,7 +737,9 @@ proc semIdentWithPragma(c: PContext, kind: TSymKind, n: PNode,
     result = semIdentVis(c, kind, n, allowed)
 
 proc checkForOverlap(c: PContext, t: PNode, currentEx, branchIndex: int) =
-  let ex = t[branchIndex][currentEx].skipConv
+  ## Given the in-progress ``nkCaseStmt`` production `t`, reports an error for
+  ## each value in branch `branchIndex` that already appears elsewhere.
+  let ex = t[branchIndex][currentEx]
   for i in 1..branchIndex:
     for j in 0..<t[i].len - 1:
       if i == branchIndex and j == currentEx: break
@@ -747,80 +749,96 @@ proc checkForOverlap(c: PContext, t: PNode, currentEx, branchIndex: int) =
           ast: ex,
           overlappingGroup: t[i][j].skipConv))
 
-proc semBranchRange(c: PContext, t, a, b: PNode, covered: var Int128): PNode =
-  checkMinSonsLen(t, 1, c.config)
-  let ac = semConstExpr(c, a)
-  let bc = semConstExpr(c, b)
-  let at = fitNode(c, t[0].typ, ac, ac.info).skipConvTakeType
-  let bt = fitNode(c, t[0].typ, bc, bc.info).skipConvTakeType
+proc checkBranchForOverlap(c: PContext, caseStmt: PNode, branch, last: int) =
+  for i in 0..last:
+    checkForOverlap(c, caseStmt, i, branch)
+
+proc semBranchRange(c: PContext, typ: PType, a, b: PNode,
+                    covered: var Int128): PNode =
+  ## Analyses an ``nkRange`` AST and produces a typed version thereof, or an
+  ## error. `typ` is the expected element type.
+  let
+    a = evalConstExpr(c, fitNode(c, typ, semExprWithType(c, a, {}), a.info))
+    b = evalConstExpr(c, fitNode(c, typ, semExprWithType(c, b, {}), b.info))
 
   result = newNodeI(nkRange, a.info)
-  result.add(at)
-  result.add(bt)
-  if emptyRange(ac, bc):
-    localReport(c.config, b, reportSem rsemRangeIsEmpty)
-  elif t[0].typ.skipTypes(abstractInst).kind == tyString:
-    # XXX: ``nkError`` needs to be used here
-    localReport(c.config, b, reportSem rsemStringRangeNotAllowed)
-  else: covered = covered + getOrdValue(bc) + 1 - getOrdValue(ac)
-
-proc semCaseBranchRange(c: PContext, t, b: PNode,
+  result.add(a)
+  result.add(b)
+  if a.kind == nkError or b.kind == nkError:
+    result = c.config.wrapError(result)
+  elif typ.skipTypes(abstractInst).kind == tyString:
+    result = c.config.newError(result):
+      PAstDiag(kind: adSemStringRangeNotAllowed)
+  elif emptyRange(a, b):
+    result = c.config.newError(result):
+      PAstDiag(kind: adSemRangeIsEmpty)
+  else:
+    # all good; no error
+    covered = covered + getOrdValue(b) + 1 - getOrdValue(a)
+
+proc semCaseBranchRange(c: PContext, typ: PType, b: PNode,
                         covered: var Int128): PNode =
   checkSonsLen(b, 3, c.config)
-  result = semBranchRange(c, t, b[1], b[2], covered)
-
-proc semCaseBranchSetElem(c: PContext, t, b: PNode,
-                          covered: var Int128): PNode =
-  if isRange(b):
-    checkSonsLen(b, 3, c.config)
-    result = semBranchRange(c, t, b[1], b[2], covered)
-  elif b.kind == nkRange:
-    checkSonsLen(b, 2, c.config)
-    result = semBranchRange(c, t, b[0], b[1], covered)
-  else:
-    result = fitNode(c, t[0].typ, b, b.info)
-    inc(covered)
-
-proc semCaseBranch(c: PContext, t, branch: PNode, branchIndex: int,
-                   covered: var Int128) =
-  let lastIndex = branch.len - 2
-  for i in 0..lastIndex:
-    var b = branch[i]
+  result = semBranchRange(c, typ, b[1], b[2], covered)
+
+proc semCaseBranch(c: PContext, typ: PType, branch: PNode,
+                   covered: var Int128): PNode =
+  ## Analyses the ``nkOfBranch`` AST `branch`, producing either an error or
+  ## the typed AST. Note that the production does *not* include the action
+  ## slot.
+  ##
+  ## Productions with no items are valid: they result from, e.g., ``of {}:``.
+  proc fitAndAdd(to: PNode, c: PContext, typ: PType, n: PNode,
+                 covered: var Int128) {.nimcall.} =
+    if n.kind == nkError:
+      to.add n
+      return
+
+    # errors are ignored here; they're handled later
+    for it in n.items:
+      case it.kind
+      of nkRange:
+        to.add semBranchRange(c, typ, it[0], it[1], covered)
+      else:
+        var x = fitNode(c, typ, it, it.info)
+        # fitting the element may introduce a conversion
+        if x.kind in {nkHiddenCallConv, nkHiddenStdConv, nkHiddenSubConv}:
+          x = evalConstExpr(c, x)
+        to.add x
+        inc covered
+
+  checkMinSonsLen(branch, 2, c.config)
+  # not a one-to-one mapping between the input and output AST
+  result = copyNode(branch)
+
+  for _, b in branchLabels(branch):
     if b.kind == nkRange:
-      branch[i] = b
+      result.add semBranchRange(c, typ, b[0], b[1], covered)
     elif isRange(b):
-      branch[i] = semCaseBranchRange(c, t, b, covered)
+      result.add semCaseBranchRange(c, typ, b, covered)
     else:
-      # constant sets and arrays are allowed:
-      var r = semConstExpr(c, b)
-      if r.kind in {nkCurly, nkBracket} and r.len == 0 and branch.len == 2:
-        # discarding ``{}`` and ``[]`` branches silently
-        delSon(branch, 0)
-        return
-      elif r.kind notin {nkCurly, nkBracket} or r.len == 0:
-        checkMinSonsLen(t, 1, c.config)
-        var tmp = fitNode(c, t[0].typ, r, r.info)
-        # the call to fitNode may introduce a call to a converter
-        if tmp.kind in {nkHiddenCallConv}: tmp = semConstExpr(c, tmp)
-        branch[i] = skipConv(tmp)
-        inc(covered)
+      var r = semExprWithType(c, b, {})
+      # XXX: distincts are currently skipped, but it would make sense to
+      #      not, thus preventing, e.g., a distinct set from being usable
+      #      in a label slot without explicit conversion
+      case r.typ.skipTypes(abstractRange).kind
+      of tySet:
+        # constant sets are allowed
+        r = evalConstExpr(c, r)
+        if r.kind == nkError:
+          result.add r
+        elif r.len > 0:
+          # duplicates from the evaluated set need to be eliminated
+          result.fitAndAdd(c, typ, deduplicate(c.config, r), covered)
+        else:
+          discard "do nothing for empty sets"
+      of tyArray, tySequence:
+        # constant arrays and sequences are allowed too
+        r = evalConstExpr(c, r)
+        result.fitAndAdd(c, typ, r, covered)
       else:
-        if r.kind == nkCurly:
-          r = deduplicate(c.config, r)
-
-        # first element is special and will overwrite: branch[i]:
-        branch[i] = semCaseBranchSetElem(c, t, r[0], covered)
-
-        # other elements have to be added to ``branch``
-        for j in 1..<r.len:
-          branch.add(semCaseBranchSetElem(c, t, r[j], covered))
-          # caution! last son of branch must be the actions to execute:
-          swap(branch[^2], branch[^1])
-    checkForOverlap(c, t, i, branchIndex)
-
-  # Elements added above needs to be checked for overlaps.
-  for i in lastIndex.succ..<branch.len - 1:
-    checkForOverlap(c, t, i, branchIndex)
+        result.add evalConstExpr(c, fitNode(c, typ, r, r.info))
+        inc covered
 
 proc toCover(c: PContext, t: PType): Int128 =
   let t2 = skipTypes(t, abstractVarRange-{tyTypeDesc})
@@ -936,25 +954,28 @@ proc semRecordCase(c: PContext, n: PNode, check: var IntSet, pos: var int,
       sym: a[0].sym))
 
   for i in 1..<n.len:
-    var b = copyTree(n[i])
-    a.add b
+    let b = n[i]
     case n[i].kind
     of nkOfBranch:
-      checkMinSonsLen(b, 2, c.config)
-      semCaseBranch(c, a, b, i, covered)
+      a.add semCaseBranch(c, a[0].typ, b, covered)
+      checkBranchForOverlap(c, a, i, a[^1].len - 1)
+      # XXX: errors need to be propagated
+      for e in walkErrors(c.config, a[^1]):
+        localReport(c.config, e)
     of nkElse:
       checkSonsLen(b, 1, c.config)
       if chckCovered and covered == toCover(c, a[0].typ):
         localReport(c.config, b.info, SemReport(kind: rsemUnreachableElse))
       chckCovered = false
+      # copy without the action slot:
+      a.add copyNode(b)
     else:
       semReportIllformedAst(
         c.config, n,
         "Expected ofBranch or else for object case statement, but found" &
           $n[i].kind)
 
-    delSon(b, b.len - 1)
-    semRecordNodeAux(c, lastSon(n[i]), check, pos, b, rectype, hasCaseFields = true)
+    semRecordNodeAux(c, lastSon(n[i]), check, pos, a[^1], rectype, hasCaseFields = true)
   if chckCovered and covered != toCover(c, a[0].typ):
     if a[0].typ.skipTypes(abstractRange).kind == tyEnum:
       localReport(c.config, a.info, SemReport(
diff --git a/tests/lang_stmts/casestmt/tbranch_with_empty_set.nim b/tests/lang_stmts/casestmt/tbranch_with_empty_set.nim
new file mode 100644
index 00000000000..1c22cbd2e80
--- /dev/null
+++ b/tests/lang_stmts/casestmt/tbranch_with_empty_set.nim
@@ -0,0 +1,22 @@
+discard """
+  description: '''
+    Regression test for where an empty set/array value in a label position
+    counted towards the number of required labels, leading to errors being
+    reported for valid case statements.
+  '''
+  action: compile
+"""
+
+var x: bool
+
+case x
+of true, []: # would cause "not all cases are covered"
+  discard
+of false:
+  discard
+
+case x
+of true, {}: # would cause "not all cases are covered"
+  discard
+of false:
+  discard
diff --git a/tests/lang_stmts/casestmt/tlabel_considers_converter.nim b/tests/lang_stmts/casestmt/tlabel_considers_converter.nim
new file mode 100644
index 00000000000..01323230035
--- /dev/null
+++ b/tests/lang_stmts/casestmt/tlabel_considers_converter.nim
@@ -0,0 +1,30 @@
+discard """
+  description: '''
+    Ensure that converters are considered with each 'of'-branch label syntax.
+  '''
+"""
+
+converter f2i(x: float): int8 =
+  int8(x)
+
+proc test(x: int8): int =
+  case x
+  of 1.0:
+    1
+  of 2.2 .. 3.3: # with range syntax: 2 .. 3
+    2
+  of [4.1, 6.1]: # with array constructor syntax: 4, 6
+    3
+  of @[10.1] & @[12.1]: # with compile-time-evaluated sequence: 10, 12
+    4
+  else:
+    5
+
+doAssert test(1) == 1
+doAssert test(2) == 2
+doAssert test(3) == 2
+doAssert test(4) == 3
+doAssert test(6) == 3
+doAssert test(10) == 4
+doAssert test(12) == 4
+doAssert test(11) == 5 # covered by the else branch

From 05e3db8560645fb2b0f1b41321669e89ae614d80 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sun, 28 Apr 2024 00:49:15 +0200
Subject: [PATCH 073/169] mirpasses: implement string COW handling with MIR
 pass (#1287)

## Summary

Perform the injection of runtime procedure calls for handling copy-on-
write strings with an MIR pass, instead of doing it in the C code
generator, removing another responsibility from the latter.

## Details

The new MIR pass does the equivalent of what `cgen` previously did,
that is, injecting `nimPrepareStrMutationV2` calls wherever a string's
underlying storage might be modified.

The injection logic, together with the `lfPrepareForMutation` flag, is
removed from `cgen`.
---
 compiler/backend/ccgcalls.nim |  2 --
 compiler/backend/ccgexprs.nim | 18 ++---------
 compiler/backend/ccgstmts.nim |  4 +--
 compiler/backend/cgendata.nim |  1 -
 compiler/mir/mirpasses.nim    | 58 +++++++++++++++++++++++++++++++++++
 5 files changed, 63 insertions(+), 20 deletions(-)

diff --git a/compiler/backend/ccgcalls.nim b/compiler/backend/ccgcalls.nim
index a9cdb221b2d..f30e5356990 100644
--- a/compiler/backend/ccgcalls.nim
+++ b/compiler/backend/ccgcalls.nim
@@ -171,8 +171,6 @@ proc genOpenArraySlice(p: BProc; q: CgNode; formalType, destType: PType): (Rope,
               lengthExpr)
   of tyString, tySequence:
     let atyp = skipTypes(a.t, abstractInst)
-    if formalType.skipTypes(abstractInst).kind in {tyVar} and atyp.kind == tyString:
-      linefmt(p, cpsStmts, "#nimPrepareStrMutationV2($1);$n", [byRefLoc(p, a)])
     if atyp.kind in {tyVar}:
       result = ("((*$1).p != NIM_NIL ? ($4*)(*$1)$3+$2 : NIM_NIL)" %
                   [rdLoc(a), rdLoc(b), dataField(p), dest],
diff --git a/compiler/backend/ccgexprs.nim b/compiler/backend/ccgexprs.nim
index aa495980c9b..fa646b2b1b1 100644
--- a/compiler/backend/ccgexprs.nim
+++ b/compiler/backend/ccgexprs.nim
@@ -128,18 +128,12 @@ proc genOpenArrayConv(p: BProc; d: TLoc; a: TLoc) =
     else:
       linefmt(p, cpsStmts, "$1.Field0 = $2; $1.Field1 = $2Len_0;$n",
         [rdLoc(d), a.rdLoc])
-  of tySequence:
+  of tySequence, tyString:
     linefmt(p, cpsStmts, "$1.Field0 = ($2.p != NIM_NIL ? $2$3 : NIM_NIL); $1.Field1 = $4;$n",
       [rdLoc(d), a.rdLoc, dataField(p), lenExpr(p, a)])
   of tyArray:
     linefmt(p, cpsStmts, "$1.Field0 = $2; $1.Field1 = $3;$n",
       [rdLoc(d), rdLoc(a), rope(lengthOrd(p.config, a.t))])
-  of tyString:
-    if skipTypes(d.t, abstractInst).kind in {tyVar}:
-      linefmt(p, cpsStmts, "#nimPrepareStrMutationV2($1);$n", [byRefLoc(p, a)])
-
-    linefmt(p, cpsStmts, "$1.Field0 = ($2.p != NIM_NIL ? $2$3 : NIM_NIL); $1.Field1 = $4;$n",
-      [rdLoc(d), a.rdLoc, dataField(p), lenExpr(p, a)])
   else:
     internalError(p.config, a.lode.info, "cannot handle " & $a.t.kind)
 
@@ -506,16 +500,13 @@ proc genDeref(p: BProc, e: CgNode, d: var TLoc) =
       discard getTypeDesc(p.module, e.typ)
       putIntoDest(p, d, e, "(*$1)" % [rdLoc(a)], a.storage)
 
-proc genAddr(p: BProc, e: CgNode, mutate: bool, d: var TLoc) =
+proc genAddr(p: BProc, e: CgNode, d: var TLoc) =
   if mapType(p.config, e.operand.typ) == ctArray:
     expr(p, e.operand, d)
   else:
     var a: TLoc
     initLoc(a, locNone, e.operand, OnUnknown)
     a.flags.incl lfWantLvalue
-    if mutate:
-      a.flags.incl lfPrepareForMutation
-
     expr(p, e.operand, a)
     putIntoDest(p, d, e, addrLoc(p.config, a), a.storage)
 
@@ -751,8 +742,6 @@ proc genSeqElem(p: BProc, n, x, y: CgNode, d: var TLoc) =
   if skipTypes(a.t, abstractVar).kind in {tyRef, tyPtr}:
     a.r = ropecg(p.module, "(*$1)", [a.r])
 
-  if lfPrepareForMutation in d.flags and ty.kind == tyString:
-    linefmt(p, cpsStmts, "#nimPrepareStrMutationV2($1);$n", [byRefLoc(p, a)])
   putIntoDest(p, d, n,
               ropecg(p.module, "$1$3[$2]", [rdLoc(a), rdCharLoc(b), dataField(p)]), a.storage)
 
@@ -2024,8 +2013,7 @@ proc expr(p: BProc, n: CgNode, d: var TLoc) =
       # ``&(*x)`` to just ``x``
       expr(p, n.operand.operand, d)
     else:
-      let mutate = n.kind == cnkHiddenAddr and n.typ.kind == tyVar
-      genAddr(p, n, mutate, d)
+      genAddr(p, n, d)
   of cnkArrayAccess: genArrayLikeElem(p, n, d)
   of cnkTupleAccess:
     if n[0].typ.skipTypes(abstractInst).kind == tyProc:
diff --git a/compiler/backend/ccgstmts.nim b/compiler/backend/ccgstmts.nim
index 3bed1798f6a..bd918b3d4f2 100644
--- a/compiler/backend/ccgstmts.nim
+++ b/compiler/backend/ccgstmts.nim
@@ -492,9 +492,9 @@ proc genAsgn(p: BProc, e: CgNode) =
     let ri = e[1]
     var a: TLoc
     initLoc(a, locNone, le, OnUnknown)
-    a.flags.incl {lfEnforceDeref, lfPrepareForMutation, lfWantLvalue}
+    a.flags.incl {lfEnforceDeref, lfWantLvalue}
     expr(p, le, a)
-    a.flags.excl {lfPrepareForMutation, lfWantLvalue}
+    a.flags.excl {lfWantLvalue}
     assert(a.t != nil)
     genLineDir(p, ri)
     loadInto(p, le, ri, a)
diff --git a/compiler/backend/cgendata.nim b/compiler/backend/cgendata.nim
index 5f939582a67..7cb19ded484 100644
--- a/compiler/backend/cgendata.nim
+++ b/compiler/backend/cgendata.nim
@@ -79,7 +79,6 @@ type
     lfEnforceDeref           ## a copyMem is required to dereference if this a
                              ## ptr array due to C array limitations.
                              ## See #1181, #6422, #11171
-    lfPrepareForMutation     ## string location is about to be mutated
     lfWantLvalue             ## on empty locs, signals that a C lvalue is
                              ## expected
 
diff --git a/compiler/mir/mirpasses.nim b/compiler/mir/mirpasses.nim
index ecbca601fb7..3fb33dea804 100644
--- a/compiler/mir/mirpasses.nim
+++ b/compiler/mir/mirpasses.nim
@@ -62,6 +62,12 @@ template subTree(bu: var MirBuilder, k: MirNodeKind, t: TypeId,
   bu.subTree MirNode(kind: k, typ: t):
     body
 
+func getStmt(tree: MirTree, n: NodePosition): NodePosition =
+  ## Returns the statement `n` is part of.
+  result = n
+  while tree[result].kind notin StmtNodes:
+    result = tree.parent(result)
+
 iterator search(tree: MirTree, kinds: static set[MirNodeKind]): NodePosition =
   ## Returns in order of appearance the positions of all nodes matching the
   ## given `kinds`.
@@ -549,6 +555,57 @@ proc lowerNew(tree: MirTree, graph: ModuleGraph, env: var MirEnv,
       changes.replaceMulti(tree, call, bu):
         bu.move tmp
 
+proc injectStrPreparation(tree: MirTree, graph: ModuleGraph, env: var MirEnv,
+                          changes: var Changeset) =
+  ## Injects the calls to the runtime for making sure copy-on-write strings
+  ## work. Whenever a string's underlying storage is modified, it needs to be
+  ## ensured that the storage is actually writable (copy on write).
+  let prc = graph.getCompilerProc("nimPrepareStrMutationV2")
+
+  proc insertPrepareCall(changes: var Changeset, tree: MirTree,
+                         src: NodePosition, prc: ProcedureId) {.nimcall.} =
+    ## Insert the call prior to the statement `src` is part of.
+    let stmt = getStmt(tree, src)
+    changes.insert(tree, stmt, src, bu):
+      bu.subTree mnkVoid:
+        bu.buildCall prc, VoidType:
+          bu.emitByName ekMutate:
+            bu.emitFrom(tree, src)
+
+  template isStringAccess(n: NodePosition): bool =
+    tree[n].kind == mnkPathArray and
+      env[tree[n, 0].typ].skipTypes(abstractInst).kind == tyString
+
+  # search for all operations that modify, or potentially modify, a string's
+  # storage
+  for i, node in tree.pairs:
+    case node.kind
+    of mnkAsgn, mnkInit, mnkMutView, mnkTag:
+      let op = tree.child(i, 0) # the operand
+      if isStringAccess(op):
+        # either
+        # * a mutable view of a string element is created
+        # * OR an element within the string is directly assigned to
+        insertPrepareCall(changes, tree, tree.child(op, 0),
+                          env.procedures.add(prc))
+
+    of mnkToMutSlice:
+      if env[tree[i, 0].typ].skipTypes(abstractInst).kind == tyString:
+        # conservatively prepare the string for mutation when creating a
+        # mutable slice of its storage
+        insertPrepareCall(changes, tree, tree.child(i, 0),
+                          env.procedures.add(prc))
+
+    of mnkBindMut:
+      let op = tree.child(i, 1) # the operand
+      if isStringAccess(op):
+        # just creating a mutable binding to the element doesn't imply
+        # mutation, but it's simpler to assume it does
+        insertPrepareCall(changes, tree, tree.child(op, 0),
+                          env.procedures.add(prc))
+
+    else:
+      discard "not relevant"
 
 proc applyPasses*(body: var MirBody, prc: PSym, env: var MirEnv,
                   graph: ModuleGraph, target: TargetBackend) =
@@ -582,6 +639,7 @@ proc applyPasses*(body: var MirBody, prc: PSym, env: var MirEnv,
 
     if target == targetC:
       lowerNew(body.code, graph, env, c)
+      injectStrPreparation(body.code, graph, env, c)
 
   # instrument the body with profiler calls after all lowerings, but before
   # optimization

From d24fb098b8f037a61ad8bb4c86db37d7a2221f86 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sun, 28 Apr 2024 18:40:20 +0200
Subject: [PATCH 074/169] mirgen: better code generation for `high` (#1286)

## Summary

Omit unnecessary to-slice conversions for `high(x)` calls where `x` is
a `seq` value, resulting in a small compiler speedup. All backends are
affected.

## Details

There's no dedicated `high` overload for `seq`, so the `openArray`
overload is picked for `seq` arguments. The implicit argument
conversion was previously translated as is, resulting in an extra
temporary and conversion operation, both of which are unnecessary, since
all three code generators support `high` for `tySequence` operands.

While an optimizing C compiler is able to eliminate the conversion,
doing it on the NimSkull side still benefits debug builds and the
JavaScript and VM targets, as well as reducing the workload for the MIR
passes and code generators.

### Tests

* add a new test category for optimization-related tests
* add a test to ensure there's no conversion for `high(seq)` calls
---
 compiler/mir/mirgen.nim                      | 10 ++++++++++
 tests/optimization/README.md                 |  2 ++
 tests/optimization/tno_conv_for_seq_high.nim | 16 ++++++++++++++++
 3 files changed, 28 insertions(+)
 create mode 100644 tests/optimization/README.md
 create mode 100644 tests/optimization/tno_conv_for_seq_high.nim

diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index 173a08e16da..c745625a163 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -940,6 +940,16 @@ proc genMagic(c: var TCtx, n: PNode; m: TMagic) =
         c.userOptions = {}
         genx(c, n[1])
         c.userOptions = orig
+  of mHigh:
+    # custom translation in order to skip both explicit and implicit to-slice
+    # conversions; those are unnecessary
+    c.buildMagicCall mHigh, rtyp:
+      var arg = n[1]
+      while arg.kind in {nkConv, nkHiddenStdConv, nkHiddenSubConv} and
+            classifyBackendView(arg.typ) == bvcSequence:
+        arg = arg[^1]
+
+      c.emitOperandTree arg, sink=false
 
   # arithmetic operations:
   of mAddI, mSubI, mMulI, mDivI, mModI, mPred, mSucc:
diff --git a/tests/optimization/README.md b/tests/optimization/README.md
new file mode 100644
index 00000000000..e85d349f6a6
--- /dev/null
+++ b/tests/optimization/README.md
@@ -0,0 +1,2 @@
+Tests that, for the purpose of ensuring that some optimization takes place (or
+not), inspect compiler output belong here.
\ No newline at end of file
diff --git a/tests/optimization/tno_conv_for_seq_high.nim b/tests/optimization/tno_conv_for_seq_high.nim
new file mode 100644
index 00000000000..b3d4a9da50f
--- /dev/null
+++ b/tests/optimization/tno_conv_for_seq_high.nim
@@ -0,0 +1,16 @@
+discard """
+  description: '''
+    Ensure that no to-slice conversion is emitted for `high` calls with
+    `seq` arguments
+  '''
+  action: compile
+  matrix: "--expandArc:test"
+  nimout: '''--expandArc: test
+scope:
+  result = high(arg x)
+
+-- end of expandArc ------------------------'''
+"""
+
+proc test(x: seq[int]): int {.exportc.} =
+  result = high(x)

From 46019b440a517364f10d574de425c54c08dc594e Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sun, 28 Apr 2024 19:27:07 +0200
Subject: [PATCH 075/169] cgen: better code generation for `.noreturn` calls
 (#1288)

## Summary

Improve C code generation for `.noreturn` calls, by omitting the
unnecessary error flag check for them.

## Details

If a procedure only returns due to exceptional unwinding, the
`if(NIM_UNLIKELY(*nimErr_))` guard guarding the unwinding is
unnecessary, since it's guaranteed that the error flag is set (all
exits of the procedure are due to exceptional unwinding).

Unconditionally jumping to the error handling target makes it clear
to the C compiler that control-flow doesn't continue normally after
the call.

### Other improvements

In addition, the `canRaiseConservative` usage is unnecessary too, since
a `cnkCheckedCall` already signals that the call can raise. The
procedure has no more users and is thus removed.

Finally, for compilers that support it, a call to a `.noreturn`
procedure that doesn't raise is now followed by an `__assume(0)`
statement, communicating to the C compiler that control-flow never
returns to the caller.
---
 compiler/backend/ccgcalls.nim | 26 +++++++++++++++++++-------
 compiler/backend/compat.nim   |  6 ------
 2 files changed, 19 insertions(+), 13 deletions(-)

diff --git a/compiler/backend/ccgcalls.nim b/compiler/backend/ccgcalls.nim
index f30e5356990..b2796ada2df 100644
--- a/compiler/backend/ccgcalls.nim
+++ b/compiler/backend/ccgcalls.nim
@@ -76,18 +76,30 @@ proc isHarmlessStore(p: BProc; ri: CgNode, d: TLoc): bool =
 
 proc exitCall(p: BProc, call: CgNode) =
   ## Emits the exceptional control-flow related post-call logic.
+  let isNoReturn = call[0].kind == cnkProc and
+                   sfNoReturn in p.env[call[0].prc].flags
   if call.kind == cnkCheckedCall:
-    if nimErrorFlagDisabled in p.flags:
-      if call[0].kind == cnkProc and sfNoReturn in p.env[call[0].prc].flags and
-         canRaiseConservative(p.env, call[0]):
-        # when using goto-exceptions, noreturn doesn't map to "doesn't return"
-        # at the C-level. In order to still support dispatching to wrapper
-        # procedures around ``raise`` from inside ``.compilerprocs``, we emit
-        # an exit after the call
+    if isNoReturn:
+      # the callee raises and doesn't have a normal exit -> testing the error
+      # flag is unnecessary
+      if nimErrorFlagDisabled in p.flags:
+        # don't jump to the error target. Both exception handlers and
+        # finalizers require disabling error mode, but due to the flag being
+        # inaccessible, that's not going to work
+        # XXX: as an interim solution, skipping handlers is safer than
+        #      attempting to execute them. Ultimately, the error flag needs
+        #      to be available everywhere
         p.flags.incl beforeRetNeeded
         lineF(p, cpsStmts, "goto BeforeRet_;$n", [])
+      else:
+        # jump to the handler/finalizer
+        lineF(p, cpsStmts, "$1$n", [raiseInstr(p, call[^1])])
     else:
       raiseExit(p, call[^1])
+  elif isNoReturn:
+    # mark the control-flow path following the call as unreachable
+    if hasAssume in CC[p.config.cCompiler].props:
+      lineF(p, cpsStmts, "__assume(0);$n", [])
 
 proc fixupCall(p: BProc, le, ri: CgNode, d: var TLoc,
                callee, params: Rope) =
diff --git a/compiler/backend/compat.nim b/compiler/backend/compat.nim
index 23539a05dce..fa78e7e9c0a 100644
--- a/compiler/backend/compat.nim
+++ b/compiler/backend/compat.nim
@@ -102,12 +102,6 @@ proc isDeepConstExpr*(n: CgNode): bool =
   else:
     result = false
 
-proc canRaiseConservative*(env: MirEnv, fn: CgNode): bool =
-  ## Duplicate of `canRaiseConservative <ast_query.html#canRaiseConservative,PNode>`_.
-  # ``mNone`` is also included in the set, therefore this check works even for
-  # non-magic calls
-  getCalleeMagic(env, fn) in magicsThatCanRaise
-
 proc toBitSet*(conf: ConfigRef; s: CgNode): TBitSet =
   ## Duplicate of `toBitSet <nimsets.html#toBitSet,ConfigRef,PNode>`_
   bitSetInit(result, int(getSize(conf, s.typ)))

From 8cdd91394d43c2cf43208fdfa30ae3331d445fe3 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Mon, 29 Apr 2024 22:35:56 +0200
Subject: [PATCH 076/169] system: mark `raiseX` runtime procedures as noreturn
 (#1289)

## Summary

Mark the `raiseX` runtime procedures used by the C backend as
`.noreturn`, to allow for generation of more efficient code.

## Details

For less code duplication, the `.noinline`, `.noreturn`, and
`.compilerproc` pragmas are combined into the custom `.errorPrc`
pragma.

At the moment, code generation is not affected, since `cgen` itself
emits calls to the `raiseX` procedures, but this is going to change
once MIR passes perform lowering of the runtime checks.
---
 lib/system/chcks.nim      | 34 +++++++++++++++++++---------------
 lib/system/integerops.nim |  8 ++++----
 2 files changed, 23 insertions(+), 19 deletions(-)

diff --git a/lib/system/chcks.nim b/lib/system/chcks.nim
index d6507709912..f32726e98f4 100644
--- a/lib/system/chcks.nim
+++ b/lib/system/chcks.nim
@@ -10,41 +10,45 @@
 # Implementation of some runtime checks.
 include system/indexerrors
 
-proc raiseRangeError(val: BiggestInt) {.compilerproc, noinline.} =
+# don't inline the raise procedures in order to reduce both executable size
+# and I-cache pressure
+{.pragma: errorPrc, compilerproc, noinline, noreturn.}
+
+proc raiseRangeError(val: BiggestInt) {.errorPrc.} =
   when hostOS == "standalone":
     sysFatal(RangeDefect, "value out of range")
   else:
     sysFatal(RangeDefect, "value out of range: ", $val)
 
-proc raiseIndexError3(i, a, b: int) {.compilerproc, noinline.} =
+proc raiseIndexError3(i, a, b: int) {.errorPrc.} =
   sysFatal(IndexDefect, formatErrorIndexBound(i, a, b))
 
-proc raiseIndexError2(i, n: int) {.compilerproc, noinline.} =
+proc raiseIndexError2(i, n: int) {.errorPrc.} =
   sysFatal(IndexDefect, formatErrorIndexBound(i, n))
 
-proc raiseIndexError() {.compilerproc, noinline.} =
+proc raiseIndexError() {.errorPrc.} =
   sysFatal(IndexDefect, "index out of bounds")
 
-proc raiseFieldError(f: string) {.compilerproc, noinline.} =
+proc raiseFieldError(f: string) {.errorPrc.} =
   ## remove after bootstrap > 1.5.1
   sysFatal(FieldDefect, f)
 
-proc raiseFieldErrorBool(f: string, val: bool) {.compilerproc, noinline.} =
+proc raiseFieldErrorBool(f: string, val: bool) {.errorPrc.} =
   sysFatal(FieldError, formatFieldDefect(f, $val))
 
 when false:
   # XXX: the character value needs to be escaped properly, but the ``reprChar``
   #      is not defined yet (or at all)
-  proc raiseFieldErrorChar(f: string, val: char) {.compilerproc, noinline.} =
+  proc raiseFieldErrorChar(f: string, val: char) {.errorPrc.} =
     sysFatal(FieldError, formatFieldDefect(f, $val))
 
-proc raiseFieldErrorInt(f: string, val: int64) {.compilerproc, noinline.} =
+proc raiseFieldErrorInt(f: string, val: int64) {.errorPrc.} =
   sysFatal(FieldError, formatFieldDefect(f, $val))
 
-proc raiseFieldErrorUInt(f: string, val: uint64) {.compilerproc, noinline.} =
+proc raiseFieldErrorUInt(f: string, val: uint64) {.errorPrc.} =
   sysFatal(FieldError, formatFieldDefect(f, $val))
 
-proc raiseFieldErrorStr(f: string, val: string) {.compilerproc, noinline.} =
+proc raiseFieldErrorStr(f: string, val: string) {.errorPrc.} =
   sysFatal(FieldError, formatFieldDefect(f, val))
 
 when defined(nimV2):
@@ -56,26 +60,26 @@ else:
     ## Obsolete. Remove after updating the csources compiler
     sysFatal(FieldError, formatFieldDefect(f, discVal))
 
-proc raiseRangeErrorI(i, a, b: BiggestInt) {.compilerproc, noinline.} =
+proc raiseRangeErrorI(i, a, b: BiggestInt) {.errorPrc.} =
   when defined(standalone):
     sysFatal(RangeDefect, "value out of range")
   else:
     sysFatal(RangeDefect, "value out of range: " & $i & " notin " & $a & " .. " & $b)
 
-proc raiseRangeErrorF(i, a, b: float) {.compilerproc, noinline.} =
+proc raiseRangeErrorF(i, a, b: float) {.errorPrc.} =
   when defined(standalone):
     sysFatal(RangeDefect, "value out of range")
   else:
     sysFatal(RangeDefect, "value out of range: " & $i & " notin " & $a & " .. " & $b)
 
-proc raiseRangeErrorU(i, a, b: uint64) {.compilerproc, noinline.} =
+proc raiseRangeErrorU(i, a, b: uint64) {.errorPrc.} =
   # todo: better error reporting
   sysFatal(RangeDefect, "value out of range")
 
-proc raiseRangeErrorNoArgs() {.compilerproc, noinline.} =
+proc raiseRangeErrorNoArgs() {.errorPrc.} =
   sysFatal(RangeDefect, "value out of range")
 
-proc raiseObjectConversionError() {.compilerproc, noinline.} =
+proc raiseObjectConversionError() {.errorPrc.} =
   sysFatal(ObjectConversionDefect, "invalid object conversion")
 
 proc chckIndx(i, a, b: int): int =
diff --git a/lib/system/integerops.nim b/lib/system/integerops.nim
index 4ef3594f118..d543fd3bbdb 100644
--- a/lib/system/integerops.nim
+++ b/lib/system/integerops.nim
@@ -10,11 +10,11 @@
 # Integer arithmetic with overflow checking. Uses
 # intrinsics or inline assembler.
 
-proc raiseOverflow {.compilerproc, noinline.} =
+proc raiseOverflow {.errorPrc.} =
   # a single proc to reduce code size to a minimum
   sysFatal(OverflowDefect, "over- or underflow")
 
-proc raiseDivByZero {.compilerproc, noinline.} =
+proc raiseDivByZero {.errorPrc.} =
   sysFatal(DivByZeroDefect, "division by zero")
 
 {.pragma: nimbaseH, importc, nodecl, noSideEffect, compilerproc.}
@@ -122,10 +122,10 @@ template divImplFallback(name, T) {.dirty.} =
 divImplFallback(nimDivInt, int)
 divImplFallback(nimDivInt64, int64)
 
-proc raiseFloatInvalidOp {.compilerproc, noinline.} =
+proc raiseFloatInvalidOp {.errorPrc.} =
   sysFatal(FloatInvalidOpDefect, "FPU operation caused a NaN result")
 
-proc raiseFloatOverflow(x: float64) {.compilerproc, noinline.} =
+proc raiseFloatOverflow(x: float64) {.errorPrc.} =
   if x > 0.0:
     sysFatal(FloatOverflowDefect, "FPU operation caused an overflow")
   else:

From 2941acce50f10f6d2ea999cf93e454c3f5ae53e3 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Tue, 30 Apr 2024 21:36:44 +0200
Subject: [PATCH 077/169] refactor(pragmas): improve `processCompile` (#1294)

## Summary

Refactor the `pragmas.processCompile` procedure to not mutate input
AST, and add a specification test for the undocumented pattern-matching
version of `.compile`.

## Details

For `pragmas.processCompile`:
* don't mutate input AST
* use proper error propagation (i.e., keep the shape of the AST intact)
* test that the specified path is relative before trying to interpret
  it as a relative path (less work)

The `.compile` pragma has a pattern-matching version, but this was
not documented anywhere. A specification test derived from the current
behaviour is added for it.
---
 compiler/sem/pragmas.nim                      | 117 +++++++++---------
 .../s01_interop/t06_compile_pattern.nim       |  22 ++++
 2 files changed, 82 insertions(+), 57 deletions(-)
 create mode 100644 tests/lang/s05_pragmas/s01_interop/t06_compile_pattern.nim

diff --git a/compiler/sem/pragmas.nim b/compiler/sem/pragmas.nim
index f6b50c29ca2..4a2ad2d0f0a 100644
--- a/compiler/sem/pragmas.nim
+++ b/compiler/sem/pragmas.nim
@@ -709,9 +709,9 @@ proc relativeFile(c: PContext; name: string, info: TLineInfo;
 
 proc processCompile(c: PContext, n: PNode): PNode =
   ## compile pragma
-  ## produces (mutates) `n`, which must be a callable, analysing its arg, or returning
-  ## `n` wrapped in an error.
-  result = n
+  ## Produces the pragma with all arguments evaluated, or returns an error.
+  ## If the pragma is well-formed, the external files to compile are added to
+  ## the build.
   proc docompile(c: PContext; it: PNode; src, dest: AbsoluteFile; customArgs: string) =
     var cf = Cfile(nimname: splitFile(src).name,
                    cname: src, obj: dest, flags: {CfileFlag.External},
@@ -719,65 +719,68 @@ proc processCompile(c: PContext, n: PNode): PNode =
     extccomp.addExternalFileToCompile(c.config, cf)
     recordPragma(c, it, "compile", src.string, dest.string, customArgs)
 
-  proc getStrLit(c: PContext, n: PNode; i: int): (string, PNode) =
-    n[i] = c.semConstExpr(c, n[i])
-    case n[i].kind
-    of nkStrLit, nkRStrLit, nkTripleStrLit:
-      shallowCopy(result[0], n[i].strVal)
-      result[1] = nil
+  proc expectString(c: PContext, n: PNode): PNode =
+    result = c.semConstExpr(c, n)
+    case result.kind
+    of nkStrLiterals:
+      discard "all good"
     else:
-      result = ("", c.config.newError(
-        n, PAstDiag(kind: adSemStringLiteralExpected)))
-
-  let it = if n.kind in nkPragmaCallKinds and n.len == 2: n[1] else: n
-  if it.kind in {nkPar, nkTupleConstr} and it.len == 2:
-    let
-      (s, sErr) = getStrLit(c, it, 0)
-      (dest, destErr) = getStrLit(c, it, 1)
+      result = c.config.newError(n, PAstDiag(kind: adSemStringLiteralExpected))
 
-    if sErr != nil:
-      result = sErr
-    elif destErr != nil:
-      result = destErr
-    else:
-      var found = parentDir(toFullPath(c.config, n.info)) / s
-      for f in os.walkFiles(found):
-        let obj = completeCfilePath(c.config, AbsoluteFile(dest % extractFilename(f)))
-        docompile(c, it, AbsoluteFile f, obj, "")
-  else:
-    var
-      s = ""
-      customArgs = ""
-      err: PNode
-    if n.kind in nkCallKinds:
-      (s, err) = getStrLit(c, n, 1)
-      if err.isNil:
-        if n.len <= 3:
-          (customArgs, err) = getStrLit(c, n, 2)
-          if err != nil:
-            result = err
-            return
-        else:
-          result = c.config.newError(n, PAstDiag(
-            kind: adSemExcessiveCompilePragmaArgs))
-          return
-      else:
-        result = err
-        return
+  if n.kind notin nkPragmaCallKinds:
+    result = invalidPragma(c, n)
+  elif n.len == 2 and n[1].kind == nkTupleConstr and n[1].len == 2:
+    # the pattern matching version of the pragma
+    result = shallowCopy(n)
+    result[0] = n[0]
+    # both operands need to be strings:
+    let tup = shallowCopy(n[1])
+    tup[0] = expectString(c, n[1][0]) # input pattern
+    tup[1] = expectString(c, n[1][1]) # object file pattern
+    result[1] = tup
+
+    if nkError in {tup[0].kind, tup[1].kind}:
+      return c.config.wrapError(result)
+
+    # add all files matching the pattern to the build:
+    let found = parentDir(toFullPath(c.config, n.info)) / tup[0].strVal
+    for f in os.walkFiles(found):
+      let obj = completeCfilePath(c.config,
+                                  AbsoluteFile(tup[1].strVal % extractFilename(f)))
+      docompile(c, n, AbsoluteFile f, obj, "")
+
+  elif n.len <= 3:
+    # the single file version. Can either have 1 or 2 arguments, both which must
+    # be strings
+    result = shallowCopy(n)
+    result[0] = n[0] # use the identifier as is
+    var hasError = false
+    for i in 1..<n.len:
+      result[i] = expectString(c, n[i])
+      hasError = hasError or result[i].isError
+
+    if hasError:
+      return c.config.wrapError(result)
+
+    # find the file and add it to the build:
+    let file = result[1].strVal # file path
+    var found: AbsoluteFile
+    if isAbsolute(file):
+      found = AbsoluteFile file
     else:
-      (s, err) = strLitToStrOrErr(c, n)
-      if err != nil:
-        result = err
-        return
+      # first, look for the file relative to the current directory
+      found = AbsoluteFile(parentDir(toFullPath(c.config, n.info)) / file)
+      if not fileExists(found):
+        # look up the file relative to the search paths:
+        found = findFile(c.config, file)
+        if found.isEmpty: found = AbsoluteFile file
 
-    var found = AbsoluteFile(parentDir(toFullPath(c.config, n.info)) / s)
-    if not fileExists(found):
-      if isAbsolute(s): found = AbsoluteFile s
-      else:
-        found = findFile(c.config, s)
-        if found.isEmpty: found = AbsoluteFile s
     let obj = toObjFile(c.config, completeCfilePath(c.config, found, false))
-    docompile(c, it, found, obj, customArgs)
+    docompile(c, n, found, obj, (if n.len == 2: "" else: result[2].strVal))
+  else:
+    # too many arguments
+    result = c.config.newError(n,
+      PAstDiag(kind: adSemExcessiveCompilePragmaArgs))
 
 proc processLink(c: PContext, n: PNode): PNode =
   result = n
diff --git a/tests/lang/s05_pragmas/s01_interop/t06_compile_pattern.nim b/tests/lang/s05_pragmas/s01_interop/t06_compile_pattern.nim
new file mode 100644
index 00000000000..8b117da7bb9
--- /dev/null
+++ b/tests/lang/s05_pragmas/s01_interop/t06_compile_pattern.nim
@@ -0,0 +1,22 @@
+discard """
+  description: '''
+    The `compile` pragma can also be used to compile all files matching a
+    pattern, by providing a two-element tuple argument.
+  '''
+  targets: "c"
+  joinable: false
+"""
+
+## The first operand is a file pattern for matching the C files to add to the
+## build. Only `*.suffix` patterns are guaranteed to work. The pattern is
+## relative to the current module's parent directory.
+##
+## The second operand specifies a pattern for the object file name. The object
+## file(s) are always placed in the project's cache directory, even if the
+## pattern evaluates to an absolute or relative file path. Similarly, the file
+## extension in the pattern is ignored too.
+{.compile: ("*.c", "~/cache/$1_generated.suffix").}
+
+proc c_compiled_only(arg: cint): cint {.importc.}
+
+doAssert c_compiled_only(1) == 2

From 0e88f12d656e58c371bf87882517639d24400e82 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Tue, 30 Apr 2024 22:43:27 +0200
Subject: [PATCH 078/169] lower `mChckRange` magic with MIR pass (#1290)

## Summary

Lower the `mChckRange` magic with a MIR pass instead of as part of C
code generation, shrinking down `cgen`. A bug where no range errors
were reported for some `uint`/`uint64`-to-signed-integer conversions is
fixed too.

## Details

The lowering pass is implemented in the new `rtchecks` module, which is
also going to host the lowerings for the other run-time check magics.

The pass turns `chckRange(x, a, b)` into the MIR equivalent of
`(if x < a or b < x: raiseRangeError(...); Target(x))`.

### Float checks

For to-`float` range checks, the to-be-converted value is first
converted to the output type, and then it's compared against the
specified lower and upper bound.

### Integer checks

For to-integer range checks, the lower and upper bound integer values
are first converted to the source type, but only if they're within the
source type's range. For example, for
`chckRange(x, 0'i16, 32_767'i16)`, where `x` is an `int8`, the
`32_767 < x` comparison is unnecessary, since it's guaranteed to be false.

### Bugfix

For `uint`-to-`int` conversion range checks, the lower bound was
previously not considered, resulting in conversions such as
`range[1..5](x)` not triggering a range error when `x` < 1. The MIR
pass addresses this.

A regression test is added to `trangechecks.nim`.

### Other

`mirgen` incorrectly assigned the `range`/`enum` type to the
intermediate temporary when lowering `dec`/`inc` into a `-`/`+` + range
check + assignment. Since the input and output type for the range check
are then the same, the `mChckRange` lowering pass would erroneously
optimize the call away.

To address this, `mirgen` now assigns the `range`/`enum` type's
underlying integer type to the temporary.
---
 compiler/backend/ccgexprs.nim |  34 ------
 compiler/mir/mirgen.nim       |   7 +-
 compiler/mir/mirpasses.nim    |   2 +
 compiler/mir/rtchecks.nim     | 192 ++++++++++++++++++++++++++++++++++
 compiler/modules/magicsys.nim |  20 ++--
 tests/misc/trangechecks.nim   |   9 +-
 6 files changed, 219 insertions(+), 45 deletions(-)
 create mode 100644 compiler/mir/rtchecks.nim

diff --git a/compiler/backend/ccgexprs.nim b/compiler/backend/ccgexprs.nim
index fa646b2b1b1..aca17171ecd 100644
--- a/compiler/backend/ccgexprs.nim
+++ b/compiler/backend/ccgexprs.nim
@@ -1430,38 +1430,6 @@ proc genCast(p: BProc, e: CgNode, d: var TLoc) =
     # C code; plus it's the right thing to do for closures:
     genSomeCast(p, e, d)
 
-proc genRangeChck(p: BProc, n: CgNode, d: var TLoc) =
-  var a: TLoc
-  var dest = skipTypes(n.typ, abstractVar)
-  initLocExpr(p, n[1], a)
-  if true:
-    let n0t = n[1].typ
-
-    # emit range check:
-    if n0t.kind in {tyUInt, tyUInt64}:
-      linefmt(p, cpsStmts, "if ($1 > ($6)($3)){ #raiseRangeErrorNoArgs(); $5}$n",
-        [rdCharLoc(a), genLiteral(p, n[2], dest), genLiteral(p, n[3], dest),
-        raiser, raiseInstr(p, n.exit), getTypeDesc(p.module, n0t)])
-    else:
-      let raiser =
-        case skipTypes(n.typ, abstractVarRange).kind
-        of tyUInt..tyUInt64, tyChar: "raiseRangeErrorU"
-        of tyFloat..tyFloat64: "raiseRangeErrorF"
-        else: "raiseRangeErrorI"
-      discard cgsym(p.module, raiser)
-
-      let boundaryCast =
-        if n0t.skipTypes(abstractVarRange).kind in {tyUInt, tyUInt32, tyUInt64} or
-            (n0t.sym != nil and sfSystemModule in n0t.sym.owner.flags and n0t.sym.name.s == "csize"):
-          "(NI64)"
-        else:
-          ""
-      linefmt(p, cpsStmts, "if ($6($1) < $2 || $6($1) > $3){ $4($1, $2, $3); $5}$n",
-        [rdCharLoc(a), genLiteral(p, n[2], dest), genLiteral(p, n[3], dest),
-        raiser, raiseInstr(p, n.exit), boundaryCast])
-  putIntoDest(p, d, n, "(($1) ($2))" %
-      [getTypeDesc(p.module, dest), rdCharLoc(a)], a.storage)
-
 proc genConv(p: BProc, e: CgNode, d: var TLoc) =
   let destType = e.typ.skipTypes({tyVar, tyLent, tyGenericInst, tyAlias, tySink})
   if sameBackendType(destType, e.operand.typ):
@@ -1677,8 +1645,6 @@ proc genMagicExpr(p: BProc, e: CgNode, d: var TLoc, op: TMagic) =
       typ.add "*"
 
     linefmt(p, cpsStmts, "$1 = ($2)($3);$n", [a.r, typ, rdLoc(b)])
-  of mChckRange:
-    genRangeChck(p, e, d)
   of mChckNaN:
     var a: TLoc
     initLocExpr(p, e[1], a)
diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index c745625a163..36030ca8be5 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -1009,8 +1009,11 @@ proc genMagic(c: var TCtx, n: PNode; m: TMagic) =
         if optRangeCheck in c.userOptions and
            typ.skipTypes(abstractInst).kind in {tyRange, tyEnum}:
           # needs an additional range check in order to ensure that the value
-          # is in range
-          let val = c.wrapTemp(rtyp): op(c, dest, n, m)
+          # is in range. For proper lowering later on, the intermediate
+          # temporary must use the *underlying* type, not the range/enum type
+          let
+            tmpTyp = c.typeToMir(typ.skipTypes(abstractRange + {tyEnum}))
+            val = c.wrapTemp(tmpTyp): op(c, dest, n, m)
           c.buildDefectMagicCall mChckRange, rtyp:
             c.emitByVal val
             c.emitByVal toIntLiteral(c.env, firstOrd(c.graph.config, typ), typ)
diff --git a/compiler/mir/mirpasses.nim b/compiler/mir/mirpasses.nim
index 3fb33dea804..cd90cbb3d58 100644
--- a/compiler/mir/mirpasses.nim
+++ b/compiler/mir/mirpasses.nim
@@ -23,6 +23,7 @@ import
     mirconstr,
     mirtrees,
     mirtypes,
+    rtchecks,
     sourcemaps
   ],
   compiler/modules/[
@@ -639,6 +640,7 @@ proc applyPasses*(body: var MirBody, prc: PSym, env: var MirEnv,
 
     if target == targetC:
       lowerNew(body.code, graph, env, c)
+      lowerChecks(body.code, graph, env, c)
       injectStrPreparation(body.code, graph, env, c)
 
   # instrument the body with profiler calls after all lowerings, but before
diff --git a/compiler/mir/rtchecks.nim b/compiler/mir/rtchecks.nim
new file mode 100644
index 00000000000..17ec42baa07
--- /dev/null
+++ b/compiler/mir/rtchecks.nim
@@ -0,0 +1,192 @@
+## Implements the MIR passes for lowering the various run-time check magic
+## calls into comparisons + calls to runtime procedures. The lowerings are only
+## applicable for backends using the runtime for C-like targets.
+
+import
+  std/[
+    options
+  ],
+  compiler/ast/[
+    ast_types,
+    ast_query,
+    lineinfos,
+    types
+  ],
+  compiler/modules/[
+    modulegraphs,
+    magicsys
+  ],
+  compiler/mir/[
+    mirchangesets,
+    mirconstr,
+    mirenv,
+    mirtrees,
+    mirtypes
+  ],
+  compiler/utils/[
+    int128,
+    idioms
+  ]
+
+# shorten some common parameter declarations:
+using
+  tree: MirTree
+  call: NodePosition
+  graph: ModuleGraph
+  bu: var MirBuilder
+  env: var MirEnv
+
+template subTree(bu; k: MirNodeKind, t: TypeId, body: untyped) =
+  bu.subTree MirNode(kind: k, typ: t):
+    body
+
+template buildIf(bu; cond: Value, body: untyped) =
+  bu.subTree mnkIf:
+    bu.use cond
+    body
+
+template buildIfNot(bu; cond: Value, body: untyped) =
+  let c = bu.wrapTemp BoolType:
+    bu.buildMagicCall mNot, BoolType:
+      bu.emitByVal cond
+
+  bu.subTree mnkIf:
+    bu.use c
+    body
+
+template emitCall(bu; tree; call; prc: ProcedureId, arguments: untyped) =
+  ## Emits a void call of `prc`, inheriting the checked-ness from `call`.
+  bu.subTree mnkVoid:
+    # if the input call is a checked call, so is the new call
+    bu.subTree tree[call].kind, VoidType:
+      bu.add procNode(prc) # callee
+      arguments # custom arguments
+
+proc addCompilerProc(env; graph; name: string): ProcedureId =
+  env.procedures.add(graph.getCompilerProc(name))
+
+proc getInt(env: MirEnv, n: MirNode): Int128 =
+  case n.kind
+  of mnkIntLit:  toInt128 env.getInt(n.number)
+  of mnkUIntLit: toInt128 env.getUInt(n.number)
+  else:          unreachable()
+
+proc emitRangeCheck(tree, call, graph, env, bu): Value =
+  ## Emits the lowered version of range check `call`. A range check amounts to
+  ## ``if val < a or b < val: raise``, but with comparisons always yielding
+  ## false optimized away.
+  proc comparison(bu; magic: TMagic, val: Value;
+                  lo, hi: Option[Value]): Value {.nimcall.} =
+    if lo.isSome:
+      # ``cond = val < lo``
+      result = bu.wrapTemp BoolType:
+        bu.buildMagicCall magic, BoolType:
+          bu.emitByVal val
+          bu.emitByVal lo.unsafeGet
+
+    if hi.isSome:
+      if lo.isSome:
+        # ``if not cond: cond = hi < val``
+        bu.buildIfNot result:
+          bu.subTree mnkAsgn:
+            bu.use result
+            bu.buildMagicCall magic, BoolType:
+              bu.emitByVal hi.unsafeGet
+              bu.emitByVal val
+      else:
+        # ``cond = hi < val``
+        result = bu.wrapTemp BoolType:
+          bu.buildMagicCall magic, BoolType:
+            bu.emitByVal hi.unsafeGet
+            bu.emitByVal val
+
+  let
+    input   = tree.argument(call, 0)
+    lowVal  = tree.argument(call, 1)
+    highVal = tree.argument(call, 2)
+    outType = env[tree[call].typ].skipTypes(abstractRange)
+
+  var inType = env[tree[input].typ]
+  if inType.sym != nil and sfSystemModule in inType.sym.owner.flags and
+     inType.sym.name.s == "csize":
+    # redirect the underlying type of csize to uint
+    # HACK: this works around the ``system.csize`` definition using the wrong
+    #       underlying type (int instead of uint)
+    inType = graph.getSysType(unknownLineInfo, tyUInt)
+
+  result = bu.inline(tree, NodePosition input)
+
+  let
+    lo  = bu.inline(tree, NodePosition lowVal)
+    hi  = bu.inline(tree, NodePosition highVal)
+
+  var cond: Value
+  if outType.kind in {tyFloat, tyFloat32, tyFloat64}:
+    # float range checks are a bit special -- the operand is converted to the
+    # target type *first*
+    result = bu.wrapTemp tree[call].typ:
+      bu.subTree mnkConv, tree[call].typ:
+        bu.use result
+
+    cond = comparison(bu, mLtF64, result, some(lo), some(hi))
+  else:
+    # only the bounds where a range error is possible need to be checked. For
+    # the comparisons, the literal values representing the bounds need to be
+    # converted to the input type first. Since the guaranteed-to-be-false
+    # comparisons are omitted, this conversion is guaranteed to be safe (no
+    # out-of-range error is possible)
+    let
+      lo =
+        if firstOrd(graph.config, inType) < env.getInt(tree[lowVal]):
+          some literal(tree[lowVal].kind, tree[lowVal].number, result.typ)
+        else:
+          none Value # low(in) >= lo -> no check needed
+      hi =
+        if lastOrd(graph.config, inType) > env.getInt(tree[highVal]):
+          some literal(tree[highVal].kind, tree[highVal].number, result.typ)
+        else:
+          none Value # high(in) <= hi -> no check needed
+
+    # if both checks can be omitted, no range check call should have been
+    # emitted in the first place
+    assert not(lo.isNone and hi.isNone)
+
+    let magic = getMagicLessForType(inType.skipTypes(abstractRange)).lt
+    cond = comparison(bu, magic, result, lo, hi)
+
+  bu.buildIf cond:
+    if inType.skipTypes(abstractRange).kind in {tyUInt, tyUInt64}:
+      # the value could be outside the representable range for the raise
+      # procedure's parameter, so use the no-args one
+      bu.emitCall(tree, call, env.addCompilerProc(graph, "raiseRangeErrorNoArgs")):
+        discard
+    else:
+      let raiser =
+        case outType.kind
+        of tyUInt..tyUInt64, tyChar: "raiseRangeErrorU"
+        of tyFloat..tyFloat64:       "raiseRangeErrorF"
+        else:                        "raiseRangeErrorI"
+
+      # XXX: result isn't necessarily correctly typed for the call argument...
+      bu.emitCall(tree, call, env.addCompilerProc(graph, raiser)):
+        bu.emitByVal result
+        bu.emitByVal lo
+        bu.emitByVal hi
+
+proc lowerChecks*(tree; graph; env; changes: var Changeset) =
+  ## Lowers all magic calls implementing the run-time checks.
+  for i, n in tree.pairs:
+    if n.kind == mnkMagic:
+      case n.magic
+      of mChckRange:
+        let call = tree.parent(i)
+        var tmp: Value
+        # insert the range check before the statement:
+        changes.insert(tree, tree.parent(call), call, bu):
+          tmp = emitRangeCheck(tree, call, graph, env, bu)
+        # replace the original call expression with a conversion:
+        changes.replaceMulti(tree, call, bu):
+          bu.subTree mnkConv, tree[call].typ:
+            bu.use tmp
+      else:
+        discard "not relevant"
diff --git a/compiler/modules/magicsys.nim b/compiler/modules/magicsys.nim
index 17a8c85814a..ab145148148 100644
--- a/compiler/modules/magicsys.nim
+++ b/compiler/modules/magicsys.nim
@@ -180,20 +180,24 @@ func getMagicEqForType*(t: PType): TMagic =
   else:
     unreachable(t.kind)
 
-func getMagicLeForType*(t: PType): TMagic =
-  ## Returns the ``mLeX`` magic for the given type `t`.
+func getMagicLessForType*(t: PType): tuple[le, lt: TMagic] =
+  ## Returns the ``mLeX`` and ``mLtX`` magic for type `t`.
   case t.kind
   of tyInt, tyInt8, tyInt16, tyInt32, tyInt64,
      tyUInt, tyUInt8, tyUInt16, tyUInt32, tyUInt64:
-    mLeI
-  of tyEnum:   mLeEnum
-  of tyBool:   mLeB
-  of tyString: mLeStr
-  of tyChar:   mLeCh
-  of tySet:    mLeSet
+    (mLeI, mLtI)
+  of tyEnum:   (mLeEnum, mLtEnum)
+  of tyBool:   (mLeB,    mLtB)
+  of tyString: (mLeStr,  mLtStr)
+  of tyChar:   (mLeCh,   mLtCh)
+  of tySet:    (mLeSet,  mLtSet)
   else:
     unreachable(t.kind)
 
+template getMagicLeForType*(t: PType): TMagic =
+  ## Returns the ``mLeX`` magic for the given type `t`.
+  getMagicLessForType(t).le
+
 proc getMagicEqSymForType*(g: ModuleGraph; t: PType; info: TLineInfo): PSym =
   let magic = getMagicEqForType(t)
   result = getSysMagic(g, info, "==", magic)
diff --git a/tests/misc/trangechecks.nim b/tests/misc/trangechecks.nim
index 3b4a92b6d2a..8d0454c0734 100644
--- a/tests/misc/trangechecks.nim
+++ b/tests/misc/trangechecks.nim
@@ -55,4 +55,11 @@ static:
   proc f(x: range[1..4]) =
     discard
 
-  doAssert not compiles(f(0))
\ No newline at end of file
+  doAssert not compiles(f(0))
+
+block unsigned_64_bit_to_range_conversion:
+  # regression test to make sure a uint/uint64 to integer range conversion
+  # checks the target range's lower bound
+  var x: uint64 = 0
+  doAssertRaises RangeDefect:
+    discard range[1..high(int)](x)

From 57f22ed2b2ab135707a7c6da62279daf20a408a0 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Wed, 1 May 2024 23:59:08 +0200
Subject: [PATCH 079/169] support multiple external C files having the same
 name (#1295)

## Summary

Adding multiple C files sharing the same name to the build via the
`compile` pragma is now supported.

Closes https://github.com/nim-works/nimskull/issues/1291.

## Details

For the non-pattern `compile` pragma, the C file name is turned into a
unique object file name via `withPackageName`, mirroring what the C
backend does for the C files it generates.

To prevent the object files for the external C files from colliding
with the NimSkull module object files, they're placed under the
`external` sub-directory within the cache directory.
---
 compiler/backend/extccomp.nim     |  5 +++++
 compiler/front/options.nim        | 13 +++++++++++++
 compiler/sem/pragmas.nim          |  5 ++++-
 tests/pragmas/sub/cfunction.c     |  3 +++
 tests/pragmas/tcompile_pragma.nim |  9 +++++++--
 5 files changed, 32 insertions(+), 3 deletions(-)
 create mode 100644 tests/pragmas/sub/cfunction.c

diff --git a/compiler/backend/extccomp.nim b/compiler/backend/extccomp.nim
index 57392890d3c..d77a409a977 100644
--- a/compiler/backend/extccomp.nim
+++ b/compiler/backend/extccomp.nim
@@ -393,6 +393,11 @@ proc toObjFile*(conf: ConfigRef; filename: AbsoluteFile): AbsoluteFile =
   # Object file for compilation
   result = AbsoluteFile(filename.string & "." & CC[conf.cCompiler].objExt)
 
+proc externalObjFile*(conf: ConfigRef; cfile: AbsoluteFile): AbsoluteFile =
+  ## Returns the path of the object file to output for the external C file
+  ## `cfile`.
+  result = toObjFile(conf, completeGeneratedExtFilePath(conf, cfile))
+
 proc addFileToCompile*(conf: ConfigRef; cf: Cfile) =
   conf.toCompile.add(cf)
 
diff --git a/compiler/front/options.nim b/compiler/front/options.nim
index 3fffa7d55c2..9b7629d0c44 100644
--- a/compiler/front/options.nim
+++ b/compiler/front/options.nim
@@ -1300,6 +1300,19 @@ proc completeGeneratedFilePath*(conf: ConfigRef; f: AbsoluteFile,
   result = subdir / RelativeFile f.string.splitPath.tail
   #echo "completeGeneratedFilePath(", f, ") = ", result
 
+proc completeGeneratedExtFilePath*(conf: ConfigRef, f: AbsoluteFile
+                                  ): AbsoluteFile =
+  ## Returns the absolute file path within the cache directory for file `f`.
+  ## This procedure is meant to be used for external files with names not
+  ## controlled by the compiler -- a sub-directory is used to prevent
+  ## collisions.
+  let subdir = getNimcacheDir(conf.active) / RelativeDir("external")
+  try:
+    createDir(subdir.string)
+  except OSError:
+    conf.quitOrRaise "cannot create directory: " & subdir.string
+  result = subdir / RelativeFile(f.string.splitPath.tail)
+
 proc toRodFile*(conf: ConfigRef; f: AbsoluteFile; ext = RodExt): AbsoluteFile =
   result = changeFileExt(completeGeneratedFilePath(conf,
     withPackageName(conf, f)), ext)
diff --git a/compiler/sem/pragmas.nim b/compiler/sem/pragmas.nim
index 4a2ad2d0f0a..58b479b0be3 100644
--- a/compiler/sem/pragmas.nim
+++ b/compiler/sem/pragmas.nim
@@ -775,7 +775,10 @@ proc processCompile(c: PContext, n: PNode): PNode =
         found = findFile(c.config, file)
         if found.isEmpty: found = AbsoluteFile file
 
-    let obj = toObjFile(c.config, completeCfilePath(c.config, found, false))
+    # prepend the package name derived from the file path to `found`, in order
+    # to prevent name collisions when there are multiple external C files with
+    # the same name
+    let obj = externalObjFile(c.config, withPackageName(c.config, found))
     docompile(c, n, found, obj, (if n.len == 2: "" else: result[2].strVal))
   else:
     # too many arguments
diff --git a/tests/pragmas/sub/cfunction.c b/tests/pragmas/sub/cfunction.c
new file mode 100644
index 00000000000..fe61e7b9623
--- /dev/null
+++ b/tests/pragmas/sub/cfunction.c
@@ -0,0 +1,3 @@
+int cfunction2(void) {
+  return NUMBER_HERE;
+}
diff --git a/tests/pragmas/tcompile_pragma.nim b/tests/pragmas/tcompile_pragma.nim
index 4e09a7501a0..c261fa0a966 100644
--- a/tests/pragmas/tcompile_pragma.nim
+++ b/tests/pragmas/tcompile_pragma.nim
@@ -1,9 +1,14 @@
 discard """
-  output: '''34'''
+  description: "Tests for the `compile` pragma"
+  targets: "c"
 """
 
 {.compile("cfunction.c", "-DNUMBER_HERE=34").}
+# ensure that compiling a second C file with the same name works:
+{.compile("sub/cfunction.c", "-DNUMBER_HERE=1").}
 
 proc cfunction(): cint {.importc.}
+proc cfunction2(): cint {.importc.}
 
-echo cfunction()
+doAssert cfunction() == 34
+doAssert cfunction2() == 1

From f244f3d2733b7d4eaf34bc27949033aec7347afa Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Thu, 2 May 2024 20:04:02 +0200
Subject: [PATCH 080/169] fix(vmgen): string literal changing at run-time
 (#1296)

## Summary

Fix a string literal's underlying storage being modified when passing
a string literal to a `sink string` parameter, where the parameter is
modified within the callee. Only the VM backend was affected.

## Details

No copy of the string literal (which was lifted into a constant
earlier) is created for string literals passed to `sink` parameters.
This is not a problem for the C (copy-on-write strings are used) and
JS backend (a new run-time string instance is created on each string
literal usage), but it is for the VM backend.

Without a copy, the callee can directly modify the constant string's
underlying character storage, affecting all string literal usage
throughout the program.

`mirgen` should introduce an intermediate temporary for the argument in
this case, but - at the moment - doing so would lead to worse code
generation for all code generators, so the problem is worked around in
`vmgen`, by creating a copy of the string constant when passed to a
`sink string` parameter.
---
 compiler/vm/vmgen.nim                         | 10 ++++++++++
 .../lang_types/sink/tsink_string_literal.nim  | 20 +++++++++++++++++++
 2 files changed, 30 insertions(+)
 create mode 100644 tests/lang_types/sink/tsink_string_literal.nim

diff --git a/compiler/vm/vmgen.nim b/compiler/vm/vmgen.nim
index f33cb4dd837..68b0da05ddb 100644
--- a/compiler/vm/vmgen.nim
+++ b/compiler/vm/vmgen.nim
@@ -1184,6 +1184,16 @@ proc genCall(c: var TCtx; n: CgNode; dest: var TDest) =
       let tmp = c.genx(n[i])
       c.gABC(n[i], opcAsgnComplex, r, tmp)
       c.freeTemp(tmp)
+    elif n[i].kind == cnkConst and i < fntyp.len and
+         fntyp[i].kind == tySink and fntyp[i][0].kind == tyString:
+      # HACK: passing a string literal (lifted into a constant) directly to a
+      #       sink parameter is wrong, since it allows the callee to modify the
+      #       constant data; a copy has to be introduced. This needs to
+      #       eventually be fixed in ``mirgen``, by introducing an intermediate
+      #       temporary for the argument
+      let tmp = c.genx(n[i])
+      c.gABC(n[i], opcAsgnComplex, r, tmp)
+      c.freeTemp(tmp)
     else:
       c.gen(n[i], r)
 
diff --git a/tests/lang_types/sink/tsink_string_literal.nim b/tests/lang_types/sink/tsink_string_literal.nim
new file mode 100644
index 00000000000..bf5f2242e37
--- /dev/null
+++ b/tests/lang_types/sink/tsink_string_literal.nim
@@ -0,0 +1,20 @@
+discard """
+  description: '''
+    Ensure string character data is not modified when passing a string literal
+    to a sink parameter
+  '''
+  targets: "c js vm"
+"""
+
+proc f_sink(x: sink string) =
+  x[0] = '0'
+
+# pass a string literal directly to a sink parameter:
+f_sink("abc")
+
+# the underlying constant string data storage must not have been
+# modified:
+proc test(x: string) =
+  doAssert x[0] == 'a'
+
+test("abc")

From b48e74b27dae81a2bba20b05a1b4818676b3cac1 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Thu, 2 May 2024 20:19:29 +0200
Subject: [PATCH 081/169] lower `mChckNaN` magic with MIR pass (#1297)

## Summary

Lower the `mChckNaN` magic with a MIR pass instead of as part of C
code generation, shrinking down `cgen`.

## Details

The lowering is integrated into `rtchecks.lowerChecks`, and is a
straightforward MIR port of how `cgen` handled the `mChckNaN` magic.
---
 compiler/backend/ccgexprs.nim |  7 -------
 compiler/mir/rtchecks.nim     | 23 +++++++++++++++++++++++
 2 files changed, 23 insertions(+), 7 deletions(-)

diff --git a/compiler/backend/ccgexprs.nim b/compiler/backend/ccgexprs.nim
index aca17171ecd..191c3370347 100644
--- a/compiler/backend/ccgexprs.nim
+++ b/compiler/backend/ccgexprs.nim
@@ -1645,13 +1645,6 @@ proc genMagicExpr(p: BProc, e: CgNode, d: var TLoc, op: TMagic) =
       typ.add "*"
 
     linefmt(p, cpsStmts, "$1 = ($2)($3);$n", [a.r, typ, rdLoc(b)])
-  of mChckNaN:
-    var a: TLoc
-    initLocExpr(p, e[1], a)
-    # NOTE: if the value is a signaling NaN, the comparison itself results in
-    #       a float-point exception (which might result in a trap)
-    linefmt(p, cpsStmts, "if ($1 != $1){ #raiseFloatInvalidOp(); $2}$n",
-            [rdLoc(a), raiseInstr(p, e.exit)])
   of mChckIndex:
     var arr, a: TLoc
     initLocExpr(p, e[1], arr)
diff --git a/compiler/mir/rtchecks.nim b/compiler/mir/rtchecks.nim
index 17ec42baa07..a2b863e4676 100644
--- a/compiler/mir/rtchecks.nim
+++ b/compiler/mir/rtchecks.nim
@@ -173,6 +173,24 @@ proc emitRangeCheck(tree, call, graph, env, bu): Value =
         bu.emitByVal lo
         bu.emitByVal hi
 
+proc emitNanCheck(tree; call; graph; env; bu) =
+  ## For ``chckNaN(val)`` emit:
+  ##   def _1 = eqF64(arg val, arg val)
+  ##   def _2 = not(arg _1)
+  ##   if _2:
+  ##     raiseFloatInvalidOp()
+  let cmp = bu.wrapTemp BoolType:
+    bu.buildMagicCall mEqF64, BoolType:
+      bu.subTree mnkArg:
+        bu.emitFrom(tree, NodePosition tree.argument(call, 0))
+      bu.subTree mnkArg:
+        bu.emitFrom(tree, NodePosition tree.argument(call, 0))
+
+  # if a float value is not equal to itself, it is not a number (=NaN)
+  bu.buildIfNot cmp:
+    bu.emitCall(tree, call, env.addCompilerProc(graph, "raiseFloatInvalidOp")):
+      discard
+
 proc lowerChecks*(tree; graph; env; changes: var Changeset) =
   ## Lowers all magic calls implementing the run-time checks.
   for i, n in tree.pairs:
@@ -188,5 +206,10 @@ proc lowerChecks*(tree; graph; env; changes: var Changeset) =
         changes.replaceMulti(tree, call, bu):
           bu.subTree mnkConv, tree[call].typ:
             bu.use tmp
+      of mChckNaN:
+        let call = tree.parent(i)
+        # make sure to take the ``mnkVoid`` wrapper into account
+        changes.replaceMulti(tree, tree.parent(call), bu):
+          emitNanCheck(tree, call, graph, env, bu)
       else:
         discard "not relevant"

From 6e8ab5a73e50896f33f562438e7c7de31877fd7b Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Thu, 2 May 2024 23:38:22 +0200
Subject: [PATCH 082/169] fix: `move` not resetting source location (#1293)

## Summary

Use a MIR pass to lower the `move` and `wasMoved` magic calls into
assignments, fixing `move` not always resetting the source location for
both the VM and JS backends. The C backend was not affected.

## Details

A `x = move(y)` call is now lowered into the following MIR:
```
x = move y
y = default()
```
and a `wasMoved(x)` call into:
```
x = default()
```
which is equivalent in behaviour to the code previously produced by
`cgen` -- using a shared MIR pass for the lowering ensures that the
behaviour is consistent across all backends.

The implementation of the two magics is removed from each code
generator, and a test for making sure `move` works correctly is added.

### Previous behaviour

For the VM backend, the source location was never reset on `move`,
while for the JS backend, the source location was reset with
`genericReset`, which left record-like locations empty (reading the
fields then yielded `undefined`) and ignored primitive types like int
or float.
---
 compiler/backend/ccgexprs.nim      | 19 -----------
 compiler/backend/jsgen.nim         | 22 -------------
 compiler/mir/mirpasses.nim         | 38 ++++++++++++++++++++++
 compiler/vm/vmgen.nim              | 51 ------------------------------
 tests/magics/tdestructive_move.nim | 19 +++++++++++
 tests/stdlib/os/tisolation.nim     | 42 +++++++++---------------
 6 files changed, 72 insertions(+), 119 deletions(-)
 create mode 100644 tests/magics/tdestructive_move.nim

diff --git a/compiler/backend/ccgexprs.nim b/compiler/backend/ccgexprs.nim
index 191c3370347..9900fee52f3 100644
--- a/compiler/backend/ccgexprs.nim
+++ b/compiler/backend/ccgexprs.nim
@@ -1470,23 +1470,6 @@ proc skipAddr(n: CgNode): CgNode =
   if n.kind == cnkHiddenAddr: n.operand
   else:                       n
 
-proc genWasMoved(p: BProc; n: CgNode) =
-  var a: TLoc
-  let n1 = n[1].skipAddr
-  if true:
-    initLocExpr(p, n1, a, {lfWantLvalue})
-    resetLoc(p, a)
-    #linefmt(p, cpsStmts, "#nimZeroMem((void*)$1, sizeof($2));$n",
-    #  [addrLoc(p.config, a), getTypeDesc(p.module, a.t)])
-
-proc genMove(p: BProc; n: CgNode; d: var TLoc) =
-  var a: TLoc
-  initLocExpr(p, n[1], a, {lfWantLvalue})
-  if true:
-    if d.k == locNone: getTemp(p, n.typ, d)
-    genAssignment(p, d, a)
-    resetLoc(p, a)
-
 proc genDestroy(p: BProc; n: CgNode) =
     let arg = n[1].skipAddr
     let t = arg.typ.skipTypes(abstractInst)
@@ -1629,8 +1612,6 @@ proc genMagicExpr(p: BProc, e: CgNode, d: var TLoc, op: TMagic) =
     initLocExpr(p, e[2], b)
     genDeepCopy(p, a, b)
   of mDotDot, mEqCString: genCall(p, e, d)
-  of mWasMoved: genWasMoved(p, e)
-  of mMove: genMove(p, e, d)
   of mDestroy: genDestroy(p, e)
   of mAccessTypeField: genAccessTypeField(p, e, d)
   of mTrace: discard "no code to generate"
diff --git a/compiler/backend/jsgen.nim b/compiler/backend/jsgen.nim
index e636ffe2688..cecdc04eb8a 100644
--- a/compiler/backend/jsgen.nim
+++ b/compiler/backend/jsgen.nim
@@ -1732,25 +1732,6 @@ proc genDefault(p: PProc, n: CgNode; r: var TCompRes) =
   else:
     r.res = createVar(p, n.typ, indirect = false)
 
-proc genReset(p: PProc, n: CgNode) =
-  var x: TCompRes
-  useMagic(p, "genericReset")
-  gen(p, n[1], x)
-  if x.typ == etyBaseIndex:
-    lineF(p, "$1 = null, $2 = 0;$n", [x.address, x.res])
-  else:
-    lineF(p, "$1 = genericReset($1, $2);$n", [x.rdLoc,
-                  genTypeInfo(p, n[1].typ)])
-
-proc genMove(p: PProc; n: CgNode; r: var TCompRes) =
-  var a: TCompRes
-  r.kind = resVal
-  r.res = p.getTemp()
-  gen(p, n[1], a)
-  lineF(p, "$1 = $2;$n", [r.rdLoc, a.rdLoc])
-  genReset(p, n)
-  #lineF(p, "$1 = $2;$n", [dest.rdLoc, src.rdLoc])
-
 proc genJSArrayConstr(p: PProc, n: CgNode, r: var TCompRes) =
   var a: TCompRes
   r.res = rope("[")
@@ -1894,7 +1875,6 @@ proc genMagic(p: PProc, n: CgNode, r: var TCompRes) =
   of mNewSeqOfCap: unaryExpr(p, n, r, "", "[]")
   of mOf: genOf(p, n, r)
   of mDefault: genDefault(p, n, r)
-  of mWasMoved: genReset(p, n)
   of mEcho: genEcho(p, n, r)
   of mNLen..mNError:
     localReport(p.config, n.info, reportSym(
@@ -1908,8 +1888,6 @@ proc genMagic(p: PProc, n: CgNode, r: var TCompRes) =
   of mParseBiggestFloat:
     useMagic(p, "nimParseBiggestFloat")
     genCall(p, n, r)
-  of mMove:
-    genMove(p, n, r)
   # of mAccessEnv:
   #   unaryExpr(p, n, r, "accessEnv", "accessEnv($1)")
   of mFinished:
diff --git a/compiler/mir/mirpasses.nim b/compiler/mir/mirpasses.nim
index cd90cbb3d58..c67db569866 100644
--- a/compiler/mir/mirpasses.nim
+++ b/compiler/mir/mirpasses.nim
@@ -608,6 +608,43 @@ proc injectStrPreparation(tree: MirTree, graph: ModuleGraph, env: var MirEnv,
     else:
       discard "not relevant"
 
+proc lowerMove(tree: MirTree, changes: var Changeset) =
+  ## Lowers ``mMove`` and ``mWasMoved`` magic calls.
+  for i in search(tree, {mnkMagic}):
+    case tree[i].magic
+    of mMove:
+      # lower ``def x = move(name y)`` into:
+      #   def x = move y
+      #   y = default() # essentially ``wasMoved(y)``
+      let
+        call = tree.parent(i)
+        arg  = NodePosition tree.argument(call, 0)
+        stmt = getStmt(tree, call)
+      # the argument expression is stable, so there's no need to bind it
+      changes.replaceMulti(tree, call, bu):
+        bu.subTree mnkMove, tree[call].typ:
+          bu.emitFrom(tree, arg)
+      # emit the default-assignment after the move call:
+      changes.insert(tree, tree.sibling(stmt), call, bu):
+        bu.subTree mnkAsgn:
+          bu.emitFrom(tree, arg)
+          bu.buildMagicCall mDefault, tree[call].typ:
+            discard
+    of mWasMoved:
+      # lower ``wasMoved(name x)`` into:
+      #   x = default()
+      let
+        call = tree.parent(i)
+        arg  = NodePosition tree.argument(call, 0)
+        stmt = getStmt(tree, call)
+      changes.replaceMulti(tree, stmt, bu):
+        bu.subTree mnkAsgn:
+          bu.emitFrom(tree, arg)
+          bu.buildMagicCall mDefault, tree[arg].typ:
+            discard
+    else:
+      discard "not relevant"
+
 proc applyPasses*(body: var MirBody, prc: PSym, env: var MirEnv,
                   graph: ModuleGraph, target: TargetBackend) =
   ## Applies all applicable MIR passes to the body (`tree` and `source`) of
@@ -633,6 +670,7 @@ proc applyPasses*(body: var MirBody, prc: PSym, env: var MirEnv,
       injectResultInit(body.code, body[resultId].typ, c)
 
     lowerSwap(body.code, c)
+    lowerMove(body.code, c)
     if target == targetVm:
       # only the C and VM targets need the extraction, and only the VM
       # requires the extraction for cstring literals
diff --git a/compiler/vm/vmgen.nim b/compiler/vm/vmgen.nim
index 68b0da05ddb..d7ac4e017dd 100644
--- a/compiler/vm/vmgen.nim
+++ b/compiler/vm/vmgen.nim
@@ -1770,29 +1770,6 @@ func fitsRegister(t: PType): bool =
   st.kind in { tyBool, tyInt..tyUInt64, tyChar, tyPtr, tyPointer} or
     (st.sym != nil and st.sym.magic == mPNimrodNode) # NimNode goes into register too
 
-func usesRegister(c: TCtx, n: CgNode): bool =
-  ## Analyses and returns whether the value of the location named by l-value
-  ## expression `n` is stored in a register instead of a memory location
-  # XXX: instead of using a separate analysis, compute and return this as part
-  #      of ``genLValue`` and
-  case n.kind
-  of cnkLocal:
-    usesRegister(c, n.local)
-  of cnkProc, cnkConst, cnkGlobal:
-    false
-  of cnkDeref, cnkDerefView, cnkFieldAccess, cnkArrayAccess, cnkTupleAccess,
-     cnkLvalueConv, cnkObjDownConv, cnkObjUpConv:
-    false
-  else:
-    unreachable(n.kind)
-
-proc genNoLoad(c: var TCtx, n: CgNode): tuple[reg: TRegister, isDirect: bool] =
-  ## Similar to ``genLValue``, but also returns whether the register storing
-  ## the result stores a handle or a value.
-  var dest = noDest
-  genLvalue(c, n, dest)
-  result = (TRegister(dest), usesRegister(c, n))
-
 proc genMagic(c: var TCtx; n: CgNode; dest: var TDest; m: TMagic) =
   case m
   of mSubI:
@@ -2016,19 +1993,6 @@ proc genMagic(c: var TCtx; n: CgNode; dest: var TDest; m: TMagic) =
     c.freeTemp(tmp1)
     c.freeTemp(tmp2)
     c.freeTemp(tmp3)
-  of mWasMoved:
-    unused(c, n, dest)
-    let
-      (dest, isDirect) = genNoLoad(c, n[1])
-      typ = n[1].typ.skipTypes({tyVar, tyLent})
-
-    if isDirect:
-      # the location uses a register -> load it with the empty value
-      c.gABx(n, opcLdNullReg, dest, c.genType(typ))
-    else:
-      c.gABx(n, opcReset, dest, c.genType(typ))
-
-    c.freeTemp(dest)
   of mDefault:
     if fitsRegister(n.typ):
       prepare(c, dest, n.typ)
@@ -2213,21 +2177,6 @@ proc genMagic(c: var TCtx; n: CgNode; dest: var TDest; m: TMagic) =
   of mRunnableExamples:
     discard "just ignore any call to runnableExamples"
   of mDestroy, mTrace: discard "ignore calls to the default destructor"
-  of mMove:
-    let arg = n[1]
-    if fitsRegister(n.typ):
-      gen(c, arg, dest)
-    else:
-      assert dest != noDest
-      let tmp = genLvalue(c, arg)
-      # perform a normal copy
-      c.gABC(n, opcWrLoc, dest, tmp)
-      c.freeTemp(tmp)
-    # XXX use ldNullOpcode() here?
-    # Don't zero out the arg for now #17199
-    # c.gABx(n, opcLdNull, a, c.genType(arg.typ))
-    # c.gABx(n, opcNodeToReg, a, a)
-    # c.genAsgnPatch(arg, a)
   of mNodeId:
     c.genUnaryABC(n, dest, opcNodeId)
   of mFinished:
diff --git a/tests/magics/tdestructive_move.nim b/tests/magics/tdestructive_move.nim
new file mode 100644
index 00000000000..c05a8a81af1
--- /dev/null
+++ b/tests/magics/tdestructive_move.nim
@@ -0,0 +1,19 @@
+discard """
+  description: "Ensure that a `move` resets the source location"
+  targets: "c js vm"
+"""
+
+type Object = object
+  a, b: int
+
+# test with primitive type:
+var a = 1
+let b = move(a)
+doAssert b == 1
+doAssert a == 0
+
+# test with aggregate type:
+var c = Object(a: 1, b: 2)
+let d = move(c)
+doAssert d.a == 1 and d.b == 2
+doAssert c.a == 0 and c.b == 0
diff --git a/tests/stdlib/os/tisolation.nim b/tests/stdlib/os/tisolation.nim
index ccc31dce25f..00821408541 100644
--- a/tests/stdlib/os/tisolation.nim
+++ b/tests/stdlib/os/tisolation.nim
@@ -6,7 +6,7 @@ import std/[isolation, json]
 
 
-proc main(moveZeroesOut: static bool) =
+proc main() =
   block:
     type
       Empty = ref object
@@ -18,76 +18,64 @@ proc main(moveZeroesOut: static bool) =
   block: # string literals
     var data = isolate("string")
     doAssert data.extract == "string"
-    if moveZeroesOut:
-      doAssert data.extract == ""
+    doAssert data.extract == ""
 
   block: # string literals
     var data = isolate("")
     doAssert data.extract == ""
-    if moveZeroesOut:
-      doAssert data.extract == ""
+    doAssert data.extract == ""
 
   block:
     var src = "string"
     var data = isolate(move src)
     doAssert data.extract == "string"
-    if moveZeroesOut:
-      doAssert src.len == 0
+    doAssert src.len == 0
 
   block: # int literals
     var data = isolate(1)
     doAssert data.extract == 1
-    if moveZeroesOut:
-      doAssert data.extract == 0
+    doAssert data.extract == 0
 
   block: # float literals
     var data = isolate(1.6)
     doAssert data.extract == 1.6
-    if moveZeroesOut:
-      doAssert data.extract == 0.0
+    doAssert data.extract == 0.0
 
   block:
     var data = isolate(@["1", "2"])
     doAssert data.extract == @["1", "2"]
-    if moveZeroesOut:
-      doAssert data.extract == @[]
+    doAssert data.extract == @[]
 
   block:
     var data = isolate(@["1", "2", "3", "4", "5"])
     doAssert data.extract == @["1", "2", "3", "4", "5"]
-    if moveZeroesOut:
-      doAssert data.extract == @[]
+    doAssert data.extract == @[]
 
   block:
     var data = isolate(@["", ""])
     doAssert data.extract == @["", ""]
-    if moveZeroesOut:
-      doAssert data.extract == @[]
+    doAssert data.extract == @[]
 
   block:
     var src = @["1", "2"]
     var data = isolate(move src)
     doAssert data.extract == @["1", "2"]
-    if moveZeroesOut:
-      doAssert src.len == 0
+    doAssert src.len == 0
 
   block:
     var data = isolate(@[1, 2])
     doAssert data.extract == @[1, 2]
-    if moveZeroesOut:
-      doAssert data.extract == @[]
+    doAssert data.extract == @[]
 
   block:
     var data = isolate(["1", "2"])
     doAssert data.extract == ["1", "2"]
-    if moveZeroesOut:
-      doAssert data.extract == ["", ""]
+    doAssert data.extract == ["", ""]
 
   block:
     var data = isolate([1, 2])
     doAssert data.extract == [1, 2]
-    if moveZeroesOut:
-      doAssert data.extract == [0, 0]
+    doAssert data.extract == [0, 0]
 
   block:
     type
@@ -130,5 +118,5 @@ proc main(moveZeroesOut: static bool) =
     doAssert $x == """@[(value: "1234")]"""
 
 
-static: main(moveZeroesOut = false)
-main(moveZeroesOut = true)
+static: main()
+main()

From f41aafcb3eae78c693face210ee54795d26a5324 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Mon, 6 May 2024 20:12:05 +0200
Subject: [PATCH 083/169] fix(sem): issues with method-call syntax in templates
 (#1298)

## Summary

Fix two issues with the method-call syntax in non-dirty templates:
* non-overloaded symbols weren't bound early, falling back to late
  binding (https://github.com/nim-works/nimskull/issues/1292)
* gensym'ed symbols couldn't be used as the callee

## Details

### `semTemplBody` restructuring

Restructure `semTemplBody` so that the `TemplCtx.noGenSym` field
becomes unnecessary:
* the name part of `nkExprColonExpr`/`nkExprEqExpr` can only bind to
  template parameters, so `qualifiedLookUp` is used directly
* resolving an identifier to a symbol or symbol choice is moved to
  `templBindSym`
* for dot expressions (`a.b`), handling symbol binding for the `b` part
  is done manually via symbol lookup + `templBindSym`

### Missing early binding

* if `b` in `a.b` is a non-overloaded symbol, wrap it in a symbol-
  choice, to prevent `dotTransformation` from discarding it again
* for backwards-compatibility an *open* symbol choice is used in this
  case, not a *closed* one (non-overloaded symbols are closed by
  default)
* a `knownIssue` test is added for the incorrect symbol binding in dot
  expressions (`tclosed_symbol_with_method_call`)

### Bind `gensym` symbols

* if `b` in `a.b` resolves to a gensym, the symbol is now bound
* only routine, type, and generic parameter symbols are bound for `b`
  in `a.b`. This prevents incorrect symbol binding in cases such as
  `var x = 1; a.x = 2`
* to still allow `a.b` resolving to a field access even if a gensym was
  bound to `b` (and later turned into `b'gensym` identifier),
  `builtInFieldAccess` and `propertyWriteAccess` strip the `'gensym`
  suffix from the identifier before trying to use it
* so that rendering of custom string literals (which reach `sem` as
  `(DotExpr (...) (Ident 'suffix))`) stays the same,
  `renderer.isCustomLit` has to account for symbol-choices in the
  second slot

A bug with `symChoice` uncovered by the other changes is fixed: gensyms
were added to the symbol choice, even if `isField` (now renamed to the
more accurately named `noGenSyms`) was true.

### Misc

* various comments documenting issues with how the symbol binding works
  are added
---
 compiler/ast/renderer.nim                     |  10 +-
 compiler/sem/sem.nim                          |   1 +
 compiler/sem/semexprs.nim                     |  14 +-
 compiler/sem/semtempl.nim                     | 158 +++++++++++-------
 doc/manual.rst                                |  35 ----
 .../template/mmethod_call_symbol_binding.nim  |   5 +
 .../tclosed_symbol_with_method_call.nim       |  26 +++
 .../template/template_issues.nim              |  16 ++
 .../template/tmethod_call_symbol_binding.nim  |  12 ++
 9 files changed, 174 insertions(+), 103 deletions(-)
 create mode 100644 tests/lang_callable/template/mmethod_call_symbol_binding.nim
 create mode 100644 tests/lang_callable/template/tclosed_symbol_with_method_call.nim
 create mode 100644 tests/lang_callable/template/tmethod_call_symbol_binding.nim

diff --git a/compiler/ast/renderer.nim b/compiler/ast/renderer.nim
index 991c0113756..d45eaae4aa3 100644
--- a/compiler/ast/renderer.nim
+++ b/compiler/ast/renderer.nim
@@ -958,9 +958,13 @@ proc infixArgument(g: var TSrcGen, n: PNode, i: int) =
   if needsParenthesis:
     put(g, tkParRi, ")")
 
-proc isCustomLit(n: PNode): bool =
+proc isCustomLit(n: PNode, g: TSrcGen): bool =
   if n.len == 2 and n[0].kind == nkRStrLit:
-    let ident = n[1].getPIdent
+    let ident =
+      if n[1].kind in nkSymChoices:
+        getPIdent(n[1][0])
+      else:
+        getPIdent(n[1])
     result = ident != nil and ident.s.startsWith('\'')
 
 proc gsub(g: var TSrcGen, n: PNode, c: TContext, fromStmtList = false) =
@@ -1187,7 +1191,7 @@ proc gsub(g: var TSrcGen, n: PNode, c: TContext, fromStmtList = false) =
     gcomma(g, n, c)
     put(g, tkBracketRi, "]")
   of nkDotExpr:
-    if isCustomLit(n):
+    if isCustomLit(n, g):
       put(g, tkCustomLit, n[0].strVal)
       gsub(g, n, 1)
     else:
diff --git a/compiler/sem/sem.nim b/compiler/sem/sem.nim
index 381526fdea4..4a3d75c9cf8 100644
--- a/compiler/sem/sem.nim
+++ b/compiler/sem/sem.nim
@@ -12,6 +12,7 @@
 import
   std/[
     strutils,
+    hashes,
     math,
     strtabs,
     intsets,
diff --git a/compiler/sem/semexprs.nim b/compiler/sem/semexprs.nim
index 5c74f0625ad..7a5ab7a6dc7 100644
--- a/compiler/sem/semexprs.nim
+++ b/compiler/sem/semexprs.nim
@@ -1716,6 +1716,16 @@ proc tryReadingTypeField(c: PContext, n: PNode, i: PIdent, ty: PType): PNode =
   else:
     result = tryReadingGenericParam(c, n, i, ty)
 
+proc originalName(cache: IdentCache, ident: PIdent): PIdent =
+  ## Returns the identifier stripped off of the '`gensym' suffix, if any.
+  let i = find(ident.s, '`')
+  if i != -1:
+    # if there's a backtick in the name, the name must come from a gensym'ed
+    # symbol. Strip the '`gensym' suffix
+    cache.getIdent(ident.s.cstring, i, hashIgnoreStyle(ident.s, 0, i - 1))
+  else:
+    ident
+
 proc builtinFieldAccess(c: PContext, n: PNode, flags: TExprFlags): PNode =
   ## returns nil if it's not a built-in field access
   checkSonsLen(n, 2, c.config)
@@ -1742,7 +1752,7 @@ proc builtinFieldAccess(c: PContext, n: PNode, flags: TExprFlags): PNode =
 
   n[0] = semExprWithType(c, n[0], flags)
   var
-    i = legacyConsiderQuotedIdent(c, n[1], n)
+    i = originalName(c.cache, legacyConsiderQuotedIdent(c, n[1], n))
     ty = n[0].typ
     f: PSym = nil
 
@@ -2067,7 +2077,7 @@ proc semArrayAccess(c: PContext, n: PNode, flags: TExprFlags): PNode =
     result = semExpr(c, result, flags)
 
 proc propertyWriteAccess(c: PContext, n, a: PNode): PNode =
-  var id = legacyConsiderQuotedIdent(c, a[1],a)
+  var id = originalName(c.cache, legacyConsiderQuotedIdent(c, a[1],a))
   var setterId = newIdentNode(getIdent(c.cache, id.s & '='), a[1].info)
   # a[0] is already checked for semantics, that does ``builtinFieldAccess``
   # this is ugly. XXX Semantic checking should use the ``nfSem`` flag for
diff --git a/compiler/sem/semtempl.nim b/compiler/sem/semtempl.nim
index 554c08ea14a..83c7817956d 100644
--- a/compiler/sem/semtempl.nim
+++ b/compiler/sem/semtempl.nim
@@ -94,7 +94,7 @@ type
     scClosed, scOpen, scForceOpen
 
 proc symChoice(c: PContext, n: PNode, s: PSym, r: TSymChoiceRule;
-               isField = false): PNode =
+               noGenSyms = false): PNode =
   var
     a: PSym
     o: TOverloadIter
@@ -112,11 +112,11 @@ proc symChoice(c: PContext, n: PNode, s: PSym, r: TSymChoiceRule;
     # XXX this makes more sense but breaks bootstrapping for now:
     # (s.kind notin routineKinds or s.magic != mNone):
     # for instance 'nextTry' is both in tables.nim and astalgo.nim ...
-    if not(isField and sfGenSym in s.flags):
+    if noGenSyms and sfGenSym in s.flags:
+      result = n
+    else:
       result = newSymNode(s, info)
       markUsed(c, info, s)
-    else:
-      result = n
   else:
     # semantic checking requires a type; `fitNode` deals with it
     # appropriately
@@ -125,7 +125,7 @@ proc symChoice(c: PContext, n: PNode, s: PSym, r: TSymChoiceRule;
     result = newNodeIT(kind, info, newTypeS(tyNone, c))
     a = initOverloadIter(o, c, n)
     while a != nil:
-      if a.kind != skModule and not(isField and sfGenSym in s.flags):
+      if a.kind != skModule and not(noGenSyms and sfGenSym in a.flags):
         incl(a.flags, sfUsed)
         markOwnerModuleAsUsed(c, a)
         result.add newSymNode(a, info)
@@ -215,7 +215,6 @@ type
     owner: PSym
     cursorInBody: bool # only for nimsuggest
     scopeN: int
-    noGenSym: int
     inTemplateHeader: int
 
 proc getIdentNode(c: var TemplCtx, n: PNode): PNode =
@@ -251,10 +250,13 @@ proc getIdentNode(c: var TemplCtx, n: PNode): PNode =
                   expectedKinds: {nkPostfix, nkPragmaExpr, nkIdent,
                                   nkAccQuoted}))
 
+func isTemplParam(c: TemplCtx, s: PSym): bool {.inline.} =
+  ## True if `s` is a parameter symbol of the current template.
+  s.kind == skParam and s.owner == c.owner and sfTemplateParam in s.flags
+
 func isTemplParam(c: TemplCtx, n: PNode): bool {.inline.} =
   ## True if `n` is a parameter symbol of the current template.
-  n.kind == nkSym and n.sym.kind == skParam and n.sym.owner == c.owner and
-    sfTemplateParam in n.sym.flags
+  n.kind == nkSym and isTemplParam(c, n.sym)
 
 func definitionTemplParam(c: TemplCtx, n: PNode): bool {.inline.} =
   ## True if `n` is an `untyped` parameter symbol of the current template.
@@ -418,19 +420,13 @@ proc semTemplSymbol(c: PContext, n: PNode, s: PSym; isField: bool): PNode =
         n           # Introduced in this pass! Leave it as an identifier.
   of OverloadableSyms-{skEnumField}:
     result = symChoice(c, n, s, scOpen, isField)
-  of skGenericParam:
-    if isField and sfGenSym in s.flags: result = n
-    else: result = newSymNodeTypeDesc(s, c.idgen, n.info)
+  of skType, skGenericParam:
+    result = newSymNodeTypeDesc(s, c.idgen, n.info)
   of skParam:
     result = n
-  of skType:
-    if isField and sfGenSym in s.flags: result = n
-    else: result = newSymNodeTypeDesc(s, c.idgen, n.info)
   else:
     if s.kind == skEnumField and overloadableEnums in c.features:
       result = symChoice(c, n, s, scOpen, isField)
-    elif isField and sfGenSym in s.flags:
-      result = n
     else:
       result = newSymNode(s, n.info)
     # Issue #12832
@@ -440,6 +436,22 @@ proc semTemplSymbol(c: PContext, n: PNode, s: PSym; isField: bool): PNode =
     if not isField and {optStyleHint, optStyleError} * c.config.globalOptions != {}:
       styleCheckUse(c.config, n.info, s)
 
+proc templBindSym(c: TemplCtx, s: PSym, n: PNode, isField: bool): PNode =
+  if contains(c.toBind, s.id):
+    result = symChoice(c.c, n, s, scClosed, isField)
+  elif contains(c.toMixin, s.name.id):
+    result = symChoice(c.c, n, s, scForceOpen, isField)
+  elif s.owner == c.owner and sfGenSym in s.flags:
+    # XXX: this is a tremendous hack. Symbol choices cannot contain
+    #      template-introduced gensyms, since gensym'ed symbols are turned
+    #      into identifiers during template evaluation. To at least support
+    #      basic usage of gensyms, they're bound directly. As a consequence,
+    #      overloads part of the definition scope won't be considered
+    incl(s.flags, sfUsed)
+    result = newSymNode(s, n.info)
+  else:
+    result = semTemplSymbol(c.c, n, s, isField)
+
 proc semRoutineInTemplName(c: var TemplCtx, n: PNode): PNode =
   ## Analyses the `namePos` in a routine-like occurring in a template body,
   ## producing a checked name node or an `nkError`.
@@ -626,21 +638,12 @@ proc semTemplBody(c: var TemplCtx, n: PNode): PNode =
       discard     # result is already set to n
     elif s.isError:
       result = s.ast
+    elif isTemplParam(c, s):
+      incl(s.flags, sfUsed)
+      result = newSymNode(s, n.info)
     else:
-      if s.owner == c.owner and s.kind == skParam and sfTemplateParam in s.flags:
-        incl(s.flags, sfUsed)
-        result = newSymNode(s, n.info)
-      elif contains(c.toBind, s.id):
-        result = symChoice(c.c, n, s, scClosed, c.noGenSym > 0)
-      elif contains(c.toMixin, s.name.id):
-        result = symChoice(c.c, n, s, scForceOpen, c.noGenSym > 0)
-      elif s.owner == c.owner and sfGenSym in s.flags and c.noGenSym == 0:
-        # template tmp[T](x: var seq[T]) =
-        # var yz: T
-        incl(s.flags, sfUsed)
-        result = newSymNode(s, n.info)
-      else:
-        result = semTemplSymbol(c.c, n, s, c.noGenSym > 0)
+      result = templBindSym(c, s, n, isField=false)
+
   of nkBind:
     result = semTemplBody(c, n[0])
   of nkBindStmt:
@@ -906,47 +909,76 @@ proc semTemplBody(c: var TemplCtx, n: PNode): PNode =
     # so we use the generic code for nkDotExpr too
     let s = qualifiedLookUp(c.c, n, {})
 
-    if s.isNil:
-      discard
-    elif s.isError:
-      result = s.ast
-    else:
-      # do not symchoice a quoted template parameter (bug #2390):
-      if s.owner == c.owner and s.kind == skParam and
-          n.kind == nkAccQuoted and n.len == 1:
+    if s != nil:
+      if isTemplParam(c, s):
         incl(s.flags, sfUsed)
-        return newSymNode(s, n.info)
+        result = newSymNode(s, n.info)
+      elif s.isError:
+        result = s.ast
       elif contains(c.toBind, s.id):
-        return symChoice(c.c, n, s, scClosed, c.noGenSym > 0)
+        result = symChoice(c.c, n, s, scClosed)
       elif contains(c.toMixin, s.name.id):
-        return symChoice(c.c, n, s, scForceOpen, c.noGenSym > 0)
+        result = symChoice(c.c, n, s, scForceOpen)
       else:
-        return symChoice(c.c, n, s, scOpen, c.noGenSym > 0)
-
-    case n.kind
-    of nkDotExpr:
-      result = n
-
-      result[0] = semTemplBody(c, n[0])
-      
-      inc c.noGenSym
-      result[1] = semTemplBody(c, n[1])
-      dec c.noGenSym
+        # FIXME: ``semTemplSymbol`` needs to be used here to ensure correct
+        #        typing for type symbols
+        result = symChoice(c.c, n, s, scOpen)
 
-      if nkError in {result[0].kind, result[1].kind}:
-        result = c.c.config.wrapError(result)
-    of nkAccQuoted:
-      result = semTemplBodySons(c, n)
-    else:
-      unreachable("should never have gotten here")
-  of nkExprColonExpr, nkExprEqExpr:
-    if n.len == 2:
-      inc c.noGenSym
+    elif n.kind == nkDotExpr:
+      # a normal dot expression
       result[0] = semTemplBody(c, n[0])
-      dec c.noGenSym
-      result[1] = semTemplBody(c, n[1])
+      var
+        iter: TOverloadIter
+        s = initOverloadIter(iter, c.c, n[1])
+
+      block resolve:
+        # only routines and types are eligible for the right-hand side, look
+        # for such a symbol:
+        while s != nil:
+          if s.isError:
+            localReport(c.c.config, s.ast)
+          elif isTemplParam(c, s):
+            # template parameters are bound eagerly
+            incl(s.flags, sfUsed)
+            result[1] = newSymNode(s, n[1].info)
+            break resolve
+          elif s.kind in routineKinds + {skType, skGenericParam}:
+            break # found a symbol that fits
+          s = nextOverloadIter(iter, c.c, n[1])
+
+        if s != nil:
+          var field = templBindSym(c, s, n[1], isField=true)
+          if field.kind == nkSym and sfGenSym notin field.sym.flags and
+             field.sym.kind in OverloadableSyms:
+            # ``semexprs.dotTransformation`` ignores single symbols, so we
+            # need to wrap the symbol in a sym-choice, to preserve the bound
+            # symbol
+            field = newTreeIT(nkOpenSymChoice, n[1].info,
+                              newTypeS(tyNone, c.c), field)
+            # XXX: should be a closed symbol choice, like it works for
+            #      generics, but code relies on the symbol being open...
+            # XXX: ``dotTransformation`` should not ignore symbols in the
+            #      first place
+
+          result[1] = field
+
+      hasError = nkError in {result[0].kind, result[1].kind}
     else:
+      # a quoted identifier or identifier construction
       result = semTemplBodySons(c, n)
+
+  of nkExprColonExpr, nkExprEqExpr:
+    let s = qualifiedLookUp(c.c, n[0], {})
+    # template parameters can be substituted into the name position of a
+    # ``a: b`` or ``a = b`` construct
+    if s != nil and isTemplParam(c, s):
+      result[0] = newSymNode(s, n[0].info)
+    elif n[0].kind == nkAccQuoted and n[0].len > 1:
+      # also process identifier constructions in the name position (n[0])
+      result[0] = semTemplBody(c, n[0])
+
+    result[1] = semTemplBody(c, n[1])
+    hasError = nkError in {result[0].kind, result[1].kind}
   of nkTableConstr:
     # also transform the keys (bug #12595)
     for i in 0..<n.len:
diff --git a/doc/manual.rst b/doc/manual.rst
index 2c0efbada36..b2e5cc734e5 100644
--- a/doc/manual.rst
+++ b/doc/manual.rst
@@ -5731,41 +5731,6 @@ no semantics outside of a template definition and cannot be abstracted over:
 To get rid of hygiene in templates, one can use the `dirty`:idx: pragma for
 a template. `inject` and `gensym` have no effect in `dirty` templates.
 
-`gensym`'ed symbols cannot be used as `field` in the `x.field` syntax.
-Nor can they be used in the `ObjectConstruction(field: value)`
-and `namedParameterCall(field = value)` syntactic constructs.
-
-The reason for this is that code like
-
-.. code-block:: nim
-    :test: "nim c $1"
-
-  type
-    T = object
-      f: int
-
-  template tmp(x: T) =
-    let f = 34
-    echo x.f, T(f: 4)
-
-
-should work as expected.
-
-However, this means that the method call syntax is not available for
-`gensym`'ed symbols:
-
-.. code-block:: nim
-    :test: "nim c $1"
-    :status: 1
-
-  template tmp(x) =
-    type
-      T {.gensym.} = int
-
-    echo x.T # invalid: instead use:  'echo T(x)'.
-
-  tmp(12)
-
 
 
 Limitations of the method call syntax
diff --git a/tests/lang_callable/template/mmethod_call_symbol_binding.nim b/tests/lang_callable/template/mmethod_call_symbol_binding.nim
new file mode 100644
index 00000000000..6968285b6db
--- /dev/null
+++ b/tests/lang_callable/template/mmethod_call_symbol_binding.nim
@@ -0,0 +1,5 @@
+proc p(x: int): int = x
+
+template templ*(x: untyped): untyped =
+  # `p` is a symbol that's not overloaded
+  x.p()
diff --git a/tests/lang_callable/template/tclosed_symbol_with_method_call.nim b/tests/lang_callable/template/tclosed_symbol_with_method_call.nim
new file mode 100644
index 00000000000..721f353900a
--- /dev/null
+++ b/tests/lang_callable/template/tclosed_symbol_with_method_call.nim
@@ -0,0 +1,26 @@
+discard """
+  description: '''
+    Ensure that non-overloaded symbols used as the method in the method-call
+    syntax are closed symbols
+  '''
+  action: reject
+  knownIssue: '''
+    Non-overloaded symbols used as the callee with the method call syntax
+    are always open
+  '''
+"""
+
+proc p(x: int) =
+  discard
+
+template test(x: string) =
+  # `p` is not overloaded at this point, and it's thus a closed symbol
+  x.p()
+
+# the overload with which the call would work:
+proc p(x: string) =
+  discard
+
+# the symbol of the callee is bound early and is closed, so the correct
+# overload cannot be picked, meaning that an error ensues
+test("")
diff --git a/tests/lang_callable/template/template_issues.nim b/tests/lang_callable/template/template_issues.nim
index 2c87d314ad6..dcfd3277bc8 100644
--- a/tests/lang_callable/template/template_issues.nim
+++ b/tests/lang_callable/template/template_issues.nim
@@ -304,3 +304,19 @@ block static_parameter_with_default:
     discard int(b)
 
   x() # the default value for the parameter must be used
+
+block method_call_syntax_with_gensym_routine:
+  # using the method-call syntax with gensym'ed routines didn't work
+  template test(x: int): untyped =
+    proc p(v: int): int {.gensym.} = v
+    x.p()
+
+  doAssert test(1) == 1
+
+block method_call_syntax_with_gensym_type:
+  # using the method-call syntax with gensym'ed types didn't work
+  template test(x: int): float =
+    type Typ {.gensym.} = float
+    x.Typ
+
+  doAssert test(1) == 1.0
diff --git a/tests/lang_callable/template/tmethod_call_symbol_binding.nim b/tests/lang_callable/template/tmethod_call_symbol_binding.nim
new file mode 100644
index 00000000000..373a79619cc
--- /dev/null
+++ b/tests/lang_callable/template/tmethod_call_symbol_binding.nim
@@ -0,0 +1,12 @@
+discard """
+  description: '''
+    Ensure that non-overloaded symbols from a template's definition scope are
+    bound early when using the method-call syntax.
+
+    Derived from https://github.com/nim-works/nimskull/issues/1292.
+  '''
+"""
+
+import mmethod_call_symbol_binding
+
+doAssert templ(1) == 1

From 0351072eb2ada968f4a62f3c900b00c8bbaa6c58 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Mon, 6 May 2024 20:15:19 +0200
Subject: [PATCH 084/169] fix(testament): batching being ignored for megatest
 (#1299)

## Summary

Fix batching being ignored for the megatest. Only tests part of the
current batch are now joined into the megatest.

Fixes https://github.com/nim-works/nimskull/issues/1037

## Details

In order to not duplicate the computation of whether the test is in the
current batch, a pseudo `TTest` instance is created that's then passed
to `computeEarly`.
---
 testament/categories.nim | 9 ++++++---
 testament/testament.nim  | 3 +++
 2 files changed, 9 insertions(+), 3 deletions(-)

diff --git a/testament/categories.nim b/testament/categories.nim
index 9738ec1f62d..b3ebda4f57c 100644
--- a/testament/categories.nim
+++ b/testament/categories.nim
@@ -360,9 +360,12 @@ proc runJoinedTest(r: var TResults, targets: set[TTarget], testsDir, options: st
       for file in walkDirRec(testsDir / cat):
         if isTestFile(file):
           try:
-            let spec = parseSpec(file, cat.Category.defaultTargets, nativeTarget())
-            if isJoinableSpec(spec, targets, computeEarly(spec, true)):
-              specs.add spec
+            # setup a pseudo test instance for the purpose of computing
+            # whether it can be joined
+            let test = initTest(file, "", cat.Category):
+              parseSpec(file, cat.Category.defaultTargets, nativeTarget())
+            if isJoinableSpec(test.spec, targets, computeEarly(test)):
+              specs.add test.spec
           except ValueError:
             msg Undefined:
               "parseSpec raised ValueError for: '$1', assuming this will be handled outside of megatest" % file
diff --git a/testament/testament.nim b/testament/testament.nim
index 4b09a4d51fc..be47463c69b 100644
--- a/testament/testament.nim
+++ b/testament/testament.nim
@@ -1147,6 +1147,9 @@ proc computeEarly(spec: TSpec, inCurrentBatch: bool): TResultEnum =
   else:
     reSuccess
 
+proc computeEarly(test: TTest): TResultEnum {.inline.} =
+  computeEarly(test.spec, test.inCurrentBatch)
+
 proc produceRuns(r: var TResults, test: TTest, early: TResultEnum,
                   runs: var seq[TestRun]) =
   ## Takes a test description (`test`) and the computed early result and

From f401e73639c2d15f2aefbad04c96199c8308b3dc Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Mon, 6 May 2024 22:00:05 +0200
Subject: [PATCH 085/169] lower `mChckField` magic with MIR pass (#1300)

## Summary

Lower the `mChckField` magic with a MIR pass instead of as part of C
code generation, shrinking down `cgen`.

## Details

* the lowering is integrated into `rtchecks.lowerChecks`
* it's a straightforward MIR port of how `cgen` handled the
  `mChckField` magic
* `lowerChecks` now needs access to the `MirBody`, so that the
  `mChckField` lowering can access the source map
---
 compiler/backend/ccgexprs.nim    | 68 ------------------------
 compiler/backend/ccgliterals.nim |  9 ----
 compiler/mir/mirpasses.nim       |  2 +-
 compiler/mir/rtchecks.nim        | 89 ++++++++++++++++++++++++++++++--
 4 files changed, 87 insertions(+), 81 deletions(-)

diff --git a/compiler/backend/ccgexprs.nim b/compiler/backend/ccgexprs.nim
index 9900fee52f3..71c81089c0b 100644
--- a/compiler/backend/ccgexprs.nim
+++ b/compiler/backend/ccgexprs.nim
@@ -561,72 +561,6 @@ proc genRecordField(p: BProc, e: CgNode, d: var TLoc) =
     r.addf(".$1", [p.fieldName(field)])
     putIntoDest(p, d, e, r, a.storage)
 
-proc genInExprAux(p: BProc, e: CgNode, a, b, d: var TLoc)
-
-proc genFieldCheck(p: BProc, e: CgNode) =
-  var test, u, v: TLoc
-  if true:
-    initLocExpr(p, e[1], u)
-    initLocExpr(p, e[2], v)
-    genInExprAux(p, e, u, v, test)
-    var strLit: Rope
-    if optDeclaredLocs in p.config.globalOptions:
-      # xxx this should be controlled by a separate flag, and
-      # used for other similar defects so that location information is shown
-      # even without the expensive `--stacktrace`; binary size could be optimized
-      # by encoding the file names separately from `file(line:col)`, essentially
-      # passing around `TLineInfo` + the set of files in the project.
-      let msg = toFileLineCol(p.config, e.info) & " " & getString(p, e[4])
-      # don't commit the string to the string table, as it's likely to be
-      # unique and never used again
-      strLit = genStringLiteral(p.module, msg)
-    else:
-      strLit = genStringLiteral(p.module, e[4])
-
-    ## discriminant check
-    template fun(code) = linefmt(p, cpsStmts, code, [rdLoc(test)])
-    if e[3].intVal == 1:
-      # the third operand indicates whether the result needs to be inverted
-      fun("if ($1) ")
-    else:
-      fun("if (!($1)) ")
-
-    let base = v.t.skipTypes(abstractRange)
-    var raiseProc, toStr: string
-    # generate and emit the code for the failure case:
-    case base.kind
-    of tyEnum:
-      # use the compiler-generated enum-to-string procedure
-      let prc = p.module.g.graph.getToStringProc(v.t)
-      discard registerLateProc(p.module, prc)
-
-      var tmp: TLoc
-      expr(p, newSymNode(p.env, prc), tmp)
-      toStr = "$1($2)" % [rdLoc(tmp), rdLoc(v)]
-      raiseProc = "raiseFieldErrorStr"
-
-    of tyChar:
-      # XXX: rendering as a character is supported by the runtime
-      #raiseProc = "raiseFieldErrorChar"
-      toStr = rdCharLoc(v)
-      raiseProc = "raiseFieldErrorUInt"
-    of tyBool:
-      raiseProc = "raiseFieldErrorBool"
-    of tyInt..tyInt64:
-      raiseProc = "raiseFieldErrorInt"
-    of tyUInt..tyUInt64:
-      raiseProc = "raiseFieldErrorUInt"
-    else:
-      discard
-      # unreachable()
-
-    if toStr == "":
-      toStr = rdLoc(v)
-
-    discard cgsym(p.module, raiseProc) # make sure the compilerproc is generated
-    linefmt(p, cpsStmts, "{ $1($3, $4); $2} $n",
-            [raiseProc, raiseInstr(p, e.exit), strLit, toStr])
-
 proc genUncheckedArrayElem(p: BProc, n, x, y: CgNode, d: var TLoc) =
   var a, b: TLoc
   initLocExpr(p, x, a)
@@ -1637,8 +1571,6 @@ proc genMagicExpr(p: BProc, e: CgNode, d: var TLoc, op: TMagic) =
     initLocExpr(p, e[2], a)
     initLocExpr(p, e[3], b)
     genBoundsCheck(p, arr, a, b, e.exit)
-  of mChckField:
-    genFieldCheck(p, e)
   of mChckObj:
     var a: TLoc
     initLocExpr(p, e[1], a)
diff --git a/compiler/backend/ccgliterals.nim b/compiler/backend/ccgliterals.nim
index 016e372e672..d1442bc5b5d 100644
--- a/compiler/backend/ccgliterals.nim
+++ b/compiler/backend/ccgliterals.nim
@@ -55,15 +55,6 @@ proc genStringLiteralV2Const(m: BModule; str: StringId; isConst: bool): Rope =
     pureLit = m.tmpBase & rope(id)
   result = "{$1, (NimStrPayload*)&$2}" % [rope(m.g.env[str].len), pureLit]
 
-proc genStringLiteral(m: BModule, str: string): Rope =
-  ## Spawns and emits a new global C constant storing a NimString with content
-  ## `str` -- no caching is performed.
-  let content = getTempName(m)
-  genStringLiteralDataOnlyV2(m, str, content, true)
-  result = getTempName(m)
-  m.s[cfsData].addf("static const NimStringV2 $1 = {$2, (NimStrPayload*)&$3};$n",
-                    [result, rope(str.len), content])
-
 # ------ Version selector ---------------------------------------------------
 
 proc genNilStringLiteral(m: BModule; info: TLineInfo): Rope =
diff --git a/compiler/mir/mirpasses.nim b/compiler/mir/mirpasses.nim
index c67db569866..41b82eadc50 100644
--- a/compiler/mir/mirpasses.nim
+++ b/compiler/mir/mirpasses.nim
@@ -678,7 +678,7 @@ proc applyPasses*(body: var MirBody, prc: PSym, env: var MirEnv,
 
     if target == targetC:
       lowerNew(body.code, graph, env, c)
-      lowerChecks(body.code, graph, env, c)
+      lowerChecks(body, graph, env, c)
       injectStrPreparation(body.code, graph, env, c)
 
   # instrument the body with profiler calls after all lowerings, but before
diff --git a/compiler/mir/rtchecks.nim b/compiler/mir/rtchecks.nim
index a2b863e4676..5af10aed5db 100644
--- a/compiler/mir/rtchecks.nim
+++ b/compiler/mir/rtchecks.nim
@@ -17,19 +17,26 @@ import
     magicsys
   ],
   compiler/mir/[
+    mirbodies,
     mirchangesets,
     mirconstr,
     mirenv,
     mirtrees,
-    mirtypes
+    mirtypes,
+    sourcemaps
   ],
   compiler/utils/[
     int128,
     idioms
   ]
 
+import compiler/front/options as comp_options
+# XXX: no source position inspection should take place here
+from compiler/front/msgs import toFileLineCol
+
 # shorten some common parameter declarations:
 using
+  body: MirBody
   tree: MirTree
   call: NodePosition
   graph: ModuleGraph
@@ -43,7 +50,8 @@ template subTree(bu; k: MirNodeKind, t: TypeId, body: untyped) =
 template buildIf(bu; cond: Value, body: untyped) =
   bu.subTree mnkIf:
     bu.use cond
-    body
+    bu.subTree mnkScope:
+      body
 
 template buildIfNot(bu; cond: Value, body: untyped) =
   let c = bu.wrapTemp BoolType:
@@ -191,8 +199,78 @@ proc emitNanCheck(tree; call; graph; env; bu) =
     bu.emitCall(tree, call, env.addCompilerProc(graph, "raiseFloatInvalidOp")):
       discard
 
-proc lowerChecks*(tree; graph; env; changes: var Changeset) =
+proc emitFieldCheck(tree; source: SourceMap; call; graph; env; bu) =
+  ## For ``chckField(set, discr, invert, msg)`` emits the MIR equivalent of:
+  ##   if not contains(set, discr):
+  ##     raiseFieldError(msg, ...)
+  let
+    setVal   = bu.inline(tree, NodePosition tree.argument(call, 0))
+    discrVal = bu.inline(tree, NodePosition tree.argument(call, 1))
+
+  var cond = bu.wrapTemp BoolType:
+    bu.buildMagicCall mInSet, BoolType:
+      bu.emitByVal setVal
+      bu.emitByVal discrVal
+
+  # the third argument is a boolean indicating whether the test is inverted
+  if env.getInt(tree[tree.argument(call, 2)]) == Zero:
+    cond = bu.wrapTemp BoolType:
+      bu.buildMagicCall mNot, BoolType:
+        bu.emitByVal cond
+
+  var msgVal: Value
+  if optDeclaredLocs in graph.config.globalOptions:
+    # XXX: this is an inadequate hack for supporting showing the source line
+    #      information as part of the error message, even when stack-traces are
+    #      disabled. This needs to be replaced with a general solution that
+    #      applies to all run-time checks
+    # fetch the line information of the call, render it, and prepend it to the
+    # message
+    var msg = toFileLineCol(graph.config, source[tree[call].info].info)
+    msg.add " "
+    msg.add env[tree[tree.argument(call, 3)].strVal]
+    msgVal = literal(env.getOrIncl(msg), StringType)
+  else:
+    # use the original message as-is
+    msgVal = bu.inline(tree, NodePosition tree.argument(call, 3))
+
+  bu.buildIf cond:
+    let typ = env[discrVal.typ].skipTypes(abstractRange)
+    var
+      raiseProc: string
+      extra = discrVal # the extra value to pass to the raise procedure
+
+    case typ.kind
+    of tyEnum:
+      # turn the run-time enum value into a string using the compiler-generated
+      # enum-to-string procedure for the type
+      let prc = graph.getToStringProc(typ)
+      extra = bu.wrapTemp StringType:
+        bu.buildCall env.procedures.add(prc), StringType:
+          bu.emitByVal discrVal
+
+      raiseProc = "raiseFieldErrorStr"
+    of tyChar:
+      # XXX: needs to use a dedicated raise procedure, once the runtime
+      #      supports it
+      raiseProc = "raiseFieldErrorUInt"
+    of tyBool:
+      raiseProc = "raiseFieldErrorBool"
+    of tyInt..tyInt64:
+      raiseProc = "raiseFieldErrorInt"
+    of tyUInt..tyUInt64:
+      raiseProc = "raiseFieldErrorUInt"
+    else:
+      unreachable(typ.kind)
+
+    bu.emitCall(tree, call, env.addCompilerProc(graph, raiseProc)):
+      bu.emitByVal msgVal
+      bu.emitByVal extra
+
+proc lowerChecks*(body; graph; env; changes: var Changeset) =
   ## Lowers all magic calls implementing the run-time checks.
+  template tree: MirTree = body.code
+
   for i, n in tree.pairs:
     if n.kind == mnkMagic:
       case n.magic
@@ -211,5 +289,10 @@ proc lowerChecks*(tree; graph; env; changes: var Changeset) =
         # make sure to take the ``mnkVoid`` wrapper into account
         changes.replaceMulti(tree, tree.parent(call), bu):
           emitNanCheck(tree, call, graph, env, bu)
+      of mChckField:
+        let call = tree.parent(i)
+        # make sure to take the ``mnkVoid`` wrapper into account
+        changes.replaceMulti(tree, tree.parent(call), bu):
+          emitFieldCheck(tree, body.source, call, graph, env, bu)
       else:
         discard "not relevant"

From 588a767a85b0391786197fb5f552f2d93502a60e Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Fri, 10 May 2024 21:35:07 +0200
Subject: [PATCH 086/169] threads: improve interface and fix bugs (#1302)

## Summary

Make `Thread` a proper thread handle, fixing multiple bugs and making
the interface more robust:
* a thread is now officially allowed to outlive the `Thread` instance
  (which would previously lead to crashes)
* a `Thread` handle for a running thread can now be safely moved around
* there's now a `createThread` overload that returns a `Thread`
  instance
* `Thread.finished` no longer has a race condition

## Details

The management-data for a thread was previously part of the `Thread`
type itself, with a pointer to the `Thread` instance passed to the
internal thread procedure, requiring the `Thread` instance for a
running thread to always stay at the same memory location.

As a consequence of this design, moving the `Thread` instance, or the
`Thread` instance going out of scope before the thread is finished,
resulted in undefined behaviour.

To address this problem, the management-data is made part of a heap-
allocated structure (`ThreadCore`), which is then shared between the
handle and spawned thread. The type uses manual reference counting in
order to support detached threads (threads that outlive their handle).

Since a `Thread` instance can now be moved around in memory, the base
`createThread` procedure can now return a `Thread`, which is the better
interface, as it prevents leaks caused by forgetting to destroy the
`Thread` instance first. For backwards compatibility, an in-place
`createThread` overload is added.

### Tests

Two new tests are added:
* a test for ensuring that the thread's internal data is freed
  correctly
* a test for ensuring that the thread parameter is destroyed

The pre-existing `tthread_destroy_before_finish.nim` test had a few
issues, which are now fixed:
* it had no proper description
* it wasn't guaranteed to actually fail (in the edge-case that the
  spawned thread finishes before the `reset` call)
* access to the `ok` global was not atomic (resulting in a race
  condition)
* it unnecessarily imported `std/os`
---
 lib/system/threadlocalstorage.nim             |  11 +-
 lib/system/threads.nim                        | 113 ++++++++++++------
 tests/threads/tinternal_thread_cleanup.nim    |  43 +++++++
 .../threads/tthread_destroy_before_finish.nim |  27 +++--
 tests/threads/tthread_param_is_destroyed.nim  |  22 ++++
 5 files changed, 161 insertions(+), 55 deletions(-)
 create mode 100644 tests/threads/tinternal_thread_cleanup.nim
 create mode 100644 tests/threads/tthread_param_is_destroyed.nim

diff --git a/lib/system/threadlocalstorage.nim b/lib/system/threadlocalstorage.nim
index f105776fda7..b6e9e362234 100644
--- a/lib/system/threadlocalstorage.nim
+++ b/lib/system/threadlocalstorage.nim
@@ -181,12 +181,6 @@ when emulatedThreadVars:
 const nimTlsSize {.intdefine.} = 16000
 type
   ThreadLocalStorage = array[0..(nimTlsSize div sizeof(float)), float]
-  PGcThread = ptr GcThread
-  GcThread {.pure, inheritable.} = object
-    when emulatedThreadVars:
-      tls: ThreadLocalStorage
-    else:
-      nil
 
 when emulatedThreadVars:
   var globalsSlot {.noInit.}: ThreadVarSlot
@@ -195,10 +189,11 @@ when emulatedThreadVars:
   # here
 
   when not defined(useNimRtl):
-    var mainThread: GcThread
+    var mainThread: ThreadLocalStorage
+      ## the thread-local storage of the main thread
 
   proc GetThreadLocalVars(): pointer {.compilerRtl, inl.} =
-    result = addr(cast[PGcThread](threadVarGetValue(globalsSlot)).tls)
+    result = cast[ptr ThreadLocalStorage](threadVarGetValue(globalsSlot))
 
   proc initThreadVarsEmulation() {.compilerproc, inline.} =
     when not defined(useNimRtl):
diff --git a/lib/system/threads.nim b/lib/system/threads.nim
index bad9966f95e..10eb3a00561 100644
--- a/lib/system/threads.nim
+++ b/lib/system/threads.nim
@@ -39,7 +39,7 @@
 ##  initLock(L)
 ##
 ##  for i in 0..high(thr):
-##    createThread(thr[i], threadFunc, (i*10, i*10+5))
+##    thr[i] = createThread(threadFunc, (i*10, i*10+5))
 ##  joinThreads(thr)
 ##
 ##  deinitLock(L)
@@ -61,16 +61,42 @@ const
 # use ``stdcall`` since it is mapped to ``noconv`` on UNIX anyway.
 
 type
-  Thread*[TArg] = object
-    core: PGcThread
-    sys: SysThread
+  ThreadCore[TArg] = object
+    ## The internal management data associated with a thread. Allocated
+    ## by the spawning thread, and - initially - owned by both the spawning
+    ## and spawned thread (shared ownership). If the spawned thread finishes
+    ## before the `Thread <#Thread>` handle owned by the spawning thread goes
+    ## out of scope, the spawning thread frees the instance, otherwise the
+    ## spawned thread does.
+    when emulatedThreadVars:
+      tls: ThreadLocalStorage
+
+    rc: int
+      ## ref-counter. Has a maximum value of 2. All operations on it must be
+      ## atomic
+
     when TArg is void:
       dataFn: proc () {.nimcall, gcsafe.}
     else:
       dataFn: proc (m: TArg) {.nimcall, gcsafe.}
       data: TArg
 
+  Thread*[TArg] = object
+    core: ptr ThreadCore[TArg]
+    sys: SysThread
+
 proc `=copy`*[TArg](x: var Thread[TArg], y: Thread[TArg]) {.error.}
+proc `=destroy`[TArg](x: var Thread[TArg])
+
+proc release[TArg](core: ptr ThreadCore[TArg]) =
+  if atomicDec(core.rc, 1, ATOMIC_ACQ_REL) == 0:
+    deallocShared(core)
+
+proc `=destroy`[TArg](x: var Thread[TArg]) =
+  if x.core != nil:
+    # the spawning thread doesn't own the data passed along to the thread,
+    # so don't touch it
+    release(x.core)
 
 var
   threadDestructionHandlers {.rtlThreadVar.}: seq[proc () {.closure, gcsafe, raises: [].}]
@@ -94,7 +120,7 @@ proc threadTrouble() {.raises: [], gcsafe.}
   ## defined in system/excpt.nim
 
 when true:
-  proc threadProcWrapDispatch[TArg](thrd: ptr Thread[TArg]) {.raises: [].} =
+  proc threadProcWrapDispatch[TArg](thrd: ptr ThreadCore[TArg]) {.raises: [].} =
     try:
       when TArg is void:
         thrd.dataFn()
@@ -106,25 +132,26 @@ when true:
       afterThreadRuns()
 
 template threadProcWrapperBody(closure: untyped): untyped =
-  var thrd = cast[ptr Thread[TArg]](closure)
-  var core = thrd.core
-  when declared(globalsSlot): threadVarSetValue(globalsSlot, thrd.core)
-  threadProcWrapDispatch(thrd)
+  let core = cast[ptr ThreadCore[TArg]](closure)
+  when declared(globalsSlot):
+    threadVarSetValue(globalsSlot, addr(core.tls))
+  threadProcWrapDispatch(core)
   # Since an unhandled exception terminates the whole process (!), there is
   # no need for a ``try finally`` here, nor would it be correct: The current
   # exception is tried to be re-raised by the code-gen after the ``finally``!
   # However this is doomed to fail, because we already unmapped every heap
   # page!
 
+  when TArg isnot void:
+    # the spawned thread has ownership of the extra data, destroy it:
+    reset(core.data)
+
   when compileOption("gc", "orc"):
     # run a full garbage collection pass in order to free all cells
     # kept alive only through reference cycles
     GC_fullCollect()
 
-  # mark as not running anymore:
-  thrd.core = nil
-  thrd.dataFn = nil
-  deallocShared(cast[pointer](core))
+  release(core)
 
 {.push stack_trace:off.}
 # NOTE: the `threadProcWrapper` is currently special-cased by the compiler to
@@ -138,9 +165,18 @@ else:
     threadProcWrapperBody(closure)
 {.pop.}
 
+proc createThreadCore[TArg](tp: proc (arg: TArg) {.thread, nimcall.},
+                           ): ptr ThreadCore[TArg] =
+  ## Allocates and sets up a ``ThreadCore`` instance.
+  result = createShared(ThreadCore[TArg])
+  result.rc = 2 # both threads initially own the data
+  result.dataFn = tp
+
 proc running*[TArg](t: Thread[TArg]): bool {.inline.} =
   ## Returns true if `t` is running.
-  result = t.dataFn != nil
+  # if the spawning thread has unique ownership of the spawned thread's
+  # management data, the thread isn't running anymore
+  result = t.core != nil and atomicLoadN(addr t.core.rc, ATOMIC_RELAXED) == 2
 
 proc handle*[TArg](t: Thread[TArg]): SysThread {.inline.} =
   ## Returns the thread handle of `t`.
@@ -189,23 +225,22 @@ when false:
       t.core = nil
 
 when hostOS == "windows":
-  proc createThread*[TArg](t: var Thread[TArg],
-                           tp: proc (arg: TArg) {.thread, nimcall.},
-                           param: TArg) =
-    ## Creates a new thread `t` and starts its execution.
+  proc createThread*[TArg](tp: proc (arg: TArg) {.thread, nimcall.},
+                           param: TArg): Thread[TArg] =
+    ## Creates a new thread, starts its execution, and returns a handle of the
+    ## thread.
     ##
     ## Entry point is the proc `tp`.
     ## `param` is passed to `tp`. `TArg` can be `void` if you
     ## don't need to pass any data to the thread.
-    t.core = cast[PGcThread](allocShared0(sizeof(GcThread)))
-
-    when TArg isnot void: t.data = param
-    t.dataFn = tp
+    result.core = (createThreadCore[TArg])(tp)
+    when TArg isnot void:
+      result.core.data = param
 
     var dummyThreadId: int32
-    t.sys = createThread(nil, ThreadStackSize, threadProcWrapper[TArg],
-                         addr(t), 0'i32, dummyThreadId)
-    if t.sys <= 0:
+    result.sys = createThread(nil, ThreadStackSize, threadProcWrapper[TArg],
+                              result.core, 0'i32, dummyThreadId)
+    if result.sys <= 0:
       raise newException(ResourceExhaustedError, "cannot create thread")
 
   proc pinToCpu*[Arg](t: var Thread[Arg]; cpu: Natural) =
@@ -216,18 +251,17 @@ when hostOS == "windows":
     setThreadAffinityMask(t.sys, uint(1 shl cpu))
 
 else:
-  proc createThread*[TArg](t: var Thread[TArg],
-                           tp: proc (arg: TArg) {.thread, nimcall.},
-                           param: TArg) =
-    ## Creates a new thread `t` and starts its execution.
+  proc createThread*[TArg](tp: proc (arg: TArg) {.thread, nimcall.},
+                           param: TArg): Thread[TArg] =
+    ## Creates a new thread, starts its execution, and returns a handle of the
+    ## thread.
     ##
     ## Entry point is the proc `tp`. `param` is passed to `tp`.
     ## `TArg` can be `void` if you
     ## don't need to pass any data to the thread.
-    t.core = cast[PGcThread](allocShared0(sizeof(GcThread)))
-
-    when TArg isnot void: t.data = param
-    t.dataFn = tp
+    result.core = (createThreadCore[TArg])(tp)
+    when TArg isnot void:
+      result.core.data = param
 
     var a {.noinit.}: Pthread_attr
     doAssert pthread_attr_init(a) == 0
@@ -235,7 +269,7 @@ else:
     when not defined(ios):
       # This fails on iOS
       doAssert(setstacksizeResult == 0)
-    if pthread_create(t.sys, a, threadProcWrapper[TArg], addr(t)) != 0:
+    if pthread_create(result.sys, a, threadProcWrapper[TArg], result.core) != 0:
       raise newException(ResourceExhaustedError, "cannot create thread")
     doAssert pthread_attr_destroy(a) == 0
 
@@ -251,7 +285,16 @@ else:
       setAffinity(t.sys, csize_t(sizeof(s)), s)
 
 proc createThread*(t: var Thread[void], tp: proc () {.thread, nimcall.}) =
-  (createThread[void])(t, tp)
+  t = (createThread[void])(tp)
+
+proc createThread*[TArg](t: var Thread[TArg],
+                         tp: proc(arg: TArg) {.thread, nimcall.},
+                         param: TArg) =
+  ## Convenience short-hand for creating and assigning a thread in-place.
+  when TArg isnot void:
+    t = createThread[TArg](tp, param)
+  else:
+    t = (createThread[void])(tp)
 
 when not defined(gcOrc):
   include threadids
diff --git a/tests/threads/tinternal_thread_cleanup.nim b/tests/threads/tinternal_thread_cleanup.nim
new file mode 100644
index 00000000000..aa8c7d25e0f
--- /dev/null
+++ b/tests/threads/tinternal_thread_cleanup.nim
@@ -0,0 +1,43 @@
+discard """
+  description: "Ensure that the internal thread management-data is freed"
+  joinable: false
+"""
+
+import std/os
+
+let startMem = getOccupiedSharedMem()
+
+proc run(signal: ptr int) =
+  # busy-wait until the signal is signaled
+  while atomicLoadN(signal, ATOMIC_SEQ_CST) == 0:
+    discard
+
+block detached_thread:
+  # case 1: detached thread (the spawned thread does the cleanup)
+  var
+    signal = 0
+    thread: Thread[ptr int]
+
+  thread.createThread(run, addr signal)
+  # don't wake the thread up
+  thread.reset()
+  # now wake the thread up
+  atomicStoreN(addr signal, 1, ATOMIC_SEQ_CST)
+
+  # without the handle there's no way to know when the thread is finished,
+  # so we sleep for some time
+  sleep(100)
+  doAssert getOccupiedSharedMem() == startMem
+
+block joined_thread:
+  # case 2: joined thread (the current thread does the cleanup)
+  var
+    signal = 0
+    thread: Thread[ptr int]
+
+  thread.createThread(run, addr signal)
+  atomicStoreN(addr signal, 1, ATOMIC_SEQ_CST)
+  thread.joinThread() # wait for the thread to finish
+  reset thread # destroy the thread
+
+  doAssert getOccupiedSharedMem() == startMem
diff --git a/tests/threads/tthread_destroy_before_finish.nim b/tests/threads/tthread_destroy_before_finish.nim
index e56397e784b..36104106597 100644
--- a/tests/threads/tthread_destroy_before_finish.nim
+++ b/tests/threads/tthread_destroy_before_finish.nim
@@ -1,18 +1,20 @@
 discard """
+  description: '''
+    Ensure that detaching a thread (destroying the handle before the spawned
+    thread finishes) works
+  '''
   output: ""
   joinable: false
-  knownIssue: "std/thread is broken"
-  description: '''
-  . if `Thread` is freed before the thread finishes, SIGSEGV
-  . reference counting of `Thread.coreFn` is broken
-'''
 """
 
-import std/os
-
-var ok = false
+var step = 0
 proc whatever() =
-  ok = true
+  # busy-loop until the thread is detached:
+  while atomicLoadN(addr step, ATOMIC_SEQ_CST) < 1:
+    discard
+
+  # thread is detached, increment the counter
+  discard atomicInc(step, 1, ATOMIC_SEQ_CST)
 
 var thread: Thread[void]
 createThread(thread, whatever)
@@ -20,9 +22,10 @@ createThread(thread, whatever)
 # Simulated: variable going out of scope
 thread.reset()
 
-# this breaks as well
-# thread.dataFn.reset()
+# signal that the thread is detached now:
+discard atomicInc(step, 1, ATOMIC_SEQ_CST)
 
-while not ok:
+# wait until the thread is done:
+while atomicLoadN(addr step, ATOMIC_SEQ_CST) < 2:
   discard
 
diff --git a/tests/threads/tthread_param_is_destroyed.nim b/tests/threads/tthread_param_is_destroyed.nim
new file mode 100644
index 00000000000..0d1e9d693a3
--- /dev/null
+++ b/tests/threads/tthread_param_is_destroyed.nim
@@ -0,0 +1,22 @@
+discard """
+  description: "Ensure that thread parameters are destroyed properly"
+  joinable: false
+"""
+
+var counter: int
+
+type Param = object
+  init: bool
+
+proc `=destroy`(x: var Param) =
+  if x.init:
+    discard atomicInc(counter, 1, ATOMIC_SEQ_CST)
+
+proc run(x: Param) {.thread.} =
+  discard
+
+var thread: Thread[Param]
+thread.createThread(run, Param(init: true))
+thread.joinThread()
+
+doAssert atomicLoadN(addr counter, ATOMIC_SEQ_CST) == 1

From b63f0781a8a5f8c1cc7dc11cf7a26386575f4b9b Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Fri, 10 May 2024 21:35:47 +0200
Subject: [PATCH 087/169] lower `mChckObj` magic with MIR pass (#1304)

## Summary

Lower the `mChckObj` magic with a MIR pass instead of as part of C code
generation, shrinking down `cgen`.

## Details

* the lowering is integrated into `rtchecks.lowerChecks`
* it's a straightforward MIR port of how `cgen` handled the `mChckObj`
  magic
* so that the syntax stays correct after lowering, `mirgen` now wraps
  the `mChckObj` call in a scope
---
 compiler/backend/ccgexprs.nim             | 10 --------
 compiler/mir/mirgen.nim                   |  9 ++++----
 compiler/mir/rtchecks.nim                 | 28 +++++++++++++++++++++++
 tests/exception/truntime_check_panics.nim |  3 ++-
 4 files changed, 35 insertions(+), 15 deletions(-)

diff --git a/compiler/backend/ccgexprs.nim b/compiler/backend/ccgexprs.nim
index 71c81089c0b..d1b55649f94 100644
--- a/compiler/backend/ccgexprs.nim
+++ b/compiler/backend/ccgexprs.nim
@@ -1571,16 +1571,6 @@ proc genMagicExpr(p: BProc, e: CgNode, d: var TLoc, op: TMagic) =
     initLocExpr(p, e[2], a)
     initLocExpr(p, e[3], b)
     genBoundsCheck(p, arr, a, b, e.exit)
-  of mChckObj:
-    var a: TLoc
-    initLocExpr(p, e[1], a)
-    var nilCheck = ""
-    let r = rdMType(p, a, nilCheck)
-    assert nilCheck != "", "not a pointer-like value?"
-    # the nil-check is expected to have taken place already
-    linefmt(p, cpsStmts, "if (!#isObj($2, $3)){ #raiseObjectConversionError(); $4}$n",
-            [nilCheck, r, genTypeInfo2Name(p.module, e[2].typ),
-             raiseInstr(p, e.exit)])
   of mSamePayload:
     var a, b: TLoc
     initLocExpr(p, e[1], a)
diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index 36030ca8be5..b4331ee8b77 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -1825,10 +1825,11 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
               c.buildMagicCall mIsNil, BoolType:
                 c.emitByVal val
       # the check:
-      c.subTree mnkVoid:
-        c.buildDefectMagicCall mChckObj, VoidType:
-          c.emitByVal val
-          c.emitByVal typeLit(c.typeToMir(n.check))
+      c.subTree mnkScope:
+        c.subTree mnkVoid:
+          c.buildDefectMagicCall mChckObj, VoidType:
+            c.emitByVal val
+            c.emitByVal typeLit(c.typeToMir(n.check))
 
     c.buildOp mnkPathConv, typ:
       c.use val
diff --git a/compiler/mir/rtchecks.nim b/compiler/mir/rtchecks.nim
index 5af10aed5db..54d830fd8ec 100644
--- a/compiler/mir/rtchecks.nim
+++ b/compiler/mir/rtchecks.nim
@@ -267,6 +267,30 @@ proc emitFieldCheck(tree; source: SourceMap; call; graph; env; bu) =
       bu.emitByVal msgVal
       bu.emitByVal extra
 
+proc emitObjectCheck(tree; call; graph; env; bu) =
+  ## For ``chckObj(o, typ)`` emits:
+  ##   def _1 = of(arg o[], arg typ)
+  ##   def _2 = not(arg _1)
+  ##   if _2:
+  ##     raiseObjectConversionError()
+  let
+    arg = bu.inline(tree, NodePosition tree.argument(call, 0))
+    typ = env[arg.typ].skipTypes(abstractInst + tyUserTypeClasses)
+
+  let cond = bu.wrapTemp BoolType:
+    bu.buildMagicCall mOf, BoolType:
+      # dereference first. Object checks are always guarded by an ``!= nil``
+      # check, so the pointer/ref is guaranteed to be non-nil
+      bu.subTree mnkArg:
+        bu.subTree mnkDeref, env.types.add(typ[^1]):
+          bu.use arg
+      bu.subTree mnkArg:
+        bu.emitFrom(tree, NodePosition tree.argument(call, 1))
+
+  bu.buildIfNot cond:
+    bu.emitCall(tree, call, env.addCompilerProc(graph, "raiseObjectConversionError")):
+      discard
+
 proc lowerChecks*(body; graph; env; changes: var Changeset) =
   ## Lowers all magic calls implementing the run-time checks.
   template tree: MirTree = body.code
@@ -294,5 +318,9 @@ proc lowerChecks*(body; graph; env; changes: var Changeset) =
         # make sure to take the ``mnkVoid`` wrapper into account
         changes.replaceMulti(tree, tree.parent(call), bu):
           emitFieldCheck(tree, body.source, call, graph, env, bu)
+      of mChckObj:
+        let call = tree.parent(i)
+        changes.replaceMulti(tree, tree.parent(call), bu):
+          emitObjectCheck(tree, call, graph, env, bu)
       else:
         discard "not relevant"
diff --git a/tests/exception/truntime_check_panics.nim b/tests/exception/truntime_check_panics.nim
index ee292e3d09c..1427c4ad5c5 100644
--- a/tests/exception/truntime_check_panics.nim
+++ b/tests/exception/truntime_check_panics.nim
@@ -22,7 +22,8 @@ scope:
   def _11: bool = isNil(arg r)
   def _10: bool = not(arg _11)
   if _10:
-    chckObj(arg r, arg type(Sub:ObjectType))
+    scope:
+      chckObj(arg r, arg type(Sub:ObjectType))
   discard r.(Sub)
   def _12: float = mulF64(arg f, arg f)
   chckNaN(arg _12)

From af04de564e749ce08cdc7fcccbbf435ff6aeed86 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Mon, 13 May 2024 02:51:39 +0200
Subject: [PATCH 088/169] run destructors for `.threadvar`s on thread exit
 (#1308)

## Summary

All `.threadvar`s that have destructors are now destroyed on thread
exit (including the main thread). Module-level `.threadvar`s are
destroyed *before* procedure-scoped `.threadvar`s, mirroring the
destruction order of non-threadlocal globals.

Fixes https://github.com/nim-works/nimskull/issues/1301.

## Details

Two new module operators are introduced:
* `ThreadDeinit` (destroys all module-level `.threadvar`s)
* `ThreadPostDeinit` (destroys all procedure-scoped `.threadvar`s)

They have the same role for `.threadvar`s as `Deinit` and `PostDeinit`
do for normal globals. In order to make the implementation slightly
simpler, destruction of procedure-scoped `.threadvar`s is also done as
part of `PostDeinit`. This means that `ThreadPostDeinit` doesn't have to
be called on program teardown.

Finally, `cbackend` (the other backends don't support threads at the
moment) generates and emits the `nimTeardownThreadVars` procedure,
which is then importc'ed by `threads` and run after the destruction
callbacks (which might use threadvars themselves).

Since all backends use `backends.generateMain` (either directly or
indirectly), destruction of `.threadvar`s also automatically works with
the JS and VM backends.
---
 compiler/backend/backends.nim             | 62 +++++++++++++++++------
 compiler/backend/cbackend.nim             | 23 +++++++++
 compiler/sem/modulelowering.nim           | 33 +++++++++---
 lib/system/threads.nim                    |  5 ++
 tests/threads/mthreadvars_destruction.nim | 15 ++++++
 tests/threads/tthreadvars_destruction.nim | 31 ++++++++++++
 6 files changed, 145 insertions(+), 24 deletions(-)
 create mode 100644 tests/threads/mthreadvars_destruction.nim
 create mode 100644 tests/threads/tthreadvars_destruction.nim

diff --git a/compiler/backend/backends.nim b/compiler/backend/backends.nim
index 1f4730c3385..a7f253043d5 100644
--- a/compiler/backend/backends.nim
+++ b/compiler/backend/backends.nim
@@ -216,11 +216,30 @@ proc generateTeardown*(graph: ModuleGraph, modules: ModuleList, result: PNode) =
   for it in rclosed(modules):
     if sfSystemModule notin it.sym.flags:
       emitOpCall(graph, it.destructor, result)
+      emitOpCall(graph, it.threadDestructor, result)
       emitOpCall(graph, it.postDestructor, result)
 
+  # the destructor calls for procedure-scoped threadvars are also part of the
+  # postDestructor module op, meaning that the threadPostDestructor op must
+  # not be invoked
+
   emitOpCall(graph, systemModule(modules).destructor, result)
+  emitOpCall(graph, systemModule(modules).threadDestructor, result)
   emitOpCall(graph, systemModule(modules).postDestructor, result)
 
+proc generateThreadTeardown*(graph: ModuleGraph, modules: ModuleList,
+                             result: PNode) =
+  ## Generates the code for de-initializing all threadvars for the program,
+  ## and emits it to `result`. Destruction order is the same as for non-
+  ## threadlocal state.
+  for it in rclosed(modules):
+    if sfSystemModule notin it.sym.flags:
+      emitOpCall(graph, it.threadDestructor, result)
+      emitOpCall(graph, it.threadPostDestructor, result)
+
+  emitOpCall(graph, systemModule(modules).threadDestructor, result)
+  emitOpCall(graph, systemModule(modules).threadPostDestructor, result)
+
 proc generateMainProcedure*(graph: ModuleGraph, idgen: IdGenerator,
                             modules: ModuleList): PSym =
   ## Generates the procedure for initializing, running, and de-initializing
@@ -375,7 +394,7 @@ proc generateIR*(graph: ModuleGraph, idgen: IdGenerator, env: var MirEnv,
 
 proc produceFragmentsForGlobals(
     env: var MirEnv, identdefs: seq[PNode], graph: ModuleGraph,
-    config: TranslationConfig): tuple[init, deinit: MirBody] =
+    config: TranslationConfig): tuple[init, deinit, threadDeinit: MirBody] =
   ## Given a list of identdefs of lifted globals, produces the MIR code for
   ## initialzing and deinitializing the globals. All not-yet-seen globals and
   ## threadvars are added to `env`.
@@ -395,7 +414,7 @@ proc produceFragmentsForGlobals(
     # we're creating a body here, so there is no list of locals yet
     result = finish(bu, default(Store[LocalId, Local]))
 
-  var init, deinit: MirBuilder
+  var init, deinit, threadDeinit: MirBuilder
 
   # lifted globals can appear re-appear in the identdefs list for two reasons:
   # - the definition appears in the body of a for-loop using an inline iterator
@@ -406,27 +425,32 @@ proc produceFragmentsForGlobals(
   # only want to generate code for the first definition we encounter
   for it in identdefs.items:
     let s = it[0].sym
-    # threadvars don't support initialization nor destruction, so they're
-    # skipped
-    if sfThread in s.flags:
-      discard env.globals.add(s)
-    elif s notin env.globals: # cull duplicates
+    if s notin env.globals: # cull duplicates
       let global = env.globals.add(s)
-      # generate the MIR code for an initializing assignment:
-      prepare(init, result.init.source, graph.emptyNode)
-      generateAssignment(graph, env, config, it, init, result.init.source)
+      if sfThread notin s.flags:
+        # generate the MIR code for an initializing assignment:
+        prepare(init, result.init.source, graph.emptyNode)
+        generateAssignment(graph, env, config, it, init, result.init.source)
+
+      template destroyOp(bu: var MirBuilder, sm: var SourceMap) =
+        prepare(bu, sm, graph.emptyNode)
+        bu.setSource(sm.add(it[0]))
+        genDestroy(bu, graph, env, toValue(global, env.types.add(s.typ)))
 
       # if the global requires one, emit a destructor call into the deinit
       # fragment:
       if hasDestructor(s.typ):
-        prepare(deinit, result.deinit.source, graph.emptyNode)
-        deinit.setSource(result.deinit.source.add(it[0]))
-        genDestroy(deinit, graph, env, toValue(global, env.types.add(s.typ)))
+        destroyOp(deinit, result.deinit.source)
+        if sfThread in s.flags:
+          # also emit a destructor into the thread-deinit fragment:
+          destroyOp(threadDeinit, result.threadDeinit.source)
 
   (result.init.code, result.init.locals) =
     finish(init, result.init.source, graph.emptyNode)
   (result.deinit.code, result.deinit.locals) =
     finish(deinit, result.deinit.source, graph.emptyNode)
+  (result.threadDeinit.code, result.threadDeinit.locals) =
+    finish(threadDeinit, result.threadDeinit.source, graph.emptyNode)
 
 # ----- dynlib handling -----
 
@@ -713,7 +737,8 @@ iterator process*(graph: ModuleGraph, modules: var ModuleList,
   # mark all procedures that require incremental code generation as forwarded,
   # so that they're not queued for normal code generation
   for _, m in modules.modules.pairs:
-    for it in [m.preInit, m.postDestructor, m.dynlibInit]:
+    for it in [m.preInit, m.postDestructor, m.threadPostDestructor,
+               m.dynlibInit]:
       it.flags.incl sfForward
 
   discovery.progress = checkpoint(env)
@@ -731,6 +756,9 @@ iterator process*(graph: ModuleGraph, modules: var ModuleList,
     if not isTrivialProc(graph, m.destructor):
       discard env.procedures.add(m.destructor)
 
+    if not isTrivialProc(graph, m.threadDestructor):
+      discard env.procedures.add(m.threadDestructor)
+
     # register the globals and threadvars:
     for s in m.structs.globals.items:
       discard env.globals.add(s)
@@ -811,11 +839,12 @@ iterator process*(graph: ModuleGraph, modules: var ModuleList,
       queue.prepend(module, WorkItem(kind: wikReportConst, cnst: item.cnst))
     of wikProcessGlobals:
       # produce the init/de-init code for the lifted globals:
-      let (init, deinit) =
+      let (init, deinit, threadDeinit) =
         produceFragmentsForGlobals(env, item.globals, graph, conf.tconfig)
 
       pushProgress(modules[module].preInit, init, module)
       pushProgress(modules[module].postDestructor, deinit, module)
+      pushProgress(modules[module].threadPostDestructor, threadDeinit, module)
     of wikImported:
       let id = item.imported
       # the procedure is always reported from the module its attached to
@@ -841,7 +870,8 @@ iterator process*(graph: ModuleGraph, modules: var ModuleList,
 
   # unmark all completed incremental procedures:
   for _, m in modules.modules.pairs:
-    for it in [m.preInit, m.postDestructor, m.dynlibInit]:
+    for it in [m.preInit, m.postDestructor, m.threadPostDestructor,
+               m.dynlibInit]:
       if not isTrivialProc(graph, it):
         it.flags.excl sfForward
 
diff --git a/compiler/backend/cbackend.nim b/compiler/backend/cbackend.nim
index 4e9d34bb1bb..bdd66648f7d 100644
--- a/compiler/backend/cbackend.nim
+++ b/compiler/backend/cbackend.nim
@@ -366,6 +366,27 @@ proc generateCodeForMain(m: BModule, modules: ModuleList) =
   # XXX: ^^ this is going to change in the future
   genMainProc(m, code)
 
+proc generateThreadTeardown(m: BModule, modules: ModuleList) =
+  ## Generates and emits the C code for the ``nimTeardownThreadVars``
+  ## procedure.
+  let body = newNode(nkStmtList)
+  generateThreadTeardown(m.g.graph, modules, body)
+
+  let p = newProc(nil, m)
+  p.flags.incl nimErrorFlagDisabled
+  p.options = {}
+  p.body = canonicalize(m.g.graph, m.idgen, m.g.env, m.module, body,
+                        TranslationConfig())
+
+  # manually produced the C code for the procedure:
+  genStmts(p, p.body.code)
+  var code = "void nimTeardownThreadVars(void) {\n"
+  code.add(p.s(cpsLocals))
+  code.add(p.s(cpsInit))
+  code.add(p.s(cpsStmts))
+  code.add "}\n"
+  m.s[cfsProcs].add code
+
 proc generateCode*(graph: ModuleGraph, g: BModuleList, mlist: sink ModuleList)
 
 proc generateCode*(graph: ModuleGraph, mlist: sink ModuleList) =
@@ -499,6 +520,8 @@ proc generateCode*(graph: ModuleGraph, g: BModuleList, mlist: sink ModuleList) =
     if sfMainModule in m.sym.flags:
       finalizeMainModule(bmod)
       generateCodeForMain(bmod, mlist)
+      if optThreads in graph.config.globalOptions:
+        generateThreadTeardown(bmod, mlist)
 
     # code generation for the module is done; its C code will not change
     # anymore beyond this point
diff --git a/compiler/sem/modulelowering.nim b/compiler/sem/modulelowering.nim
index 8ee0ccded31..47c52958b8c 100644
--- a/compiler/sem/modulelowering.nim
+++ b/compiler/sem/modulelowering.nim
@@ -71,8 +71,11 @@ type
     init*: PSym
       ## the procedure responsible for initializing the module's globals
     destructor*: PSym
-      ## the prodcedure responsible for de-initializing the module's
+      ## the procedure responsible for de-initializing the module's
       ## globals
+    threadDestructor*: PSym
+      ## the procedure responsible for de-initializing the module's
+      ## thread-local variables
 
     # XXX: the design around the pre-init and post-destructor procedure is
     #      likely not final yet. At the moment, we set them up here so that
@@ -81,6 +84,8 @@ type
       ## the procedure for initializing the module's lifted globals
     postDestructor*: PSym
       ## the procedure for destroying the module's lifted globals
+    threadPostDestructor*: PSym
+      ## the procedure for destroying the module's lifted threadvars
     dynlibInit*: PSym
       ## the procedure for loading the dynamic libraries, procedure, and
       ## variables associated with the module
@@ -299,12 +304,13 @@ proc genDestroy(graph: ModuleGraph, dest: PNode): PNode =
 
   result = newTreeI(nkCall, dest.info, newSymNode(op), addrExp)
 
-proc generateModuleDestructor(graph: ModuleGraph, m: Module): PNode =
-  ## Generates the body for the destructor procedure of module `m` (also
-  ## referred to as the 'de-init' procedure).
+proc generateDestructor(graph: ModuleGraph, vars: openArray[PSym]): PNode =
+  ## Generates the body for a module destructor (also referred to as the
+  ## 'de-init' procedure). A destructor call for each entitiy in `vars` is
+  ## emitted, in reverse order of appearance.
   result = newNode(nkStmtList)
-  for i in countdown(m.structs.globals.high, 0):
-    let s = m.structs.globals[i]
+  for i in countdown(vars.high, 0):
+    let s = vars[i]
     if hasDestructor(s.typ):
       result.add genDestroy(graph, newSymNode(s))
 
@@ -414,11 +420,22 @@ proc setupModule*(graph: ModuleGraph, idgen: IdGenerator, m: PSym,
   result.dataInit = createModuleOp(graph, idgen, "DatInit", m, newNode(nkEmpty), options)
 
   # setup the module struct clean-up operator:
-  let destructorBody = generateModuleDestructor(graph, result)
-  result.destructor = createModuleOp(graph, idgen, "Deinit", m, destructorBody, options)
+  result.destructor =
+    createModuleOp(graph, idgen, "Deinit", m,
+                   generateDestructor(graph, result.structs.globals),
+                   options)
+
+  # setup the per-thread module struct clean-up operator:
+  result.threadDestructor =
+    createModuleOp(graph, idgen, "ThreadDeinit", m,
+                   generateDestructor(graph, result.structs.threadvars),
+                   options)
 
   result.preInit = createModuleOp(graph, idgen, "PreInit", m, newNode(nkEmpty), options)
   result.postDestructor = createModuleOp(graph, idgen, "PostDeinit", m, newNode(nkEmpty), options)
+  result.threadPostDestructor =
+    createModuleOp(graph, idgen, "ThreadPostDeinit", m, newNode(nkEmpty),
+                   options)
   result.dynlibInit = createModuleOp(graph, idgen, "DynlibInit", m, newNode(nkEmpty), options)
 
 # Below is the `passes` interface implementation
diff --git a/lib/system/threads.nim b/lib/system/threads.nim
index 10eb3a00561..82c92745838 100644
--- a/lib/system/threads.nim
+++ b/lib/system/threads.nim
@@ -119,6 +119,10 @@ proc deallocOsPages() {.rtl, raises: [].}
 proc threadTrouble() {.raises: [], gcsafe.}
   ## defined in system/excpt.nim
 
+proc nimTeardownThreadVars() {.noconv, importc: "nimTeardownThreadVars".}
+  ## Generated by the compiler. Runs the destructor for every thread-local
+  ## variable.
+
 when true:
   proc threadProcWrapDispatch[TArg](thrd: ptr ThreadCore[TArg]) {.raises: [].} =
     try:
@@ -130,6 +134,7 @@ when true:
       threadTrouble()
     finally:
       afterThreadRuns()
+      nimTeardownThreadVars()
 
 template threadProcWrapperBody(closure: untyped): untyped =
   let core = cast[ptr ThreadCore[TArg]](closure)
diff --git a/tests/threads/mthreadvars_destruction.nim b/tests/threads/mthreadvars_destruction.nim
new file mode 100644
index 00000000000..540243e5aa2
--- /dev/null
+++ b/tests/threads/mthreadvars_destruction.nim
@@ -0,0 +1,15 @@
+type Object* = object
+  val*: int
+
+proc `=destroy`(x: var Object) =
+  if x.val != 0:
+    echo x.val
+
+let global = Object(val: 7)
+var tv1 {.threadvar.}: Object
+tv1 = Object(val: 8)
+
+proc init*() =
+  tv1 = Object(val: 3)
+  var tv2 {.threadvar.}: Object
+  tv2 = Object(val: 4)
diff --git a/tests/threads/tthreadvars_destruction.nim b/tests/threads/tthreadvars_destruction.nim
new file mode 100644
index 00000000000..50066a3c777
--- /dev/null
+++ b/tests/threads/tthreadvars_destruction.nim
@@ -0,0 +1,31 @@
+discard """
+  description: '''
+    Ensure that threadvars are destroyed and that the order is correct:
+    1. inter-module: the module closed last has threadvars destroyed first
+    2. intra-module:
+      i. top-level threadvars are destroyed, in reverse order of definition
+      ii. threadvars defined within routines are destroyed, in an
+         unspecified order
+
+    For the main thread, module-level threadvars are destroyed after top-level
+    thread-globals but before procedure-scoped threadvars and thread-globals.
+  '''
+  output: "1\n2\n3\n4\n5\n6\n7\n8\n"
+"""
+
+import mthreadvars_destruction
+
+# the threadvars and globals from this module are destoyed first
+let global = Object(val: 5)
+var tv1 {.threadvar.}: Object
+tv1 = Object(val: 6)
+
+proc run() {.thread.} =
+  tv1 = Object(val: 1)
+  var tv2 {.threadvar.}: Object
+  tv2 = Object(val: 2)
+
+  init()
+
+var t = (createThread[void])(run)
+t.joinThread()

From e224dbf00144cc715e1b1062627d7566d9ec6031 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Mon, 13 May 2024 23:30:46 +0200
Subject: [PATCH 089/169] add the `supportsZeroMem` type trait (#1307)

## Summary

The type trait is intended for libraries to figure out whether `zeroMem`
leaves a location in its "default-initialized" state, something that's
useful to know for optimization or correctness purposes in generic
code.

## Details

Without the type trait, either approximation via `is`, or a type-
inspection macro would have to be used. A built-in type trait is
better than a macro, since it's both more efficient and usable in
the `system` module.

The only types not supporting `zeroMem` for initialization are:
* types that don't have a zero-default (such as `range` types, enums
  not starting at zero, `.requiresInit` types, not-nil pointers, etc.)
* object types that have a type header field (non-pure object types
  that can be inherited from)
* incomplete package-level object types
* aggregate types containing the former three

The `nimskullHasSupportsZeroMem` conditional symbol is added so that
support for the type trait can be detected at compile-time.
---
 compiler/front/condsyms.nim                   |  1 +
 compiler/sem/semmagic.nim                     | 12 +++++++
 lib/pure/typetraits.nim                       |  6 ++++
 .../tno_supports_zero_mem.nim                 | 15 +++++++++
 tests/lang_objects/metatype/ttypetraits.nim   | 33 +++++++++++++++++++
 5 files changed, 67 insertions(+)
 create mode 100644 tests/lang_experimental/package_level_objects/tno_supports_zero_mem.nim

diff --git a/compiler/front/condsyms.nim b/compiler/front/condsyms.nim
index 9746de20026..3d88114beeb 100644
--- a/compiler/front/condsyms.nim
+++ b/compiler/front/condsyms.nim
@@ -77,3 +77,4 @@ proc initDefines*(symbols: StringTableRef) =
   defineSymbol("nimskullNewExceptionRt")
   defineSymbol("nimskullNoNkStmtListTypeAndNkBlockType")
   defineSymbol("nimskullNoNkNone")
+  defineSymbol("nimskullHasSupportsZeroMem")
diff --git a/compiler/sem/semmagic.nim b/compiler/sem/semmagic.nim
index a2e826b97a6..a4e6bdf1122 100644
--- a/compiler/sem/semmagic.nim
+++ b/compiler/sem/semmagic.nim
@@ -222,6 +222,18 @@ proc evalTypeTrait(c: PContext; traitCall: PNode, operand: PType, context: PSym)
     let complexObj = containsGarbageCollectedRef(t) or
                      hasDestructor(t)
     result = newIntNodeT(toInt128(ord(not complexObj)), traitCall, c.idgen, c.graph)
+  of "supportsZeroMem":
+    # Zero initialization is not valid for:
+    # * types requiring explicit initialization
+    # * partial types (package-level objects)
+    # * object types with a type header
+    proc pred(t: PType): bool =
+      # object with type header? or package-level object?
+      t.kind == tyObject and (not isObjLackingTypeField(t) or
+        sfForward in t.sym.flags)
+
+    let cond = requiresInit(operand) or searchTypeFor(operand, pred)
+    result = newIntNodeT(toInt128(ord(not cond)), traitCall, c.idgen, c.graph)
   of "isNamedTuple":
     var operand = operand.skipTypes({tyGenericInst})
     let cond = operand.kind == tyTuple and operand.n != nil
diff --git a/lib/pure/typetraits.nim b/lib/pure/typetraits.nim
index 2f210cbecb1..9b3877decfd 100644
--- a/lib/pure/typetraits.nim
+++ b/lib/pure/typetraits.nim
@@ -93,6 +93,12 @@ proc supportsCopyMem*(t: typedesc): bool {.magic: "TypeTrait".}
   ##
   ## Other languages name a type like these `blob`:idx:.
 
+proc supportsZeroMem*(t: typedesc): bool {.magic: "TypeTrait".}
+  ## This trait returns true if using `zeroMem`:idx: on a location of type `t`
+  ## brings the location into its "default-initialized" state. This doesn't
+  ## imply that using `zeroMem`:idx: on a location already storing a value is
+  ## valid.
+
 proc isNamedTuple*(T: typedesc): bool {.magic: "TypeTrait".} =
   ## Returns true for named tuples, false for any other type.
   runnableExamples:
diff --git a/tests/lang_experimental/package_level_objects/tno_supports_zero_mem.nim b/tests/lang_experimental/package_level_objects/tno_supports_zero_mem.nim
new file mode 100644
index 00000000000..03229b9b2ef
--- /dev/null
+++ b/tests/lang_experimental/package_level_objects/tno_supports_zero_mem.nim
@@ -0,0 +1,15 @@
+discard """
+  description: '''
+    Until completed, a package-level object type counts as not supporting
+    zero-initialization
+  '''
+  action: compile
+"""
+
+import std/typetraits
+
+type
+  mypackage.Foo = object
+
+static:
+  doAssert not supportsZeroMem(Foo)
diff --git a/tests/lang_objects/metatype/ttypetraits.nim b/tests/lang_objects/metatype/ttypetraits.nim
index acfe1e69559..631615dd5a9 100644
--- a/tests/lang_objects/metatype/ttypetraits.nim
+++ b/tests/lang_objects/metatype/ttypetraits.nim
@@ -388,3 +388,36 @@ block: # enum.len
     doAssert MyEnum.enumLen == 4
     doAssert OtherEnum.enumLen == 3
     doAssert MyFlag.enumLen == 4
+
+{.experimental: "strictNotNil".}
+
+block supports_zero_mem:
+  type
+    RequiresInit {.requiresInit.} = object
+    WithDestructor = object
+    Distinct = distinct int
+    PtrNotNil = ptr int not nil
+
+  proc `=destroy`(x: var WithDestructor) =
+    discard
+
+  # primitive types and built-in dynamic containers support zeroMem
+  doAssert supportsZeroMem(int)
+  doAssert supportsZeroMem((int, int))
+  doAssert supportsZeroMem(seq[int])
+  doAssert supportsZeroMem(Distinct)
+
+  # a type having a destructor doesn't preclude it from being initialize-able
+  # with zeroMem
+  doAssert supportsZeroMem(WithDestructor)
+
+  doAssert not supportsZeroMem(range[1..2])
+  doAssert not supportsZeroMem(openArray[int])
+  doAssert not supportsZeroMem(var int)
+  doAssert not supportsZeroMem(PtrNotNil)
+  # requiresInit types - and the types they're part of - do not support zeroMem
+  doAssert not supportsZeroMem(RequiresInit)
+  # knownIssue: the requiresInit condition isn't propagated to array and tuple
+  # types
+  doAssert supportsZeroMem(array[1, RequiresInit]), "works now"
+  doAssert supportsZeroMem((RequiresInit,)), "works now"

From bbb519af6f86d1e4357eb1557455497de8f006df Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Tue, 14 May 2024 01:00:52 +0000
Subject: [PATCH 090/169] build(deps): Bump softprops/action-gh-release from
 2.0.4 to 2.0.5 (#1309)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bumps

[softprops/action-gh-release](https://github.com/softprops/action-gh-release)
from 2.0.4 to 2.0.5.
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a

href="https://github.com/softprops/action-gh-release/releases">softprops/action-gh-release's
releases</a>.</em></p>
<blockquote>
<h2>v2.0.5</h2>
<ul>
<li>Factor in file names with spaces when upserting files <a

href="https://redirect.github.com/softprops/action-gh-release/pull/446">#446</a>
via <a
href="https://github.com/MystiPanda"><code>@​MystiPanda</code></a></li>
<li>Improvements to error handling <a

href="https://redirect.github.com/softprops/action-gh-release/pull/449">#449</a>
via <a href="https://github.com/till"><code>@​till</code></a></li>
</ul>
</blockquote>
</details>
<details>
<summary>Changelog</summary>
<p><em>Sourced from <a

href="https://github.com/softprops/action-gh-release/blob/master/CHANGELOG.md">softprops/action-gh-release's
changelog</a>.</em></p>
<blockquote>
<h2>2.0.5</h2>
<ul>
<li>Factor in file names with spaces when upserting files <a

href="https://redirect.github.com/softprops/action-gh-release/pull/446">#446</a>
via <a
href="https://github.com/MystiPanda"><code>@​MystiPanda</code></a></li>
<li>Improvements to error handling <a

href="https://redirect.github.com/softprops/action-gh-release/pull/449">#449</a>
via <a href="https://github.com/till"><code>@​till</code></a></li>
</ul>
</blockquote>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a

href="https://github.com/softprops/action-gh-release/commit/69320dbe05506a9a39fc8ae11030b214ec2d1f87"><code>69320db</code></a>
update changelog</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/9771ccf55ff16f083af69228ef39c5da2c54f02b"><code>9771ccf</code></a>
update changelog rebuild dist</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/0a76e4214a22dfa2946790a0b56e12720488e0d2"><code>0a76e42</code></a>
Fix: error handling (<a

href="https://redirect.github.com/softprops/action-gh-release/issues/449">#449</a>)</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/3989e4b325fd35af0f19f42a37021d50b48b77e0"><code>3989e4b</code></a>
document impl detail</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/72e945e627950fcf3856e5ed050e717cba6004fd"><code>72e945e</code></a>
update changelog</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/40bf9ec7aa10e323231ddc29feb3b271d2432b7e"><code>40bf9ec</code></a>
fmt and build</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/998623f0c3438e2dc850076c2ac4d7ceeed7c000"><code>998623f</code></a>
fix: support space in file name (<a

href="https://redirect.github.com/softprops/action-gh-release/issues/446">#446</a>)</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/0979303f0222052f8b9e0d89ccaba124618f4abf"><code>0979303</code></a>
Fix failure (<a

href="https://redirect.github.com/softprops/action-gh-release/issues/447">#447</a>)</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/9b795e578288d5ff64564dfa7dd4cda7b04bb648"><code>9b795e5</code></a>
Update README.md (<a

href="https://redirect.github.com/softprops/action-gh-release/issues/432">#432</a>)</li>
<li>See full diff in <a

href="https://github.com/softprops/action-gh-release/compare/v2.0.4...v2.0.5">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility

score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=softprops/action-gh-release&package-manager=github_actions&previous-version=2.0.4&new-version=2.0.5)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase` .

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 .github/workflows/publisher.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/publisher.yml b/.github/workflows/publisher.yml
index fb8c0790fb9..5398dfb6e39 100644
--- a/.github/workflows/publisher.yml
+++ b/.github/workflows/publisher.yml
@@ -101,7 +101,7 @@ jobs:
 
       - id: release
         name: Create pre-release
-        uses: softprops/action-gh-release@v2.0.4
+        uses: softprops/action-gh-release@v2.0.5
         with:
           prerelease: true
           files: ${{ steps.release-files.outputs.result }}

From 1d644ababb3c29ba8d8740ebb247407300da9d10 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Tue, 14 May 2024 22:59:55 +0200
Subject: [PATCH 091/169] always clear slots when growing `seq` with `setLen`
 (#1306)

## Summary

Growing a `seq[T]` with `setLen` after shrinking it now doesn't retain
the slots' previous state, default-initializing them instead. This was
already the behaviour for destructor-having element types, but not for
other types.

## Details

For efficiency, two optimizations are used:
* the slots' memory is only default-initialized when *growing* with
  `setLen`, not when shrinking
* if the element type supports it, a single `zeroMem` call is used for
  clearing the new slots after growing

For types that don't support `zeroMem`, `default(T)` is assigned to
every new slot, which fixes the type header of non-pure inheritable
objects not being initialized (and `of` thus crashing).

The `seq` implementation procedures have to assume that after resizing,
the memory of the new slots is in an undefined state, which means that
hook calls (`=copy` or `=sink`) must not be used. This is guaranteed by
performing the assignments within `.nodestroy` procedures.

Since slot assignments never expand to hook calls now, the payload
memory doesn't have to be zero'ed on allocation anymore.
---
 lib/system/seqs_v2.nim                  | 47 ++++++++++++++++++++---
 tests/stdlib/types/collections/tseq.nim | 51 +++++++++++++++++++++++++
 2 files changed, 92 insertions(+), 6 deletions(-)

diff --git a/lib/system/seqs_v2.nim b/lib/system/seqs_v2.nim
index b0af6d67f1d..7751c1aff1f 100644
--- a/lib/system/seqs_v2.nim
+++ b/lib/system/seqs_v2.nim
@@ -12,6 +12,12 @@
 # strs already imported allocateds for us.
 
 proc supportsCopyMem(t: typedesc): bool {.magic: "TypeTrait".}
+when defined(nimskullHasSupportsZeroMem):
+  proc supportsZeroMem(t: typedesc): bool {.magic: "TypeTrait".}
+else:
+  # approximate detection of whether a type supports zeroMem
+  template supportsZeroMem(t: typedesc): bool =
+    t is (SomeNumber or enum or ptr or ref or pointer or proc or seq or string)
 
 ## Default seq implementation used by Nim's core.
 type
@@ -35,7 +41,7 @@ proc newSeqPayload(cap, elemSize, elemAlign: int): pointer {.compilerRtl, raises
   # we have to use type erasure here as Nim does not support generic
   # compilerProcs. Oh well, this will all be inlined anyway.
   if cap > 0:
-    var p = cast[ptr NimSeqPayloadBase](alignedAlloc0(align(sizeof(NimSeqPayloadBase), elemAlign) + cap * elemSize, elemAlign))
+    var p = cast[ptr NimSeqPayloadBase](alignedAlloc(align(sizeof(NimSeqPayloadBase), elemAlign) + cap * elemSize, elemAlign))
     p.cap = cap
     result = p
   else:
@@ -62,14 +68,14 @@ proc prepareSeqAdd(len: int; p: pointer; addlen, elemSize, elemAlign: int): poin
       let oldCap = p.cap and not strlitFlag
       let newCap = max(resize(oldCap), len+addlen)
       if (p.cap and strlitFlag) == strlitFlag:
-        var q = cast[ptr NimSeqPayloadBase](alignedAlloc0(headerSize + elemSize * newCap, elemAlign))
+        var q = cast[ptr NimSeqPayloadBase](alignedAlloc(headerSize + elemSize * newCap, elemAlign))
         copyMem(q +! headerSize, p +! headerSize, len * elemSize)
         q.cap = newCap
         result = q
       else:
         let oldSize = headerSize + elemSize * oldCap
         let newSize = headerSize + elemSize * newCap
-        var q = cast[ptr NimSeqPayloadBase](alignedRealloc0(p, oldSize, newSize, elemAlign))
+        var q = cast[ptr NimSeqPayloadBase](alignedRealloc(p, oldSize, newSize, elemAlign))
         q.cap = newCap
         result = q
 
@@ -77,13 +83,18 @@ proc shrink*[T](x: var seq[T]; newLen: Natural) =
   when nimvm:
     setLen(x, newLen)
   else:
-    #sysAssert newLen <= x.len, "invalid newLen parameter for 'shrink'"
     when not supportsCopyMem(T):
+      # destroy all cut-off items, but don't reset the memory yet
       for i in countdown(x.len - 1, newLen):
-        reset x[i]
+        `=destroy`(x[i])
+
     # XXX This is wrong for const seqs that were moved into 'x'!
     cast[ptr NimSeqV2[T]](addr x).len = newLen
 
+proc rawAssign[T](dest: var T, value: sink T) {.inline, nodestroy.} =
+  # the copy takes place at the callsite, only a blit copy is performed here
+  dest = value
+
 proc grow*[T](x: var seq[T]; newLen: Natural; value: T) =
   let oldLen = x.len
   #sysAssert newLen >= x.len, "invalid newLen parameter for 'grow'"
@@ -93,7 +104,13 @@ proc grow*[T](x: var seq[T]; newLen: Natural; value: T) =
     xu.p = cast[typeof(xu.p)](prepareSeqAdd(oldLen, xu.p, newLen - oldLen, sizeof(T), alignof(T)))
   xu.len = newLen
   for i in oldLen .. newLen-1:
-    xu.p.data[i] = value
+    when supportsCopyMem(T):
+      # no copy hook exists, a direct assignment can be used
+      xu.p.data[i] = value
+    else:
+      # the slot is in an unknown state, so a direct assignment (which would
+      # invoke the copy hook) cannot be used
+      rawAssign(xu.p.data[i], value)
 
 proc add*[T](x: var seq[T]; value: sink T) {.magic: "AppendSeqElem", noSideEffect, nodestroy.} =
   ## Generic proc for adding a data item `y` to a container `x`.
@@ -113,6 +130,19 @@ proc add*[T](x: var seq[T]; value: sink T) {.magic: "AppendSeqElem", noSideEffec
   # We also save the `wasMoved + destroy` pair for the sink parameter.
   xu.p.data[oldLen] = value
 
+{.push checks: off.}
+
+proc prepareSeqSlots[T](xu: ptr NimSeqV2[T],
+                        oldLen, newLen: int) {.inline, nodestroy.} =
+  var i = oldLen
+  while i < newLen:
+    # the memory is in an unknown state, and ``.nodestroy`` makes sure that
+    # the assignment is a blit-copy
+    xu.p.data[i] = default(T)
+    inc i
+
+{.pop.}
+
 proc setLen[T](s: var seq[T], newlen: Natural) =
   {.noSideEffect.}:
     if newlen < s.len:
@@ -124,6 +154,11 @@ proc setLen[T](s: var seq[T], newlen: Natural) =
       if xu.p == nil or xu.p.cap < newlen:
         xu.p = cast[typeof(xu.p)](prepareSeqAdd(oldLen, xu.p, newlen - oldLen, sizeof(T), alignof(T)))
       xu.len = newlen
+      when supportsZeroMem(T):
+        # optimization: clear the whole memory region in one go
+        zeroMem(addr xu.p.data[oldLen], (newlen - oldLen) * sizeof(T))
+      else:
+        prepareSeqSlots(xu, oldLen, newlen)
 
 proc newSeq[T](s: var seq[T], len: Natural) =
   shrink(s, 0)
diff --git a/tests/stdlib/types/collections/tseq.nim b/tests/stdlib/types/collections/tseq.nim
index 16a242ae6de..dd62eb0a5a2 100644
--- a/tests/stdlib/types/collections/tseq.nim
+++ b/tests/stdlib/types/collections/tseq.nim
@@ -201,3 +201,54 @@ for i in 0..100:
   var test = newSeqOfCap[uint32](1)
   test.setLen(1)
   doAssert test[0] == 0, $(test[0], i)
+
+block shrink_resets:
+  # ensure that the cut-off items are in the default state after shrinking and
+  # then growing the seq
+  var s = newSeq[int](10) # with primitive type
+  for it in s.mitems:
+    it = 1
+
+  s.setLen(5)
+  s.setLen(6) # grow again
+  doAssert s[5] == 0
+
+block shrink_resets_with_destructor:
+  # test with type that requires destruction
+  type Obj = object
+    has: bool
+
+  var destroyed {.global.} = 0
+
+  proc `=destroy`(x: var Obj) =
+    if x.has:
+      inc destroyed
+
+  var s = newSeq[Obj](10)
+  for it in s.mitems:
+    it = Obj(has: true)
+
+  s.setLen(5)
+  doAssert destroyed == 5
+  s.setLen(6)
+  doAssert s[5].has == false
+
+block item_with_type_field:
+  # ensure that objects with type fields have their type fields initialized
+  # properly, both when created via ``newSeq`` and when grown via ``setLen``
+  type Obj = object of RootObj
+
+  proc test(x: ptr RootObj) =
+    # if the type field wasn't initialized, the `of` check is going to crash
+    # with a nil-access defect
+    doAssert x of Obj
+
+  # after ``newSeq``:
+  var s: seq[Obj]
+  s.newSeq(1)
+  test(addr s[0])
+
+  # after ``setLen`` (a fresh, empty seq is used so that the seq really grows):
+  var s2: seq[Obj]
+  s2.setLen(1)
+  test(addr s2[0])

From 2f3fba00e3da7389ea240e1b4791fe41e5648680 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Wed, 15 May 2024 00:07:21 +0200
Subject: [PATCH 092/169] profiler: prevent infinite recursion (#1310)

## Summary

The profiler runtime enabled with `--profiler:on` now guards against
infinite recursion when the profiler callbacks call instrumented
procedures. This fixes crashes caused by a stack overflow when
using `nimprof`.

## Details

* a thread-local boolean is used to guard against `nimProfile`
  recursing
* the workaround previously required in `tprofiler.nim` is obsolete
  and thus removed
---
 lib/system/profiler.nim              | 19 +++++++++++++++----
 tests/compilerfeatures/tprofiler.nim |  4 ----
 2 files changed, 15 insertions(+), 8 deletions(-)

diff --git a/lib/system/profiler.nim b/lib/system/profiler.nim
index 0649f117674..63216e5750c 100644
--- a/lib/system/profiler.nim
+++ b/lib/system/profiler.nim
@@ -63,6 +63,15 @@ var
   profilingRequestedHook*: proc (): bool {.nimcall, locks: 0, gcsafe.}
     ## set this variable to provide a procedure that implements a profiler in
     ## user space. See the `nimprof` module for a reference implementation.
+  profilerGuard {.threadvar.}: bool
+
+template guard(body: untyped) =
+  # prevent infinite recursion when the profiler callbacks call instrumented
+  # procedures
+  if not profilerGuard:
+    profilerGuard = true
+    body
+    profilerGuard = false
 
 when defined(memProfiler):
   type
@@ -79,8 +88,9 @@ when defined(memProfiler):
     hook(st, requestedSize)
 
   proc nimProfile(requestedSize: int) =
-    if not isNil(profilingRequestedHook) and profilingRequestedHook():
-      callProfilerHook(profilerHook, requestedSize)
+    guard:
+      if not isNil(profilingRequestedHook) and profilingRequestedHook():
+        callProfilerHook(profilerHook, requestedSize)
 else:
   var
     profilerHook*: ProfilerHook
@@ -97,7 +107,8 @@ else:
 
   proc nimProfile() =
     ## This is invoked by the compiler in every loop and on every proc entry!
-    if not isNil(profilingRequestedHook) and profilingRequestedHook():
-      callProfilerHook(profilerHook)
+    guard:
+      if not isNil(profilingRequestedHook) and profilingRequestedHook():
+        callProfilerHook(profilerHook)
 
 {.pop.}
diff --git a/tests/compilerfeatures/tprofiler.nim b/tests/compilerfeatures/tprofiler.nim
index 88e71fe8f4d..ad3955c57e8 100644
--- a/tests/compilerfeatures/tprofiler.nim
+++ b/tests/compilerfeatures/tprofiler.nim
@@ -21,14 +21,10 @@ var
 
 proc enabledCallback(): bool =
   result = enabled
-  # XXX: an issue with the profiler runtime requires disabling the callback
-  #      until the `profileCallback` is done
-  enabled = false
 
 proc profileCallback(st: StackTrace) =
   traces[numTraces] = st
   inc numTraces
-  enabled = true # re-enable
 
 {.pop.}
 

From a6d4723ea9590be11ab99c03b34063d2ef2ceed7 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Fri, 17 May 2024 23:16:08 +0200
Subject: [PATCH 093/169] fix: move analyzer regression with variants (#1311)

## Summary

Separate the `switch` lowering and destructor injection into two proper
passes and apply them concurrently, fixing a move analyzer regression.

## Details

* move the `switch` lowering out of `injectDestructorCalls`
* pass a `Changeset` instead of a mutable `MirBody` to the two passes
  in `injectdestructors`
* destructor injection and `switch` lowering are applied in a single
  batch by `backends.process`
* the `switch` lowering is still disabled for the VM backend
* update the doc comment of `injectDestructorCalls` to reflect reality

### Move Analyzer

Applying both passes concurrently - instead of running destructor
injection and move analysis after the `switch` lowering - fixes a
regression from ae543125c222693c915e3cfaa3cc3edb0110c569.

The move analyzer now sees a discriminator assignment as:
```nim
x.discr = y
```
instead of:
```nim
if x.discr != y:
  =destroy(x) # variant destructor
x.discr = y
```

allowing it to perform automatic moves from non-variant fields again
(refer to `tmove_from_non_variant_field.nim`).

### Misc

* fix MIR pretty-printing for object/ref constructors -- the colon was
  missing between the field and value
---
 compiler/backend/backends.nim                 | 14 ++++-
 compiler/mir/utils.nim                        |  1 +
 compiler/sem/injectdestructors.nim            | 61 ++++++-------------
 .../tmove_from_non_variant_field.nim          | 43 +++++++++++++
 4 files changed, 77 insertions(+), 42 deletions(-)
 create mode 100644 tests/optimization/tmove_from_non_variant_field.nim

diff --git a/compiler/backend/backends.nim b/compiler/backend/backends.nim
index a7f253043d5..d15d892dee5 100644
--- a/compiler/backend/backends.nim
+++ b/compiler/backend/backends.nim
@@ -26,6 +26,7 @@ import
     injecthooks,
     mirbodies,
     mirbridge,
+    mirchangesets,
     mirconstr,
     mirenv,
     mirgen,
@@ -347,7 +348,18 @@ proc process(body: var MirBody, prc: PSym, graph: ModuleGraph,
   ## Applies all applicable MIR passes to the `body`. `prc` is the enclosing
   ## procedure.
   if shouldInjectDestructorCalls(prc):
-    injectDestructorCalls(graph, idgen, env, prc, body)
+    block:
+      var c = initChangeset(body)
+      injectDestructorCalls(body.code, graph, env, c)
+      # XXX: ``vmgen`` doesn't support the code resulting from the switch
+      #      lowering, so branch destructors are disabled for the VM target
+      #      at the moment
+      if graph.config.backend != backendNimVm:
+        lowerBranchSwitch(body.code, graph, idgen, env, c)
+      body.apply(c)
+
+    # hook injection needs to happen *after* move analysis and destroy
+    # injection
     injectHooks(body, graph, env, prc)
 
     if graph.config.arcToExpand.hasKey(prc.name.s):
diff --git a/compiler/mir/utils.nim b/compiler/mir/utils.nim
index b5fe4cb5b9a..d0963a050af 100644
--- a/compiler/mir/utils.nim
+++ b/compiler/mir/utils.nim
@@ -418,6 +418,7 @@ proc exprToStr(nodes: MirTree, i: var int, result: var string, c: RenderCtx) =
     tree "(":
       commaSeparated:
         fieldToStr(next(nodes, i).field, typ, result, c)
+        result.add ": "
         argToStr()
       result.add ")"
   of mnkCall:
diff --git a/compiler/sem/injectdestructors.nim b/compiler/sem/injectdestructors.nim
index e33517292d2..be260e88740 100644
--- a/compiler/sem/injectdestructors.nim
+++ b/compiler/sem/injectdestructors.nim
@@ -826,56 +826,35 @@ func shouldInjectDestructorCalls*(owner: PSym): bool =
      {sfInjectDestructors, sfGeneratedOp} * owner.flags == {sfInjectDestructors} and
      (owner.kind != skIterator or not isInlineIterator(owner.typ))
 
-proc injectDestructorCalls*(g: ModuleGraph, idgen: IdGenerator,
-                            env: var MirEnv, owner: PSym,
-                            body: var MirBody) =
-  ## The ``injectdestructors`` pass entry point. The pass is made up of
-  ## multiple sub-passes, hence the mutable `body` (as opposed
-  ## to returning a ``Changeset``).
-  ##
-  ## For now, semantic errors and other diagnostics related to lifetime-hook
-  ## usage are also reported here.
-
-  # apply the first batch of passes:
-  block:
-    var changes = initChangeset(body)
-    # the VM implements branch switching itself - performing the lowering for
-    # code meant to run in it would be harmful
-    # FIXME: discriminant assignment lowering also needs to be disabled for
-    #        when generating code running at compile-time (e.g. inside a
-    #        macro)
-    # XXX: the lowering is *always* necessary, as the destructors for
-    #      fields inside switched-away-from branches won't be called
-    #      otherwise
-    # TODO: make the branch-switch lowering a separate and standalone pass --
-    #       it's not directly related to the rest of the processing here
-    if g.config.backend != backendNimVm:
-      for i, n in body.code.pairs:
-        if n.kind == mnkSwitch:
-          changes.replaceMulti(body.code, i, buf):
-            lowerBranchSwitch(buf, body.code, g, idgen, env, i)
-
-    body.apply(changes)
-
-  # apply the second batch of passes:
+proc lowerBranchSwitch*(tree: MirTree, g: ModuleGraph, idgen: IdGenerator,
+                        env: var MirEnv, changes: var Changeset) =
+  ## Lowers ``mnkSwitch`` operations into normal assignments, with a branch
+  ## destructor injected if the respective record-case requires it (i.e.,
+  ## because it contains fields requiring destruction).
+  for i, n in tree.pairs:
+    if n.kind == mnkSwitch:
+      changes.replaceMulti(tree, i, buf):
+        lowerBranchSwitch(buf, tree, g, idgen, env, i)
+
+proc injectDestructorCalls*(tree: MirTree, g: ModuleGraph, env: var MirEnv,
+                            changes: var Changeset) =
+  ## Collapses sink assignments into either copy or move assignments, and
+  ## injects the destroy operations for all entities requiring destruction.
   block:
     var
-      changes = initChangeset(body)
-      actx = AnalyseCtx(graph: g, cfg: computeDfg(body.code))
+      actx = AnalyseCtx(graph: g, cfg: computeDfg(tree))
 
     let
-      entities = initEntityDict(body.code, actx.cfg, env)
-      moves = collapseSink(body.code, actx.cfg, entities, env.types)
+      entities = initEntityDict(tree, actx.cfg, env)
+      moves = collapseSink(tree, actx.cfg, entities, env.types)
 
-    let destructors = computeDestructors(body.code, actx.cfg, entities)
+    let destructors = computeDestructors(tree, actx.cfg, entities)
 
     rewriteAssignments(
-      body.code, actx,
+      tree, actx,
       AnalysisResults(moves: cursor(moves),
                       entities: cursor(entities),
                       destroy: cursor(destructors)),
       env.types, changes)
 
-    injectDestructors(body.code, g, destructors, env, changes)
-
-    body.apply(changes)
+    injectDestructors(tree, g, destructors, env, changes)
diff --git a/tests/optimization/tmove_from_non_variant_field.nim b/tests/optimization/tmove_from_non_variant_field.nim
new file mode 100644
index 00000000000..485d96d5984
--- /dev/null
+++ b/tests/optimization/tmove_from_non_variant_field.nim
@@ -0,0 +1,43 @@
+discard """
+  description: '''
+    Ensure that a discriminator assignment doesn't prevent automatic moves
+    from fields outside the record-case
+  '''
+  action: compile
+  matrix: "--expandArc:test --checks:off"
+  nimout: '''--expandArc: test
+scope:
+  def _3: WithHooks = ()
+  def x: Object = (a: consume _3, kind: consume true)
+  bind_mut _4: WithHooks = x.a
+  result := move _4
+  wasMoved(name _4)
+  bind_mut _5: bool = x.kind
+  def _6: bool = copy kind
+  def _7: bool = eqB(arg _5, arg _6)
+  def _8: bool = not(arg _7)
+  if _8:
+    =destroy(name x)
+  _5 = _6
+  =destroy(name x)
+
+-- end of expandArc ------------------------'''
+"""
+
+type
+  WithHooks = object
+  Object = object
+    a: WithHooks
+    case kind: bool
+    of true, false:
+      b: WithHooks
+
+proc `=destroy`(x: var WithHooks) =
+  discard
+
+proc test(kind: bool): WithHooks {.exportc.} =
+  var x = Object(a: WithHooks(), kind: true)
+  result = x.a # can be moved
+  # the discriminator assignment must not prevent `x.a` from being moved
+  # out of `x`
+  x.kind = kind

From 39c85f08dc18a8cbb1f2d0d4feebeb298414087a Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sat, 18 May 2024 02:04:51 +0200
Subject: [PATCH 094/169] internal: use AST for dynlib loaders (#1312)

## Summary

Instead of directly producing MIR code for the dynlib loaders, first
produce an AST that is then translated to the MIR, reducing the amount
of code that needs to be adjusted when the MIR changes.

## Details

Generating an intermediate AST means that `mirgen` can fully be
leveraged for the translation, instead of only partially, which ensures
proper translation even when the MIR changes.

The `mirgen.generateCode` overload for appending to an existing
`MirBuilder` is now obsolete and thus removed. In addition, the pre-
and post-MIR-translation body for dynlib loaders can now be echoed via
the `-d:nimShowMirInput` and `-d:nimShowMir` debug facilities.
---
 compiler/backend/backends.nim | 171 +++++++++++++++-------------------
 compiler/mir/mirgen.nim       |  37 ++------
 2 files changed, 81 insertions(+), 127 deletions(-)

diff --git a/compiler/backend/backends.nim b/compiler/backend/backends.nim
index d15d892dee5..4e2d1ab070a 100644
--- a/compiler/backend/backends.nim
+++ b/compiler/backend/backends.nim
@@ -466,75 +466,80 @@ proc produceFragmentsForGlobals(
 
 # ----- dynlib handling -----
 
-proc genLoadLib(bu: var MirBuilder, graph: ModuleGraph, env: var MirEnv,
-                loc, name: Value): Value =
-  ## Emits the MIR code for ``loc = nimLoadLibrary(name); loc.isNil``.
-  let loadLib = graph.getCompilerProc("nimLoadLibrary")
-
-  bu.subTree MirNode(kind: mnkAsgn):
-    bu.use loc
-    bu.buildCall env.procedures.add(loadLib), env.types.add(loadLib.typ[0]):
-      bu.emitByVal name
-
-  bu.wrapTemp(BoolType):
-    bu.buildMagicCall mIsNil, BoolType:
-      bu.emitByVal loc
-
-proc genLibSetup(graph: ModuleGraph, env: var MirEnv, conf: BackendConfig,
-                 libVar: GlobalId, path: PNode,
-                 bu: var MirBuilder, source: var SourceMap) =
-  ## Emits the MIR code for loading a dynamic library to `dest`, with `name`
-  ## being the symbol of the location that stores the handle and `path` the
-  ## expression used with the ``.dynlib`` pragma.
+proc newCall(sym: PSym, info: TLineInfo, args: varargs[PNode]): PNode =
+  # if the symbol has no type (likely because it's a magic), use nil for the
+  # type and have ``mirgen`` figure it out
+  result = newTreeIT(nkCall, info, (if sym.typ != nil: sym.typ[0] else: nil))
+  result.add newSymNode(sym)
+  for it in args.items:
+    result.add it
+
+proc newBoolCall(sym: PSym, info: TLineInfo, graph: ModuleGraph,
+                 a: PNode; b = PNode(nil)): PNode =
+  result = newTreeIT(nkCall, info, graph.getSysType(unknownLineInfo, tyBool))
+  result.add newSymNode(sym)
+  result.add a
+  if b != nil:
+    result.add b
+
+proc genLoadLib(graph: ModuleGraph, loc, name: PNode): PNode =
+  ## Generates the AST for ``loc = nimLoadLibrary(name); loc.isNil``.
+  let
+    loadLib = graph.getCompilerProc("nimLoadLibrary")
+    typ = graph.getSysType(unknownLineInfo, tyBool)
+
+  result = nkStmtListExpr.newTreeIT(loc.info, typ,
+    newTree(nkAsgn, loc, newCall(loadLib, loc.info, name)),
+    newBoolCall(graph.operators.opIsNil, loc.info, graph, loc))
+
+proc genLibSetup(graph: ModuleGraph, libVar: PNode, path: PNode): PNode =
+  ## Generates the AST for a statement loading and assigning a dynlib handle
+  ## to `libVar`, with `path` being the expression used with the ``.dynlib``
+  ## pragma.
   let
     errorProc = graph.getCompilerProc("nimLoadLibraryError")
-    val       = toValue(libVar, env.types.add(env[libVar].typ))
 
   if path.kind in nkStrKinds:
     # the library name is known at compile-time
     var candidates: seq[string]
     libCandidates(path.strVal, candidates)
 
-    let outer = LabelId(1) # labels are 1-based
-
-    # generate an 'or' chain that tries every candidate until one is found
+    # generate an 'and' chain that tries every candidate until one is found
     # for which loading succeeds
-    bu.subTree MirNode(kind: mnkBlock, label: outer):
-      bu.add MirNode(kind: mnkStmtList) # manual, for less visual nesting
-      for candidate in candidates.items:
-        var tmp = genLoadLib(bu, graph, env, val):
-          literal(env.getOrIncl(candidate), StringType)
-
-        tmp = bu.wrapTemp(BoolType):
-          bu.buildMagicCall mNot, BoolType:
-            bu.emitByVal tmp
-
-        bu.subTree mnkIf:
-          bu.use tmp
-          bu.add MirNode(kind: mnkBreak, label: outer)
-
-      # if none of the candidates worked, a run-time error is reported:
-      bu.subTree mnkVoid:
-        bu.buildCall env.procedures.add(errorProc), VoidType:
-          bu.emitByVal literal(env.getOrIncl(path.strVal), StringType)
-      bu.add endNode(mnkStmtList)
+    var check = PNode(nil)
+    for candidate in candidates.items:
+      let e = genLoadLib(graph, libVar):
+        newStrNode(candidate, errorProc.typ[1])
+      if check.isNil:
+        check = e
+      else:
+        check = newBoolCall(graph.operators.opAnd, path.info, graph, check, e)
+
+    assert check != nil
+    # if all candidates failed, the error reporting proc is called
+    result = nkIfStmt.newTree(
+      nkElifBranch.newTree(check, newCall(errorProc, path.info, path)))
   else:
     # the name of the dynamic library to load the procedure from is only known
     # at run-time
-    let nameTemp = bu.allocTemp(StringType)
-    bu.buildStmt mnkDef:
-      bu.use nameTemp
-      generateCode(graph, env, conf.tconfig, path, bu, source)
-
-    let cond = genLoadLib(bu, graph, env, val, nameTemp)
-    bu.subTree mnkIf:
-      bu.use cond
-      bu.subTree mnkVoid:
-        bu.buildCall env.procedures.add(errorProc), VoidType:
-          bu.emitByVal nameTemp
+
+    # since the temporary is translated to MIR immediately afterwards, using
+    # nil as the owner is fine
+    let tmp = newSym(skLet, graph.cache.getIdent(":tmp"), nextSymId graph.idgen,
+                     nil, path.info, path.typ)
+    # the expression is captured in a temporary first, which is then passed to
+    # ``nimLoadLibrary``
+    result = nkStmtList.newTree(
+      nkLetSection.newTree(
+        nkIdentDefs.newTree(newSymNode(tmp), graph.emptyNode, path)),
+      nkIfStmt.newTree(
+        nkElifBranch.newTree(
+          genLoadLib(graph, libVar, newSymNode(tmp)),
+          newCall(errorProc, path.info, newSymNode(tmp)))))
 
 proc produceLoader(graph: ModuleGraph, m: Module, data: var DiscoveryData,
-                   env: var MirEnv, conf: BackendConfig, sym: PSym): MirBody =
+                   env: var MirEnv, conf: BackendConfig,
+                   owner, sym: PSym): MirBody =
   ## Produces a MIR fragment with the load-at-run-time logic for procedure/
   ## variable `sym`. If not generated already, the loading logic for the
   ## necessary dynamic library is emitted into the fragment and the global
@@ -544,21 +549,11 @@ proc produceLoader(graph: ModuleGraph, m: Module, data: var DiscoveryData,
     loadProc = graph.getCompilerProc("nimGetProcAddr")
     path     = transformExpr(graph, m.idgen, m.sym, lib.path)
     extname  = newStrNode(nkStrLit, sym.extname)
+    magic    = createMagic(graph, graph.idgen, "asgnDynlibVar", mAsgnDynlibVar)
 
   extname.typ = graph.getSysType(lib.path.info, tyCstring)
 
-  var bu = initBuilder(result.source.add(path))
-  discard bu.addLocal(Local()) # empty result slot
-
-  let dest =
-    if sym.kind in routineKinds:
-      toValue(env.procedures[sym], env.types.add(sym.typ))
-    else:
-      toValue(env.globals[sym], env.types.add(sym.typ))
-
-  # the scope makes sure that locals are destroyed once loading the
-  # procedure has finished
-  bu.add MirNode(kind: mnkScope)
+  var body: PNode
 
   if path.kind in nkCallKinds and path.typ != nil and
      path.typ.kind in {tyPointer, tyProc}:
@@ -566,41 +561,25 @@ proc produceLoader(graph: ModuleGraph, m: Module, data: var DiscoveryData,
     path[^1] = extname # update to the correct name
     # XXX: ^^ maybe sem should do this instead...
 
-    let tmp = bu.allocTemp(dest.typ)
-    bu.buildStmt mnkDef:
-      bu.use tmp
-      generateCode(graph, env, conf.tconfig, path, bu, result.source)
-    bu.subTree mnkVoid:
-      bu.buildMagicCall mAsgnDynlibVar, VoidType:
-        bu.emitByName(dest, ekReassign)
-        bu.emitByVal(tmp)
+    body = newCall(magic, path.info): [newSymNode(sym), path]
   else:
     # the imported procedure is identified by the symbol's external name and
     # the built-in proc loading logic is to be used
-    let
-      isNew = lib.name in env.globals
-      libVar = env.globals.add(lib.name)
-      rtyp = env.types.add(loadProc.typ[0])
-
-    if not isNew:
+    body = newTree(nkStmtList)
+    if lib.name notin env.globals:
       # the library hasn't been loaded yet
-      genLibSetup(graph, env, conf, libVar, path, bu, result.source)
+      body.add genLibSetup(graph, newSymNode(lib.name), path)
       if path.kind in nkStrKinds: # only register statically-known dependencies
         data.libs.add sym.annex
 
-    # generate the code for ``sym = cast[typ](nimGetProcAddr(lib, extname))``
-    let tmp = bu.wrapTemp(rtyp):
-      bu.buildCall env.procedures.add(loadProc), rtyp:
-        bu.emitByVal toValue(libVar, env.types.add(lib.name.typ))
-        bu.emitByVal literal(env.getOrIncl(extname.strVal), CstringType)
-
-    bu.subTree mnkVoid:
-      bu.buildMagicCall mAsgnDynlibVar, VoidType:
-        bu.emitByName(dest, ekReassign)
-        bu.emitByVal tmp
+    # generate the AST for ``asgnDynlibVar(sym, nimGetProcAddr(lib, extname))``
+    body.add newCall(magic, path.info, [
+      newSymNode(sym),
+      newCall(loadProc, path.info, newSymNode(lib.name), extname)])
 
-  bu.add endNode(mnkScope)
-  (result.code, result.locals) = finish(bu, result.locals)
+  echoInput(graph.config, sym, body)
+  result = generateCode(graph, env, owner, conf.tconfig, body)
+  echoMir(graph.config, sym, result)
 
 # ----- discovery and queueing logic -----
 
@@ -806,7 +785,7 @@ iterator process*(graph: ModuleGraph, modules: var ModuleList,
     if exfDynamicLib in it.extFlags:
       let module = moduleId(it).FileIndex
       var frag = produceLoader(graph, modules[module], discovery, env, conf,
-                               it)
+                               modules[module].dynlibInit, it)
       pushProgress(modules[module].dynlibInit, frag, module)
 
   # let the entities discovered while producing the loaders "bleed" over
@@ -868,7 +847,7 @@ iterator process*(graph: ModuleGraph, modules: var ModuleList,
 
       # ... then produce the loader code
       let frag = produceLoader(graph, modules[module], discovery, env, conf,
-                               env[id])
+                               modules[module].dynlibInit, env[id])
       pushProgress(modules[module].dynlibInit, frag, module)
     of wikReport:
       reportBody(item.fragId, module, item.evt, item.frag)
diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index b4331ee8b77..6c36f31a68d 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -1084,7 +1084,7 @@ proc genMagic(c: var TCtx, n: PNode; m: TMagic) =
         arg n[2]
     else:
       genCall(c, n)
-  of mNot, mLtI, mLengthSeq, mLengthStr, mSamePayload:
+  of mNot, mLtI, mLengthSeq, mLengthStr, mSamePayload, mIsNil:
     if n[0].typ == nil:
       # simple translation. None of the arguments need to be passed by lvalue
       c.buildMagicCall m, rtyp:
@@ -1111,6 +1111,11 @@ proc genMagic(c: var TCtx, n: PNode; m: TMagic) =
       # The normal one doesn't (see ``cyclebreaker.getDynamicTypeInfo``), so we
       # can safely use ``genCall``
       genCall(c, n)
+  of mAsgnDynlibVar:
+    c.buildMagicCall m, VoidType:
+      # note: the first operand may be a procedure symbol
+      c.emitByName ekReassign, genOperand(c, n[1])
+      arg n[2]
 
   # special macro related magics:
   of mExpandToAst:
@@ -2132,36 +2137,6 @@ proc generateAssignment*(graph: ModuleGraph, env: var MirEnv,
   swapState()
   env = move c.env # move back
 
-proc generateCode*(graph: ModuleGraph, env: var MirEnv,
-                   config: TranslationConfig, n: PNode,
-                   builder: var MirBuilder, source: var SourceMap) =
-  ## Generates MIR code that is semantically equivalent to the expression or
-  ## statement `n`, appending the resulting code and the corresponding origin
-  ## information to `code` and `source`, respectively.
-  var c = TCtx(context: skUnknown, graph: graph, config: config, env: move env)
-  c.scopeDepth = 2 # assume that this is not top-level code
-
-  template swapState() =
-    swap(c.sp.map, source)
-    swap(c.builder, builder)
-
-  # for the duration of ``generateCode`` we move the state into ``TCtx``
-  swapState()
-
-  if n.typ.isEmptyType:
-    withFront c.builder:
-      gen(c, n)
-  else:
-    c.builder.useSource(c.sp, n)
-    # XXX: restructure the ``mirgen`` API to use a dedicated procedure for
-    #      generating expression code
-    let v = genUse(c, n)
-    c.use v
-
-  # move the state back into the output parameters:
-  swapState()
-  env = move c.env
-
 proc addParams(c: var TCtx, prc: PSym, signature: PType) =
   ## Translates the result variable and the parameters (taken from `signature`)
   ## to their MIR representation and adds them to the list of locals.

From 4c31272a1e77a361c0a4d911835462823ff708b4 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Mon, 20 May 2024 01:53:43 +0200
Subject: [PATCH 095/169] fix(js): compiler crash with globals (#1314)

## Summary

Fix a compiler crash that happened when having globals with type
`array[N, T]`, where `N` is greater than 32 and `T` is a non-primitive
type. Only the JavaScript backend was affected.

## Details

Defer adding the `arrayConstr` compilerproc to the MIR environment if
not within a proper procedure context. This prevents modifications of
the MIR environment from within `defineGlobal` (which calls
`createVar`), which is what caused the assertion in `backends.flush` to
fail.

Registration is deferred until the procedure is code generated, which
works due to discovery of a global currently being guaranteed to
precede code generation of some procedure.
---
 compiler/backend/jsgen.nim      | 18 +++++++++++++++---
 lib/system/jssys.nim            |  2 +-
 tests/js/tlarge_array_crash.nim |  9 +++++++++
 3 files changed, 25 insertions(+), 4 deletions(-)
 create mode 100644 tests/js/tlarge_array_crash.nim

diff --git a/compiler/backend/jsgen.nim b/compiler/backend/jsgen.nim
index cecdc04eb8a..ad6497fb984 100644
--- a/compiler/backend/jsgen.nim
+++ b/compiler/backend/jsgen.nim
@@ -114,6 +114,8 @@ type
     typeInfoGenerated: IntSet
     dataGenerated: IntSet
     unique: int    # for temp identifier generation
+    requestArrayConstr: bool
+      ## used for deferring registration of the ``arrayConstr`` proc
 
     names: Table[int, string]
       ## maps a symbol IDs to the symbol's JavaScript name
@@ -1456,9 +1458,12 @@ proc createVar(p: PProc, typ: PType, indirect: bool): Rope =
     if jsTyp.len > 0:
       result = "new $1($2)" % [rope(jsTyp), rope(length)]
     elif length > 32:
-      useMagic(p, "arrayConstr")
-      # XXX: arrayConstr depends on nimCopy. This line shouldn't be necessary.
-      useMagic(p, "nimCopy")
+      if p.prc.isNil:
+        # we're called in a context where registering a new procedure could be
+        # disallowed, so the magic cannot be directly marked as used
+        p.g.requestArrayConstr = true
+      else:
+        useMagic(p, "arrayConstr")
       result = "arrayConstr($1, $2, $3)" % [rope(length),
           createVar(p, e, false), genTypeInfo(p, e)]
     else:
@@ -2378,8 +2383,14 @@ proc genStmts(p: PProc, stmts: openArray[CgNode]) =
   # too, hence -1 as the start
   gen(p, desc, stmts, -1)
 
+proc handleRequestArrayConstr(g: PGlobals, graph: ModuleGraph) =
+  if g.requestArrayConstr:
+    discard g.env.procedures.add(graph.getCompilerProc("arrayConstr"))
+    g.requestArrayConstr = false
+
 proc genProc*(g: PGlobals, module: BModule, id: ProcedureId,
               body: sink Body): Rope =
+  handleRequestArrayConstr(g, module.graph)
   var p = startProc(g, module, id, body)
   p.nested: genStmts(p, p.fullBody.code.kids)
   result = finishProc(p)
@@ -2388,6 +2399,7 @@ proc genPartial*(p: PProc, n: CgNode) =
   ## Generates the JavaScript code for `n` and appends the result to `p`. This
   ## is intended for CG IR that wasn't already available when calling
   ## `startProc`.
+  handleRequestArrayConstr(p.g, p.module.graph)
   synchronize(p.locals, p.fullBody.locals)
   analyseIfAddressTaken(p.fullBody.code, p.addrTaken)
   genStmts(p, n.kids)
diff --git a/lib/system/jssys.nim b/lib/system/jssys.nim
index 363d20a976a..e04705eda48 100644
--- a/lib/system/jssys.nim
+++ b/lib/system/jssys.nim
@@ -696,7 +696,7 @@ proc arrayConstr(len: int, value: JSRef, typ: PNimType): JSRef {.
   # types are fake
   asm """
     var result = new Array(`len`);
-    for (var i = 0; i < `len`; ++i) result[i] = nimCopy(null, `value`, `typ`);
+    for (var i = 0; i < `len`; ++i) result[i] = `nimCopy`(null, `value`, `typ`);
     return result;
   """
 
diff --git a/tests/js/tlarge_array_crash.nim b/tests/js/tlarge_array_crash.nim
new file mode 100644
index 00000000000..cb2c4356aba
--- /dev/null
+++ b/tests/js/tlarge_array_crash.nim
@@ -0,0 +1,9 @@
+discard """
+  description: '''
+    Regression test for a compiler crash caused by the JavaScript code
+    generator
+  '''
+"""
+
+# every array length > 32 caused the crash
+var global: array[33, (int, int)]

From 5a3e8fa53775cddb1a00b155f5be42a7d37d59e2 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Mon, 20 May 2024 17:10:38 +0200
Subject: [PATCH 096/169] fix(js): slow code generation (#1313)

## Summary

Replace an algorithm - used by the JavaScript code generator -
potentially taking an exponential amount of time with one taking
linear time. In some edge cases, the previous algorithm was so slow
that the compiler would effectively get stuck.

## Details

`jsflow` is responsible for translating the goto-based control-flow of
the CGIR into JavaScript control-flow (`break`, `try`, etc.). This
requires reordering the initial list of block starts (openings) and
ends such that all openings are paired with their corresponding end.

### Previous Algorithm

The algorithm used for reordering the list works by:
1. start with the last slot in the list
2. shift the block/try opening in the slot backwards (towards the
   start) until it is on the same nesting depth as its corresponding
   end
3. repeat 2 until a fixpoint is reached (the item in the slot no longer
   requires shifting)
4. repeat the previous two steps with the previous slot

Consider the following (where `n` is a value >= 2):
```
block { // 0
  block { // n
    ... // (n - 2) .. 1
    block { // n - 1
    } // 0
  } // 1
  ...
} // n
```

In the situation shown above, reaching a fixpoint for the slot
originally containing the `n - 1` block requires `3 * (2 ^ (n - 2))`
iterations/shifts (exponential time).

For large `n` (> 30), the time spent on sorting grew so large that the
compiler would appear to be effectively stuck.

### New Algorithm

The new algorithm requires `n` shifts in the worst case,
where `n` is the number of labels in the input CGIR.

It works by first computing an order value for every label, based on
the position of the label. The relevant openings (block and try) are
then reordered such that they're only enclosed by openings with a
higher order value.
---
 compiler/backend/jsflow.nim | 145 +++++++++++++++++++++---------------
 1 file changed, 85 insertions(+), 60 deletions(-)

diff --git a/compiler/backend/jsflow.nim b/compiler/backend/jsflow.nim
index 4e2ec3d1d60..bdb6544b412 100644
--- a/compiler/backend/jsflow.nim
+++ b/compiler/backend/jsflow.nim
@@ -59,6 +59,15 @@ type
 const
   Terminators = {stkReturn, stkTerminator}
 
+proc rotateRight[T](s: var seq[T], a, b: int) =
+  ## Rotates the items in slice a..b to the right by one element.
+  let backup = s[b]
+  var i = b
+  while i > a:
+    s[i] = s[i - 1]
+    dec i
+  s[a] = backup
+
 func finalTarget*(n: CgNode): CgNode =
   ## Given a label or target list, retrieves the target.
   case n.kind
@@ -143,6 +152,79 @@ func endsInTerminator(structs: seq[Structure], start: int): bool =
 
   result = false # doesn't end in a terminator
 
+proc sort(structs: var seq[Structure]) =
+  ## Reorders the openings in `structs` such that each opening is paired with
+  ## its corresponding end. Pre-conditions:
+  ## * all ends have the correct relative order to each other
+  ## * if a block encloses a ``stkStructStart``, the end of the block is not
+  ##   enclosed by the ``stkStructStart``
+  var
+    order: seq[int] # indexed by LabelId
+    orderVal = 0
+
+  # associate a unique "order" value with each label. We need it to establish a
+  # correct ordering between parent and child openings
+  for i, it in structs.pairs:
+    if it.kind == stkEnd:
+      let idx = it.label.int
+      if idx >= order.len:
+        order.setLen(idx + 1)
+
+      order[idx] = orderVal
+      inc orderVal
+
+  var stack: seq[tuple[pos: int, order: int]]
+
+  # now we want to establish the following: for each parent/child opening, the
+  # parent has a *greater* order value than the child. Structure, catch, and
+  # finally openings must stay associated with their original statement -- they
+  # cannot move
+  for i in 0..<structs.len:
+    template invariant(): bool =
+      # the loop invariant
+      stack.len < 2 or stack[^2].order > stack[^1].order
+
+    let it = structs[i]
+    case it.kind
+    of stkTry, stkBlock:
+      stack.add (i, order[it.label.int])
+      if not invariant():
+        # restore the loop invariant by shifting the new item to the first
+        # position where the invariant holds again
+        var insert = stack.len - 2
+        while insert >= 0 and stack[insert].order < stack[^1].order:
+          dec insert
+        insert += 1
+
+        # attach the opening to the same statement as the opening we're placing
+        # it before:
+        structs[i].stmt = structs[stack[insert].pos].stmt
+        # shift the opening in the `structs` list and reflect the shift in the
+        # `stack`:
+        rotateRight(structs, stack[insert].pos, i)
+        rotateRight(stack, insert, stack.high)
+
+        # we've moved some items in the `structs` list, and the affected stack
+        # items need to reflect that
+        stack[insert].pos = stack[insert + 1].pos
+        for x in (insert + 1) ..< stack.len:
+          inc stack[x].pos
+
+    of stkStructStart:
+      stack.add (i, order[it.label.int])
+    of stkFinally, stkCatch:
+      # keep the 'try'-opening on the stack
+      assert stack[^1].order == order[it.label.int]
+    of stkEnd:
+      # if the pre-conditions hold, the end corresponds to the opening at the
+      # stack head -- pop the block
+      let e = stack.pop()
+      assert e.order == order[it.label.int]
+    of stkTerminator, stkReturn:
+      discard
+
+    assert invariant()
+
 proc toStructureList*(stmts: openArray[CgNode]): StructDesc =
   ## Creates and returns the JavaScript control-flow-construct-focused
   ## representation for `stmts`.
@@ -226,66 +308,9 @@ proc toStructureList*(stmts: openArray[CgNode]): StructDesc =
     else:
       discard "not relevant"
 
-  # the list of openings and closing produced by the first pass will in most
-  # cases not be valid JavaScript code. We have to "solve" the representation
-  # by reordering the openings until they're matched with their corresponding
-  # end. ``stkCatch``, ``stkFinally``, ``stkStructStart``, and ``stkEnd`` must
-  # keep their relative order and stay attached to the same statements, only
-  # ``stkTry`` and ``stkBlock`` can be moved, but only backwards
-  var i = structs.high
-  while i > 0:
-    if structs[i].kind in {stkTry, stkBlock}:
-      # compute the difference in nesting between the try/block and its
-      # corresponding end:
-      var
-        depth = 1
-        j = i
-      while true:
-        inc j
-        case structs[j].kind
-        of stkTry, stkBlock, stkStructStart:
-          inc depth
-        of stkFinally, stkCatch:
-          if structs[j].label == structs[i].label:
-            dec depth
-            break
-        of stkEnd:
-          dec depth
-          if structs[j].label == structs[i].label:
-            break
-        of Terminators:
-          discard "not relevant"
-
-      # depth < 0 means that the try/block start is more nested than its end.
-      # In other words, the try or block start is currently too nested. Move
-      # it backwards (i.e., associate it with an earlier statement) until it's
-      # at the same level as its end
-      let moved = depth < 0
-      var x = i
-      while depth < 0:
-        # change the associated statement...
-        structs[x].stmt = structs[x - 1].stmt
-        # ... then swap
-        swap(structs[x], structs[x - 1])
-
-        case structs[x].kind
-        of stkEnd:
-          dec depth
-        of stkBlock, stkTry, stkStructStart:
-          inc depth
-        of Terminators, stkCatch, stkFinally:
-          # catch and finally don't change the nesting (the try's body is at
-          # the same level as catch/finally's body)
-          discard
-
-        dec x
-
-      if moved:
-        # a different item than before is in the slot now; it needs to be
-        # processed too
-        continue # skip the following decrement
-
-    dec i
+  # now make sure that all openings in the list are matched with their
+  # respective end
+  sort(structs)
 
   # note: changing what statements a 'try' encloses can alter semantics! That's
   # none of our concern here, however: the code generator is reponsible for

From e400093ea204e14932821e09850c437c9c189e3f Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Tue, 21 May 2024 19:12:12 +0000
Subject: [PATCH 097/169] build(deps): Bump
 JamesIves/github-pages-deploy-action from 4.6.0 to 4.6.1 (#1315)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bumps

[JamesIves/github-pages-deploy-action](https://github.com/jamesives/github-pages-deploy-action)
from 4.6.0 to 4.6.1.
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a

href="https://github.com/jamesives/github-pages-deploy-action/releases">JamesIves/github-pages-deploy-action's
releases</a>.</em></p>
<blockquote>
<h2>v4.6.1</h2>
<h2>What's Changed</h2>
<h3>Fixes</h3>
<ul>
<li>Resolved an issue where workflows were suddenly failing due to a
worktree in use error. The action will now attempt to create a temp
branch name if the existing branch name is already checked out by a
prior to step to ensure it can occur. This issue was only occurring in a
handful of workflows, and likely stemmed from a git version change on
the official GitHub runners. The actual root cause is still somewhat
unknown.</li>
</ul>
<h3>Dependencies</h3>
<ul>
<li>build(deps-dev): bump eslint-plugin-jest from 28.2.0 to 28.5.0 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1577">JamesIves/github-pages-deploy-action#1577</a></li>
<li>build(deps): bump <code>@​eslint/js</code> from 9.0.0 to 9.2.0 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1576">JamesIves/github-pages-deploy-action#1576</a></li>
<li>build(deps-dev): bump eslint from 9.0.0 to 9.2.0 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1575">JamesIves/github-pages-deploy-action#1575</a></li>
<li>build(deps): bump typescript-eslint from 7.7.0 to 7.8.0 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1569">JamesIves/github-pages-deploy-action#1569</a></li>
<li>build(deps-dev): bump <code>@​types/node</code> from 20.12.7 to
20.12.9 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1578">JamesIves/github-pages-deploy-action#1578</a></li>
<li>build(deps-dev): bump <code>@​types/node</code> from 20.12.9 to
20.12.10 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1579">JamesIves/github-pages-deploy-action#1579</a></li>
<li>build(deps-dev): bump rimraf from 5.0.5 to 5.0.7 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1583">JamesIves/github-pages-deploy-action#1583</a></li>
<li>build(deps): bump codecov/codecov-action from 4.3.0 to 4.4.0 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1588">JamesIves/github-pages-deploy-action#1588</a></li>
<li>build(deps): bump typescript-eslint from 7.8.0 to 7.9.0 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1586">JamesIves/github-pages-deploy-action#1586</a></li>
<li>build(deps): bump the eslint group with 3 updates by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1592">JamesIves/github-pages-deploy-action#1592</a></li>
<li>build(deps-dev): bump the misc group with 2 updates by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/JamesIves/github-pages-deploy-action/pull/1593">JamesIves/github-pages-deploy-action#1593</a></li>
</ul>
<p><strong>Full Changelog</strong>: <a

href="https://github.com/JamesIves/github-pages-deploy-action/compare/v4...v4.6.1">https://github.com/JamesIves/github-pages-deploy-action/compare/v4...v4.6.1</a></p>
</blockquote>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a

href="https://github.com/JamesIves/github-pages-deploy-action/commit/5c6e9e9f3672ce8fd37b9856193d2a537941e66c"><code>5c6e9e9</code></a>
Deploy Production Code for Commit
e9abb9ce6e35175032a1e82dd997ac600ad10c9b 🚀</li>
<li><a

href="https://github.com/JamesIves/github-pages-deploy-action/commit/e9abb9ce6e35175032a1e82dd997ac600ad10c9b"><code>e9abb9c</code></a>
Merge branch 'dev' into releases/v4</li>
<li><a

href="https://github.com/JamesIves/github-pages-deploy-action/commit/079c29cbbe91fe1b06f83be57ad53e8a0d3c8c38"><code>079c29c</code></a>
build(deps-dev): bump the misc group with 2 updates (<a

href="https://redirect.github.com/jamesives/github-pages-deploy-action/issues/1593">#1593</a>)</li>
<li><a

href="https://github.com/JamesIves/github-pages-deploy-action/commit/e0e9b96aa6f01a03b77ee464c4f301e7487a62ab"><code>e0e9b96</code></a>
build(deps): bump the eslint group with 3 updates (<a

href="https://redirect.github.com/jamesives/github-pages-deploy-action/issues/1592">#1592</a>)</li>
<li><a

href="https://github.com/JamesIves/github-pages-deploy-action/commit/dfda8148a1c8cf43d97aa3421867d44c372d0cd3"><code>dfda814</code></a>
Merge branch 'dev' of <a

href="https://github.com/JamesIves/github-pages-deploy-action">https://github.com/JamesIves/github-pages-deploy-action</a>...</li>
<li><a

href="https://github.com/JamesIves/github-pages-deploy-action/commit/c2821857f23a224815824e852567e7a60e985d52"><code>c282185</code></a>
chore: update dependabot groups</li>
<li><a

href="https://github.com/JamesIves/github-pages-deploy-action/commit/91fd6eeeda825848072ae08203639c55c255eec6"><code>91fd6ee</code></a>
fix: :bug: Use commish to make branch unique (<a

href="https://redirect.github.com/jamesives/github-pages-deploy-action/issues/1591">#1591</a>)</li>
<li><a

href="https://github.com/JamesIves/github-pages-deploy-action/commit/5bb052c41a7c97d60f4147c7fae34725b9e8abbe"><code>5bb052c</code></a>
build(deps): bump typescript-eslint from 7.8.0 to 7.9.0 (<a

href="https://redirect.github.com/jamesives/github-pages-deploy-action/issues/1586">#1586</a>)</li>
<li><a

href="https://github.com/JamesIves/github-pages-deploy-action/commit/ef33bcd4947b3e43b815809dedf0f4e19c4257fb"><code>ef33bcd</code></a>
build(deps): bump codecov/codecov-action from 4.3.0 to 4.4.0 (<a

href="https://redirect.github.com/jamesives/github-pages-deploy-action/issues/1588">#1588</a>)</li>
<li><a

href="https://github.com/JamesIves/github-pages-deploy-action/commit/1a64cb8ec57c97ea1608e5fd6689d7efec6adaa2"><code>1a64cb8</code></a>
build(deps-dev): bump rimraf from 5.0.5 to 5.0.7 (<a

href="https://redirect.github.com/jamesives/github-pages-deploy-action/issues/1583">#1583</a>)</li>
<li>Additional commits viewable in <a

href="https://github.com/jamesives/github-pages-deploy-action/compare/v4.6.0...v4.6.1">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility

score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=JamesIves/github-pages-deploy-action&package-manager=github_actions&previous-version=4.6.0&new-version=4.6.1)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase` .

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 .github/workflows/publisher.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/publisher.yml b/.github/workflows/publisher.yml
index 5398dfb6e39..625cb2aa20a 100644
--- a/.github/workflows/publisher.yml
+++ b/.github/workflows/publisher.yml
@@ -71,7 +71,7 @@ jobs:
           path: release-staging
 
       - name: Publish docs
-        uses: JamesIves/github-pages-deploy-action@v4.6.0
+        uses: JamesIves/github-pages-deploy-action@v4.6.1
         with:
           branch: gh-pages
           folder: doc/html

From 5abb1acf846b7516e63d3f941045c168bc09292a Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Thu, 23 May 2024 03:00:49 +0200
Subject: [PATCH 098/169] fix csource compilation with many modules (#1320)

## Summary

Make building the csource compiler on Windows via the `build.bat` batch
script work when the link command length exceeds the maximum command
line length due to a large number of object files.

## Details

On Windows, everything beyond 8192 characters is cut off from the
command-line arguments, leading to not all arguments reaching the
linker.

Instead of directly appending the object file paths to the link
command, `build.bat` now writes the paths to the temporary
"linker_args.rsp" file, which is then passed to gcc as a "response
file".

For simplicity, this is done even when the command-line would not
exceed the maximum length.
---
 tools/niminst/buildbat.nimf | 17 +++++++++--------
 1 file changed, 9 insertions(+), 8 deletions(-)

diff --git a/tools/niminst/buildbat.nimf b/tools/niminst/buildbat.nimf
index f9577147d5f..0e1c78ad383 100644
--- a/tools/niminst/buildbat.nimf
+++ b/tools/niminst/buildbat.nimf
@@ -6,6 +6,7 @@ SET LINKER=gcc
 SET COMP_FLAGS=?{c.ccompiler.flags}
 SET LINK_FLAGS=?{c.linker.flags}
 SET BIN_DIR=?{firstBinPath(c).toWin}
+SET RSP_FILE=linker_args.rsp
 
 REM Detect gcc arch
 IF DEFINED ARCH (
@@ -21,43 +22,43 @@ ECHO Building with %ARCH% bit %CC%
 
 if NOT EXIST %BIN_DIR%\nul mkdir %BIN_DIR%
 
+if EXIST %RSP_FILE% rm %RSP_FILE%
+
 REM call the compiler:
 
 IF %ARCH% EQU 32 (
 
 #  block win32:
-#    var linkCmd = ""
 #    if cpuIndex32 != -1:
 #      for ff in items(c.cfiles[winIndex][cpuIndex32]):
 #        let f = ff.toWin
   ECHO %CC% %COMP_FLAGS% -Ic_code -c ?{f} -o ?{changeFileExt(f, "o")}
   CALL %CC% %COMP_FLAGS% -Ic_code -c ?{f} -o ?{changeFileExt(f, "o")}
-#        linkCmd.add(" " & changeFileExt(f, "o"))
+  ECHO ?{replace(changeFileExt(f, "o"), "\\", "/")} >> %RSP_FILE%
   IF ERRORLEVEL 1 (GOTO:END)
 #      end for
 #    end if
 
-  ECHO %LINKER% -o ?{"%BIN_DIR%"\toLowerAscii(c.name)}.exe ?linkCmd %LINK_FLAGS%
-  CALL %LINKER% -o ?{"%BIN_DIR%"\toLowerAscii(c.name)}.exe ?linkCmd %LINK_FLAGS%
+  ECHO %LINKER% -o ?{"%BIN_DIR%"\toLowerAscii(c.name)}.exe @%RSP_FILE% %LINK_FLAGS%
+  CALL %LINKER% -o ?{"%BIN_DIR%"\toLowerAscii(c.name)}.exe @%RSP_FILE% %LINK_FLAGS%
 
 #  end block
 
 ) ELSE IF %ARCH% EQU 64 (
 
 #  block win64:
-#    var linkCmd = ""
 #    if cpuIndex64 != -1:
 #      for ff in items(c.cfiles[winIndex][cpuIndex64]):
 #        let f = ff.toWin
   ECHO %CC% %COMP_FLAGS% -Ic_code -c ?{f} -o ?{changeFileExt(f, "o")}
   CALL %CC% %COMP_FLAGS% -Ic_code -c ?{f} -o ?{changeFileExt(f, "o")}
-#        linkCmd.add(" " & changeFileExt(f, "o"))
+  ECHO ?{replace(changeFileExt(f, "o"), "\\", "/")} >> %RSP_FILE%
   IF ERRORLEVEL 1 (GOTO:END)
 #      end for
 #    end if
 
-  ECHO %LINKER% -o ?{"%BIN_DIR%"\toLowerAscii(c.name)}.exe ?linkCmd %LINK_FLAGS%
-  CALL %LINKER% -o ?{"%BIN_DIR%"\toLowerAscii(c.name)}.exe ?linkCmd %LINK_FLAGS%
+  ECHO %LINKER% -o ?{"%BIN_DIR%"\toLowerAscii(c.name)}.exe @%RSP_FILE% %LINK_FLAGS%
+  CALL %LINKER% -o ?{"%BIN_DIR%"\toLowerAscii(c.name)}.exe @%RSP_FILE% %LINK_FLAGS%
 
 #  end block
 )

From f5147bb02285ffc116cf3cfdf5c7b6141d42a8b6 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sat, 25 May 2024 01:05:51 +0200
Subject: [PATCH 099/169] fix(sem): crash with `void` fields in instantiated
 tuple types (#1319)

## Summary

Handle removal of `void` fields from tuple types properly when
instantiating generic types, fixing various compiler crashes.

Fixes https://github.com/nim-works/nimskull/issues/1316.

## Details

The problem was that `void` fields weren't removed from the type, unlike
what happens for `tyObject` and `tyProc` types. Therefore:
* `tyVoid` types unexpectedly reached the code generators as part of
  records
* `computeSizeAlign` crashed because it expects the `nkRecList` of a
  `tyTuple` to only contain `nkSym` nodes, but `replaceTypeVarsN`
  replaced the `nkSym` node for `void` fields with empty `nkRecList`
  nodes earlier

In order to remove the `void` fields properly:
* custom logic is used for the tuple's record AST, which - compared to
  `replaceTypeVarsN` - also updates the fields' position
* the type and record slots of void are removed with a generalized
  version of `eraseVoidParams` (`eraseVoidTypes`)

Finally, the `propagateFieldFlags` call for tuple types is removed. It
is redundant, since the type flags are already propagated when the
type variables are replaced.
---
 compiler/sem/semtypinst.nim                   | 62 ++++++++++-------
 .../tgeneric_tuple_with_void_param.nim        | 67 +++++++++++++++++++
 2 files changed, 103 insertions(+), 26 deletions(-)
 create mode 100644 tests/lang_callable/generics/tgeneric_tuple_with_void_param.nim

diff --git a/compiler/sem/semtypinst.nim b/compiler/sem/semtypinst.nim
index 7e90a126ff7..f27329caf1c 100644
--- a/compiler/sem/semtypinst.nim
+++ b/compiler/sem/semtypinst.nim
@@ -658,25 +658,32 @@ proc handleGenericInvocation(cl: var TReplTypeVars, t: PType): PType =
           attachedAsgn, col)
       excl mm.flags, tfFromGeneric
 
-proc eraseVoidParams*(t: PType) =
-  # transform '(): void' into '()' because old parts of the compiler really
-  # don't deal with '(): void':
-  if t[0] != nil and t[0].kind == tyVoid:
-    t[0] = nil
-
-  for i in 1..<t.len:
+proc eraseVoidTypes(t: PType; start = 0) =
+  ## Removes all ``tyVoid`` items from `t`. If `t` has attached AST, the slots
+  ## corresponding to the type items are removed too.
+  for i in start..<t.len:
     # don't touch any memory unless necessary
     if t[i].kind == tyVoid:
       var pos = i
       for j in i+1..<t.len:
         if t[j].kind != tyVoid:
           t[pos] = t[j]
-          t.n[pos] = t.n[j]
+          if t.n != nil:
+            t.n[pos] = t.n[j]
           inc pos
       setLen t.sons, pos
-      setLen t.n.sons, pos
+      if t.n != nil:
+        setLen t.n.sons, pos
       break
 
+proc eraseVoidParams*(t: PType) =
+  # transform '(): void' into '()' because old parts of the compiler really
+  # don't deal with '(): void':
+  if t[0] != nil and t[0].kind == tyVoid:
+    t[0] = nil
+
+  eraseVoidTypes(t, start=1)
+
 proc skipIntLiteralParams*(t: PType; idgen: IdGenerator) =
   for i in 0..<t.len:
     let p = t[i]
@@ -691,20 +698,6 @@ proc skipIntLiteralParams*(t: PType; idgen: IdGenerator) =
   if t[0] != nil and t[0].kind == tyStatic:
     t[0] = t[0].base
 
-proc propagateFieldFlags(t: PType, n: PNode) =
-  # This is meant for objects and tuples
-  # The type must be fully instantiated!
-  if n.isNil:
-    return
-  #internalAssert n.kind != nkRecWhen
-  case n.kind
-  of nkSym:
-    propagateToOwner(t, n.sym.typ)
-  of nkRecList, nkRecCase, nkOfBranch, nkElse:
-    for son in n:
-      propagateFieldFlags(t, son)
-  else: discard
-
 proc replaceTypeVarsTAux(cl: var TReplTypeVars, t: PType): PType =
   template bailout =
     if cl.recursionLimit > 100:
@@ -800,21 +793,38 @@ proc replaceTypeVarsTAux(cl: var TReplTypeVars, t: PType): PType =
           result[i] = r
           if result.kind != tyArray or i != 0:
             propagateToOwner(result, r)
-      # bug #4677: Do not instantiate effect lists
-      result.n = replaceTypeVarsN(cl, result.n, ord(result.kind==tyProc))
       case result.kind
       of tyArray:
         let idx = result[0]
         internalAssert(cl.c.config, idx.kind != tyStatic, "[FIXME]")
 
       of tyTuple:
-        propagateFieldFlags(result, result.n)
+        if result.n != nil:
+          # update the record description
+          result.n = shallowCopy(t.n)
+          var pos = 0
+          for i, it in t.n.pairs:
+            # don't copy void fields, they're removed afterwards
+            if result[i].kind != tyVoid:
+              # always copy the symbol to make sure we can modify it
+              let s = copySym(it.sym, nextSymId cl.c.idgen)
+              s.typ = result[i]
+              incl(s.flags, sfFromGeneric)
+              s.position = pos
+              inc pos
+              result.n[i] = newSymNode(s, it.info)
+
+        # now erase the void types, which will also eliminate the empty slots
+        eraseVoidTypes(result)
 
       of tyProc:
+        # bug #4677: Do not instantiate effect lists
+        result.n = replaceTypeVarsN(cl, result.n, 1)
         eraseVoidParams(result)
         skipIntLiteralParams(result, cl.c.idgen)
 
       of tyRange:
+        result.n = replaceTypeVarsN(cl, result.n, 0)
         result[0] = result[0].skipTypes({tyStatic, tyDistinct})
 
       else: discard
diff --git a/tests/lang_callable/generics/tgeneric_tuple_with_void_param.nim b/tests/lang_callable/generics/tgeneric_tuple_with_void_param.nim
new file mode 100644
index 00000000000..fafb3ade853
--- /dev/null
+++ b/tests/lang_callable/generics/tgeneric_tuple_with_void_param.nim
@@ -0,0 +1,67 @@
+discard """
+  description: '''
+    Ensure that fields whose type is substituted with `void` are properly
+    removed from tuple types during instantiation
+  '''
+"""
+
+type
+  Anon[A, B, C] = (A, B, C)
+  Named[A, B, C] = tuple[a: A, b: B, c: C]
+
+block trailing_field_is_void:
+  var x: Anon[int, string, void]
+  doAssert x is (int, string)
+  doAssert sizeof(x) == sizeof((int, string))
+  doAssert not compiles(x[2])
+  # make sure the fields are accessible:
+  x[0] = 1
+  x[1] = ""
+
+  # with generic named tuple:
+  var y: Named[int, string, void]
+  doAssert y is tuple[a: int, b: string]
+  doAssert sizeof(y) == sizeof((int, string))
+  doAssert not compiles(y.c)
+  # make sure the fields are accessible:
+  y.a = 1
+  y.b = ""
+
+block middle_field_is_void:
+  var x: Anon[int, void, string]
+  doAssert x is (int, string)
+  doAssert sizeof(x) == sizeof((int, string))
+  doAssert not compiles(x[2])
+  # make sure the fields are accessible:
+  x[0] = 1
+  x[1] = ""
+
+  # with generic named tuple:
+  var y: Named[int, void, string]
+  doAssert y is tuple[a: int, c: string]
+  doAssert sizeof(y) == sizeof((int, string))
+  doAssert not compiles(y.b)
+  y.a = 1
+  y.c = ""
+
+block all_fields_are_void:
+  var x: Anon[void, void, void]
+  doAssert sizeof(x) == 1
+  doAssert not compiles(x[0])
+
+  var y: Named[void, void, void]
+  doAssert sizeof(y) == 1
+  doAssert not compiles(y.a)
+
+block non_generic_field:
+  type Tup[T] = tuple[a: T, b: int]
+
+  # instantiate the type with a non-void parameter first
+  var x: Tup[string]
+  x.a = ""
+  x.b = 0
+
+  # instantiating the type with a void parameter must not affect previous
+  # instantiations (code generation would fail if it does)
+  var y: Tup[void]
+  y.b = 0

From afcd3c0aba3f670efb880f1cef0e12f998fcb1e7 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sat, 25 May 2024 23:18:47 +0200
Subject: [PATCH 100/169] mir: implement the new control-flow primitives
 (#1281)

## Summary

Replace the legacy control-flow primitives with the new ones outlined
in the documentation. This is a refactor for the most part, but - as a
side effect - a bug is fixed too, and destructors are no longer called
on not-yet-alive locations.

Fixes #1303.

## Details

The new control-flow primitives are those documented in the `mir.rst`
file -- the node kinds for the legacy ones are all removed. They're the
same as those used by the CGIR, removing the largest remaining
difference between the two IRs, preparing for the CGIR's removal.

In broad:
* translating the `try`/`block`/`break` control-flow to the goto-based
  control-flow now happens during AST -> MIR translation (`mirgen`)
  instead of during MIR -> CGIR translation (`cgirgen`)
* elimination of unreachable code now happens during AST -> MIR
  translation already
* all necessary destroy operations are injected during AST -> MIR
  translation
* the "destructor injection" pass now only collapses sink operations
  and eliminates destroy operations that turn out to be redundant

Adding new finally sections after the initial MIR production would
require patching all intercepted gotos and checked calls, which is
complex and hurts composition of the pass, hence this approach being
decided against.

### Multiple `finally`s Per Scope

Instead of using a single `finally` per scope (or none at all),
multiple ones are used, depending on the placement of unstructured
scope exits. As a consequence:
```nim
block:
  var x = Object()
  if cond:
    break # no longer invokes the destructor for `y`
  var y = Object() # destruction doesn't require a finally
```

This generally enables better code generation, since locals destroyed
in `finally` sections don't have to conservatively be zero'ed on scope
entry anymore.

### Other Changes

* the MIR pretty-printer (`mir/utils.nim`) is updated to render the new
  node kinds
* `transf` no longer wraps `while` loop bodies in a `block`, which was
  previously required for proper destruction of locals defined as part
  of the body
* `mirtrees.numArgs` now only returns the number of arguments in a call
  tree, not the number of child nodes
* repeated `pirMat`/`pirMatCursor` nodes are guarded against during
  PMIR production
* the `mnkDefUnpack` node kind is obsolete now that destroy operations
  are placed by `mirgen` -- it's removed

### Test Changes

* tests using now-removed MIR node kinds are changed to use different
  ones
* some assertions in now-working tests are updated
* the `--expandArc`-using tests are updated to the changes in MIR
  rendering
---
 compiler/backend/backends.nim                 |   2 +-
 compiler/backend/cgirgen.nim                  | 457 +++----------
 compiler/mir/analysis.nim                     | 120 +---
 compiler/mir/injecthooks.nim                  |   6 +-
 compiler/mir/mirchangesets.nim                |  11 +
 compiler/mir/mirconstr.nim                    |  28 +
 compiler/mir/mirgen.nim                       | 628 ++++++++++++------
 compiler/mir/mirgen_blocks.nim                | 297 +++++++++
 compiler/mir/mirpasses.nim                    |  19 +-
 compiler/mir/mirtrees.nim                     | 101 +--
 compiler/mir/proto_mir.nim                    |  30 +-
 compiler/mir/rtchecks.nim                     |  10 +-
 compiler/mir/utils.nim                        | 214 ++++--
 compiler/sem/injectdestructors.nim            | 256 ++-----
 compiler/sem/mirexec.nim                      | 395 +++++------
 compiler/sem/transf.nim                       |   9 +-
 doc/mir.rst                                   |  45 +-
 tests/arc/topt_cursor.nim                     |  76 ++-
 tests/arc/topt_no_cursor.nim                  | 294 ++++----
 tests/arc/topt_refcursors.nim                 |  72 +-
 tests/arc/topt_wasmoved_destroy_pairs.nim     | 148 +++--
 tests/compiler/tmir_exec.nim                  |  27 +-
 tests/compiler/tmir_trees.nim                 |   2 +-
 tests/compiler/ttreechangesets.nim            |   4 +-
 .../tdestruction_in_unreachable.nim           |   7 +-
 .../destructor/timplicit_move_bug.nim         |  37 ++
 tests/lang_objects/destructor/tv2_cast.nim    |  98 +--
 tests/misc/tdont_fold_procedure_cast.nim      |   2 +-
 28 files changed, 1696 insertions(+), 1699 deletions(-)
 create mode 100644 compiler/mir/mirgen_blocks.nim
 create mode 100644 tests/lang_objects/destructor/timplicit_move_bug.nim

diff --git a/compiler/backend/backends.nim b/compiler/backend/backends.nim
index 4e2d1ab070a..2893dd51e46 100644
--- a/compiler/backend/backends.nim
+++ b/compiler/backend/backends.nim
@@ -283,7 +283,7 @@ func isEmpty*(tree: MirTree): bool =
   ## Returns whether `tree` contains either no nodes or only nodes that have
   ## no meaning by themselves.
   for n in tree.items:
-    if n.kind notin {mnkScope, mnkStmtList, mnkEnd}:
+    if n.kind notin {mnkScope, mnkEnd}:
       return false
 
   result = true
diff --git a/compiler/backend/cgirgen.nim b/compiler/backend/cgirgen.nim
index 892e3d7ebe4..6256c31f910 100644
--- a/compiler/backend/cgirgen.nim
+++ b/compiler/backend/cgirgen.nim
@@ -43,16 +43,11 @@ import
   ]
 
 import std/options as std_options
-from std/sequtils import delete
 
 from compiler/ast/ast import newSym, newType, rawAddSon
 from compiler/sem/semdata import makeVarType
 
 type
-  NodeLabelPair = tuple
-    node: CgNode
-    target: LabelId
-
   TranslateCl = object
     graph: ModuleGraph
     idgen: IdGenerator
@@ -62,38 +57,16 @@ type
 
     owner: PSym
 
-    blocks: seq[tuple[input, actual: LabelId]]
-      ## the stack of enclosing blocks for the currently processed node
-
-    numLabels: int
-      ## incremented when a new label ID is allocated
-    exits: seq[NodeLabelPair]
-      ## non-exception goto-like statements that need patching when crossing
-      ## ``try``, ``finally``, or ``except`` boundaries
-    raiseExits: seq[NodeLabelPair]
-      ## similar to `exits`, but for exceptional control-flow statements/
-      ## nodes. The label doesn't matter, it's only there so that `raiseExits`
-      ## can be passed to the same procedures as `exits`
-    returnLabel: Option[LabelId]
-      ## the label to be placed after all other statements. A label is only
-      ## allocated if an ``mnkReturn`` appears somewhere in the MIR code
-    isActive: bool
-      ## whether translation of statements is enabled. Used to eliminate
-      ## unreachable code
-
     locals: Store[LocalId, Local]
       ## the list of all locals in the body, taken from the ``MirBody``.
       ## Only needed for updating the type for alias locals
 
-    # a 'def' in the MIR means that the the local starts to exists and that it
-    # is accessible in all connected basic blocks part of the enclosing
-    # ``mnkScope``. The ``CgNode`` IR doesn't use same notion of scope,
-    # so for now, all 'def's (without the initial values) within nested
-    # control-flow-related trees are moved to the start of the enclosing
-    # ``mnkScope``.
-    inUnscoped: bool
+    inUnscoped: int
       ## whether the currently proceesed statement/expression is part of an
-      ## unscoped control-flow context
+      ## unscoped control-flow context. Used to move definitions to the start
+      ## of the enclosing scope, which is currently required for temporaries
+      ## requiring destruction that are spawned as part of the right-hand
+      ## operand of ``and``/``or``
     defs: seq[CgNode]
       ## the stack of locals/globals for which the ``cnkDef``/assignemnt needs
       ## to be inserted later
@@ -103,12 +76,6 @@ type
     pos: uint32 ## the index of the currently pointed to node
     origin {.cursor.}: PNode ## the source node
 
-func delete[T](s: var seq[T], a, b: int) =
-  # XXX: this procedure is a workaround for ``sequtils.delete`` not handling
-  #      empty slices properly (an IndexDefect is erroneously raised)
-  if b > a:
-    sequtils.delete(s, a..(b-1))
-
 func newMagicNode(magic: TMagic, info: TLineInfo): CgNode =
   CgNode(kind: cnkMagic, info: info, magic: magic)
 
@@ -144,9 +111,6 @@ template hasNext(cr: TreeCursor, t: MirBody): bool =
 template `[]=`(x: CgNode, i: Natural, n: CgNode) =
   x.kids[i] = n
 
-template `[]=`(x: CgNode, i: BackwardsIndex, n: CgNode) =
-  x.kids[i] = n
-
 template add(x: CgNode, y: CgNode) =
   x.kids.add y
 
@@ -181,8 +145,8 @@ func newTypeNode(info: TLineInfo, typ: PType): CgNode =
 func newFieldNode(s: PSym; info = unknownLineInfo): CgNode =
   CgNode(kind: cnkField, info: info, typ: s.typ, field: s)
 
-func newLabelNode(blk: BlockId; info = unknownLineInfo): CgNode =
-  CgNode(kind: cnkLabel, info: info, label: blk)
+func newLabelNode(label: LabelId; info = unknownLineInfo): CgNode =
+  CgNode(kind: cnkLabel, info: info, label: BlockId(label))
 
 proc newExpr(kind: CgNodeKind, info: TLineInfo, typ: PType,
              kids: sink seq[CgNode]): CgNode =
@@ -226,9 +190,6 @@ proc genObjConv(n: CgNode, to: PType, info: TLineInfo): CgNode =
     if diff < 0: cnkObjUpConv else: cnkObjDownConv,
     info, to): n
 
-func disable(cl: var TranslateCl) {.inline.} =
-  cl.isActive = false
-
 # forward declarations:
 proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
               cr: var TreeCursor, stmts: var seq[CgNode])
@@ -387,6 +348,34 @@ proc valueToIr(tree: MirBody, cl: var TranslateCl,
   else:
     unreachable("not a value: " & $tree[cr].kind)
 
+proc labelToIr(tree: MirBody, cr: var TreeCursor): CgNode =
+  ## Translates a MIR label to a CGIR label.
+  assert tree[cr].kind == mnkLabel
+  newLabelNode(tree.get(cr).label)
+
+proc targetToIr(tree: MirBody, cr: var TreeCursor): CgNode =
+  ## Translates a MIR target list to its CGIR counterpart. Both share the same
+  ## structure, so the translation is straightforward.
+  proc actionToIr(tree: MirBody, n: MirNode, info: TLineInfo): CgNode =
+    case n.kind
+    of mnkLabel:  newLabelNode(n.label)
+    of mnkLeave:  newTree(cnkLeave, info, newLabelNode(n.label))
+    of mnkResume: CgNode(kind: cnkResume, info: info)
+    else:
+      unreachable(n.kind)
+
+  let n {.cursor.} = tree.get(cr)
+  case n.kind
+  of mnkLabel:
+    result = actionToIr(tree, n, cr.info)
+  of mnkTargetList:
+    result = newTree(cnkTargetList, cr.info)
+    while tree[cr].kind != mnkEnd:
+      result.add actionToIr(tree, tree.get(cr), cr.info)
+    leave(tree, cr)
+  else:
+    unreachable(n.kind)
+
 proc argToIr(tree: MirBody, cl: var TranslateCl,
              cr: var TreeCursor): (bool, CgNode) =
   ## Translates a MIR argument tree to the corresponding CG IR tree.
@@ -436,7 +425,7 @@ proc callToIr(tree: MirBody, cl: var TranslateCl, n: MirNode,
                result[0].magic in FakeVarParams
 
   # translate the arguments:
-  while tree[cr].kind != mnkEnd:
+  while tree[cr].kind in ArgumentNodes:
     var (mutable, arg) = argToIr(tree, cl, cr)
     if noAddr:
       if arg.typ.kind == tyVar:
@@ -448,6 +437,9 @@ proc callToIr(tree: MirBody, cl: var TranslateCl, n: MirNode,
 
     result.add arg
 
+  if n.kind == mnkCheckedCall:
+    result.add targetToIr(tree, cr)
+
   leave(tree, cr)
 
 proc exprToIr(tree: MirBody, cl: var TranslateCl, cr: var TreeCursor): CgNode
@@ -531,7 +523,7 @@ proc defToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
 
   case def.kind
   of cnkLocal:
-    if cl.inUnscoped and not isLet:
+    if cl.inUnscoped > 0 and not isLet:
       # add the local to the list of moved definitions and only emit
       # an assignment
       cl.defs.add copyTree(def)
@@ -552,14 +544,14 @@ proc defToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
         # known to us, not that it starts its lifetime here -> don't
         # initialize or move it
         result = arg
-      elif cl.inUnscoped:
+      elif cl.inUnscoped > 0:
         # move the default initialization to the start of the scope
         cl.defs.add def
         result = arg
       else:
         result = newStmt(cnkAsgn, info, [def, newDefaultCall(info, def.typ)])
     else:
-      if sfImportc notin env.globals[def.global].flags and cl.inUnscoped:
+      if sfImportc notin env.globals[def.global].flags and cl.inUnscoped > 0:
         # default intialization is required at the start of the scope
         cl.defs.add def
       result = newStmt(cnkAsgn, info, [def, arg])
@@ -568,151 +560,14 @@ proc defToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
   else:
     unreachable()
 
-proc bodyToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
-              cr: var TreeCursor, stmts: var seq[CgNode]) =
-  ## Generates the ``CgNode`` tree for the body of a construct that implies
-  ## some form of control-flow.
-  let prev = cl.inUnscoped
-  # assume the body is unscoped until stated otherwise
-  cl.inUnscoped = true
-  stmtToIr(tree, env, cl, cr, stmts)
-  cl.inUnscoped = prev
-
 proc caseToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl, n: MirNode,
-              cr: var TreeCursor, stmts: var seq[CgNode])
-
-func newLabel(cl: var TranslateCl): LabelId =
-  ## Allocates a new label ID and returns it.
-  result = LabelId(cl.numLabels)
-  inc cl.numLabels
-
-func getReturnLabel(cl: var TranslateCl): LabelId =
-  ## Returns the label that points to the end of the current procedure.
-  if cl.returnLabel.isSome:
-    result = cl.returnLabel.unsafeGet()
-  else:
-    # allocate a new label first
-    result = newLabel(cl)
-    cl.returnLabel = some result
-
-func node(lbl: LabelId): CgNode =
-  newLabelNode(BlockId(lbl))
-
-proc patch(stmt: CgNode, target: sink CgNode) =
-  ## Appends `target` to the goto-like statement `stmt`, always wrapping
-  ## `target` in a ``cnkTargetList`` if there's none yet.
-  if stmt[^1] == nil:
-    stmt[^1] = newTree(cnkTargetList, unknownLineInfo, target)
-  else:
-    # a target list already exists
-    stmt[^1].kids.add target
-
-proc patchSingle(stmt: CgNode, target: sink CgNode) =
-  ## Appends `target` to the goto-like statement `stmt`.
-  if stmt[^1] == nil:
-    stmt[^1] = target
-  else:
-    stmt[^1].kids.add target
-
-proc patch(x: seq[NodeLabelPair], start: int, exit: LabelId) =
-  for i in start..<x.len:
-    patch(x[i].node, node(exit))
-
-proc patchLeave(x: seq[NodeLabelPair], start: int, exit: LabelId) =
-  for i in start..<x.len:
-    patch(x[i].node, newTree(cnkLeave, x[i].node.info, node(exit)))
-
-proc patchResume(x: seq[NodeLabelPair], start: int) =
-  for i in start..<x.len:
-    patch(x[i].node, newNode(cnkResume, x[i].node.info))
-
-proc join(stmts: var seq[CgNode], cl: var TranslateCl, info: TLineInfo,
-          target: LabelId, required: bool) =
-  ## Emits a join statement with label `target`, enabling translation
-  ## again if it's disabled and an exit targetting `target` exists.
-  ## If `required` is false and a join statement was immediately emitted
-  ## prior, no new join statement is emitted.
-  var label = target
-
-  # if allowed and possible, coalesce a join with the previous one:
-  if not required and stmts.len > 0 and stmts[^1].kind == cnkJoinStmt:
-    label = stmts[^1][0].label.LabelId
-
-  var
-    i = 0
-    found = false
-  # search for exits targetting `target`, update them with the correct label,
-  # and then remove them from the list
-  while i < cl.exits.len:
-    if cl.exits[i][1] == target:
-      patchSingle(cl.exits[i][0], node(label))
-      cl.exits.del(i)
-      # remember that at least one exit was found:
-      found = true
-    else:
-      inc i
-
-  # emit the join, but only if no coalescing took place and the label is
-  # actually targeted:
-  if label == target and (found or required):
-    stmts.add newTree(cnkJoinStmt, info, node(label))
-
-  if found:
-    # code is alive if following a join that is targeted by an alive goto
-    cl.isActive = true
-
-template join(info: TLineInfo, lbl: LabelId; required = false) =
-  join(stmts, cl, info, lbl, required)
-
-template goto(kind: CgNodeKind, info: TLineInfo, target: LabelId) =
-  ## Emits a fixed goto-like statement targeting `target`.
-  stmts.add newStmt(kind, info, node(target))
-
-template exit(lbl: LabelId) =
-  ## Emits a goto statement and registers it with `lbl` as the target.
-  if cl.isActive:
-    let n = newStmt(cnkGotoStmt, unknownLineInfo, nil)
-    stmts.add n
-    cl.exits.add((n, lbl))
-    cl.disable()
-
-template guarded(lbl: LabelId, body: untyped) =
-  ## Updates all exits emitted as part of `body` with a leave instruction
-  ## targetting `lbl`.
-  let
-    raiseStart = cl.raiseExits.len
-    exitStart = cl.exits.len
-  body
-  patchLeave(cl.raiseExits, raiseStart, lbl)
-  patchLeave(cl.exits, exitStart, lbl)
+              cr: var TreeCursor): CgNode
 
 proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
               cr: var TreeCursor, stmts: var seq[CgNode]) =
-
-  # skip the statement if translation is disabled, but with a caveat. Consider
-  # the following MIR:
-  #   try:
-  #     return
-  #     def _1 = ...
-  #   finally:
-  #     =destroy(name _1)
-  #
-  # Although nonesense, this is currently both legal and possible MIR. If
-  # translation would be disabled beyond the ``return``, then the temporary
-  # wouldn't be registered. Therefore, translation is always enabled in unscoped
-  # contexts (such as the above)
-  # XXX: eliminating unreachable code needs to happen much earlier, either in
-  #      ``mirgen`` or ``transf``
-  if not cl.isActive and not cl.inUnscoped:
-    tree.skip(cr)
-    return
-
   let n {.cursor.} = tree.get(cr)
   let info = cr.info ## the source information of `n`
 
-  template body() =
-    bodyToIr(tree, env, cl, cr, stmts)
-
   template to(kind: CgNodeKind, args: varargs[untyped]) =
     let r = newStmt(kind, info, args)
     leave(tree, cr)
@@ -733,124 +588,36 @@ proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
       dst = lvalueToIr(tree, cl, cr)
       (src, useFast) = sourceExprToIr(tree, cl, cr)
     to (if useFast: cnkFastAsgn else: cnkAsgn), dst, src
-  of mnkRepeat:
-    let label = newLabel(cl)
-    stmts.add newTree(cnkLoopJoinStmt, info, node(label))
-    body()
-    stmts.add newStmt(cnkLoopStmt, info, node(label))
-    leave(tree, cr)
-  of mnkBlock:
-    cl.blocks.add (n.label, newLabel(cl))
-    body()
-    join info, cl.blocks.pop().actual
-    leave(tree, cr)
-  of mnkTry:
-    assert n.len <= 2
-    let
-      raiseExitStart = cl.raiseExits.len
-      exitStart      = cl.exits.len
-
-    body() # body of the try block
-    let target = newLabel(cl)
-    exit target # jump past the except and/or finally sections
-
-    for _ in 0..<n.len:
-      let it {.cursor.} = enter(tree, cr)
-
-      case it.kind
-      of mnkExcept:
-        # only translate the except section if it's actually entered
-        if raiseExitStart < cl.raiseExits.len:
-          var next = newLabel(cl)
-            ## the label of the next except branch
-          for i in raiseExitStart..<cl.raiseExits.len:
-            patchSingle(cl.raiseExits[i][0], node(next))
-
-          # translating the handler could add new exceptional exits, so pop
-          # the raise exits first
-          cl.raiseExits.setLen(raiseExitStart)
-
-          for bIdx in 0..<it.len:
-            let br {.cursor.} = enter(tree, cr)
-            assert br.kind == mnkBranch
-
-            let
-              this = next ## label of the current except branch
-              excpt = newTree(cnkExcept, cr.info, node(this))
-            for j in 0..<br.len:
-              excpt.add tbExceptItem(tree, cl, cr)
-
-            # no filters mean that this is a catch-all branch
-            if br.len > 0:
-              if bIdx == it.len-1:
-                # last branch in the handler block
-                excpt.add nil
-                cl.raiseExits.add (excpt, LabelId(0))
-              else:
-                # setup the label for the follow-up handler
-                next = newLabel(cl)
-                excpt.add node(next)
-
-            stmts.add excpt
-            guarded this:
-              cl.isActive = true # each branch starts as active
-              body() # body of the handler
-              exit target # jump to the after the try statement
-              stmts.add newStmt(cnkEnd, excpt.info, [node(this)])
-
-            leave(tree, cr)
-
-        else:
-          # skip all branches
-          for _ in 0..<it.len:
-            tree.skip(cr)
-      of mnkFinally:
-        # only translate the finally if it's actually entered
-        if raiseExitStart < cl.raiseExits.len or exitStart < cl.exits.len:
-          let label = newLabel(cl)
-          # add the finalizer as an intermediate target
-          patch(cl.raiseExits, raiseExitStart, label)
-          patch(cl.exits, exitStart, label)
-
-          # remember the states prior to translating the body:
-          let
-            raiseExitStart2 = cl.raiseExits.len
-            exitStart2 = cl.exits.len
-
-          stmts.add newStmt(cnkFinally, info, node(label))
-          guarded label:
-            cl.isActive = true
-            body()
-
-          if not cl.isActive:
-            # the finally section has no structured exit. Discard all
-            # intercepted exits; their final target is the finally
-            cl.raiseExits.delete(raiseExitStart, raiseExitStart2)
-            cl.exits.delete(exitStart, exitStart2)
-
-          stmts.add newStmt(cnkContinueStmt, info, node(label))
-        else:
-          tree.skip(cr) # skip the body
-
-      else:
-        unreachable(it.kind)
+  of mnkGoto:
+    to cnkGotoStmt, targetToIr(tree, cr)
+  of mnkLoop:
+    to cnkLoopStmt, targetToIr(tree, cr)
+  of mnkLoopJoin:
+    to cnkLoopJoinStmt, targetToIr(tree, cr)
+  of mnkJoin:
+    to cnkJoinStmt, labelToIr(tree, cr)
+  of mnkExcept:
+    let excpt = newTree(cnkExcept, info, labelToIr(tree, cr))
+    if n.len > 1:
+      # not a catch-all handler. Translate the filter items:
+      for j in 1..<n.len-1:
+        excpt.add tbExceptItem(tree, cl, cr)
+
+      # then the jump target of the next handler:
+      excpt.add targetToIr(tree, cr)
 
-      leave(tree, cr)
-
-    cl.disable()
-    # if structured control-flow exits the try statement, the join will enable
-    # translation again
-    join info, target
     leave(tree, cr)
-  of mnkBreak:
-    # find the stack index of the enclosing 'block' identified by the break's
-    # label
-    var idx = cl.blocks.high
-    while idx >= 0 and cl.blocks[idx].input != n.label:
-      dec idx
-    exit cl.blocks[idx].actual
-  of mnkReturn:
-    exit getReturnLabel(cl)
+    stmts.add excpt
+    # XXX: temporary workaround, refer to ``inUnscoped`` doc comment
+    inc cl.inUnscoped
+  of mnkFinally:
+    to cnkFinally, labelToIr(tree, cr)
+  of mnkContinue:
+    stmts.add newStmt(cnkContinueStmt, info, labelToIr(tree, cr))
+    # skip the candidate list, it's not relevant to code generation:
+    for _ in 1..<n.len:
+      tree.skip(cr)
+    leave(tree, cr)
   of mnkVoid:
     var res = exprToIr(tree, cl, cr)
     if res.typ.isEmptyType():
@@ -861,14 +628,13 @@ proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
     leave(tree, cr)
     stmts.add res
   of mnkIf:
-    let label = newLabel(cl)
-    stmts.add newStmt(cnkIfStmt, info, [valueToIr(tree, cl, cr), node(label)])
-    body()
-    stmts.add newStmt(cnkEnd, info, [node(label)])
-    # if control-flow reaches the ``if`` itself, it also reaches the code
-    # following the ``if``
-    cl.isActive = true
-    leave(tree, cr)
+    to cnkIfStmt, valueToIr(tree, cl, cr), labelToIr(tree, cr)
+    # XXX: temporary workaround, refer to ``inUnscoped`` doc comment
+    inc cl.inUnscoped
+  of mnkEndStruct:
+    # XXX: temporary workaround, refer to ``inUnscoped`` doc comment
+    dec cl.inUnscoped
+    to cnkEnd, labelToIr(tree, cr)
   of mnkRaise:
     # the operand can either be empty or an lvalue expression
     let
@@ -878,23 +644,17 @@ proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
         of mnkNone: newEmpty()
         else:       lvalueToIr(tree, cl, arg, cr)
 
-    res.add nil # reserve a slot for the label
-    cl.raiseExits.add (res, LabelId(0))
+    res.add targetToIr(tree, cr)
     stmts.add res
-    cl.disable()
     leave(tree, cr)
   of mnkCase:
-    caseToIr(tree, env, cl, n, cr, stmts)
+    stmts.add caseToIr(tree, env, cl, n, cr)
   of mnkAsm:
     toList cnkAsmStmt:
       res.add valueToIr(tree, cl, cr)
   of mnkEmit:
     toList cnkEmitStmt:
       res.add valueToIr(tree, cl, cr)
-  of mnkStmtList:
-    while tree[cr].kind != mnkEnd:
-      stmtToIr(tree, env, cl, cr, stmts)
-    leave(tree, cr)
   of mnkScope:
     scopeToIr(tree, env, cl, cr, stmts)
   of mnkDestroy:
@@ -918,43 +678,24 @@ proc setElementToIr(tree: MirBody, cl: var TranslateCl,
     unreachable()
 
 proc caseToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl, n: MirNode,
-              cr: var TreeCursor, stmts: var seq[CgNode]) =
+              cr: var TreeCursor): CgNode =
   assert n.kind == mnkCase
-  let
-    exit = newLabel(cl)
-    result = newStmt(cnkCaseStmt, cr.info, [valueToIr(tree, cl, cr)])
-  # whether the statement has a structured exit is computed manually
-  var doesExit = false
+  result = newStmt(cnkCaseStmt, cr.info, [valueToIr(tree, cl, cr)])
 
-  stmts.add result # add the case statement already
-  for j in 0..<n.len:
+  # translate the branches:
+  for _ in 1..<n.len:
     let br {.cursor.} = enter(tree, cr)
 
-    result.add newTree(cnkBranch, cr.info)
-    for x in 0..<br.len:
-      result[^1].add setElementToIr(tree, cl, cr)
-
-    let label = newLabel(cl)
-    result[^1].add node(label)
+    let branch = newTree(cnkBranch, cr.info)
+    for _ in 0..<br.len-1:
+      branch.add setElementToIr(tree, cl, cr)
 
-    # start each branch as active again:
-    cl.isActive = true
-
-    join cr.info, label, required=true
-    bodyToIr(tree, env, cl, cr, stmts)
-    if cl.isActive:
-      doesExit = true
-      goto cnkGotoStmt, result.info, exit
+    # the jump target is in the last slot:
+    branch.add labelToIr(tree, cr)
 
+    result.add branch
     leave(tree, cr)
 
-  if doesExit:
-    # we used manual gotos, so emission of a join statement has to be forced
-    join result.info, exit, required=true
-    cl.isActive = true
-  else:
-    cl.disable()
-
   leave(tree, cr)
 
 proc exprToIr(tree: MirBody, cl: var TranslateCl,
@@ -1016,13 +757,8 @@ proc exprToIr(tree: MirBody, cl: var TranslateCl,
     treeOp cnkObjConstr:
       let f = newFieldNode(lookupInType(typ, get(tree, cr).field))
       res.add newTree(cnkBinding, cr.info, [f, argToIr(tree, cl, cr)[1]])
-  of mnkCall:
+  of mnkCall, mnkCheckedCall:
     callToIr(tree, cl, n, cr)
-  of mnkCheckedCall:
-    let res = callToIr(tree, cl, n, cr)
-    res.kids.add nil # reserve the slot for the target
-    cl.raiseExits.add (res, LabelId(0))
-    res
   of UnaryOps:
     const Map = [mnkNeg: cnkNeg]
     treeOp Map[n.kind]:
@@ -1058,7 +794,7 @@ proc scopeToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
     start = stmts.len
 
   # a scope is entered, meaning that we're no longer in an unscoped context
-  cl.inUnscoped = false
+  cl.inUnscoped = 0
 
   # translate all statements:
   while cr.hasNext(tree) and tree[cr].kind != mnkEnd:
@@ -1083,13 +819,6 @@ proc tb(tree: MirBody, env: MirEnv, cl: var TranslateCl,
   var cr = TreeCursor(pos: start.uint32)
   var stmts: seq[CgNode]
   scopeToIr(tree, env, cl, cr, stmts)
-  if cl.raiseExits.len > 0:
-    # there's unhandled exceptional control-flow
-    patchResume(cl.raiseExits, 0)
-
-  # emit the join for the return label, if used
-  if cl.returnLabel.isSome:
-    join unknownLineInfo, cl.returnLabel.get()
 
   # XXX: the list of statements is still wrapped in a node for now, but
   #      this needs to change once all code generators use the new CGIR
@@ -1103,8 +832,6 @@ proc generateIR*(graph: ModuleGraph, idgen: IdGenerator, env: var MirEnv,
   ## using `idgen` to provide new IDs when creating symbols.
   var cl = TranslateCl(graph: graph, idgen: idgen, env: addr env,
                        owner: owner, locals: move body.locals)
-  # enable translation:
-  cl.isActive = true
 
   result = Body()
   result.code = tb(body, env, cl, NodePosition 0)
diff --git a/compiler/mir/analysis.nim b/compiler/mir/analysis.nim
index 977a07bd095..7cb97390dcd 100644
--- a/compiler/mir/analysis.nim
+++ b/compiler/mir/analysis.nim
@@ -18,35 +18,14 @@
 ## aforementioned relationship doesn't exist.
 
 import
-  std/[
-    packedsets,
-    tables
-  ],
-  compiler/ast/[
-    ast_types,
-    ast_query
-  ],
   compiler/mir/[
     mirtrees
   ],
   compiler/sem/[
     aliasanalysis,
     mirexec,
-  ],
-  compiler/utils/[
-    containers
   ]
 
-type
-  AliveState = enum
-    unchanged
-    dead
-    alive
-
-  ComputeAliveProc[T] =
-    proc(tree: MirTree, loc: T, op: Opcode,
-         n: OpValue): AliveState {.nimcall, noSideEffect.}
-
 func skipConversions*(tree: MirTree, val: OpValue): OpValue =
   ## Returns the expression after skipping handle-only conversions.
   result = val
@@ -84,7 +63,7 @@ func isAlive*(tree: MirTree, cfg: DataFlowGraph,
         # return already
         return true
 
-    of opKill, opConsume:
+    of opKill, opConsume, opDestroy:
       if isPartOf(tree, loc, path n) == yes:
         # the location's value is consumed or the location is killed. No
         # operation coming before the current one can change that, so we can
@@ -141,7 +120,7 @@ func isLastRead*(tree: MirTree, cfg: DataFlowGraph, span: Subgraph,
         # the location is partially written to
         return false
 
-    of opKill:
+    of opKill, opDestroy:
       let cmp = compare(tree, loc, path n)
       if isAPartOfB(cmp) == yes:
         # the location is definitely killed, it no longer stores the value
@@ -166,26 +145,23 @@ func isLastRead*(tree: MirTree, cfg: DataFlowGraph, span: Subgraph,
   result = true
 
 func isLastWrite*(tree: MirTree, cfg: DataFlowGraph, span: Subgraph, loc: Path,
-                  start: InstrPos): tuple[result, exits, escapes: bool] =
+                  start: InstrPos): bool =
   ## Computes whether the location `loc` is reassigned or modified on any paths
   ## starting from and including `start`, returning 'false' if yes and 'true'
   ## if not. In other words, computes whether a reassignment or mutation that
   ## has a control-flow dependency on `start` and is located inside `span`
   ## observes the current value.
-  ##
-  ## In addition, whether the `start` is connected to a structured or
-  ## unstructured exit of `span` is also returned
   template path(val: OpValue): Path =
     computePath(tree, NodePosition val)
 
   var state: TraverseState
   for op, n in traverse(cfg, span, start, state):
     case op
-    of opDef, opMutate, opInvalidate:
+    of opDef, opMutate, opInvalidate, opDestroy:
       # note: since we don't know what happens to the location when it is
       # invalidated, the ``opInvalidate`` is also included here
       if overlaps(tree, loc, path n) != no:
-        return (false, false, false)
+        return false
 
     of opKill:
       let cmp = compare(tree, loc, path n)
@@ -199,92 +175,12 @@ func isLastWrite*(tree: MirTree, cfg: DataFlowGraph, span: Subgraph, loc: Path,
       if tree[loc.root].kind == mnkGlobal:
         # an unspecified global is mutated and we're analysing a location
         # derived from a global
-        return (false, false, false)
-
-    else:
-      discard
-
-  result = (true, state.exit, state.escapes)
-
-func computeAliveOp*[T: LocalId | GlobalId](
-  tree: MirTree, loc: T, op: Opcode, n: OpValue): AliveState =
-  ## Computes the state of `loc` at the *end* of the given operation. The
-  ## operands are expected to *not* alias with each other. The analysis
-  ## result will be wrong if they do
-
-  func isAnalysedLoc[T](n: MirNode, loc: T): bool =
-    when T is GlobalId:
-      n.kind == mnkGlobal and n.global == loc
-    elif T is LocalId:
-      n.kind in {mnkLocal, mnkParam, mnkTemp} and n.local == loc
-    else:
-      {.error.}
-
-  template isRootOf(val: OpValue): bool =
-    isAnalysedLoc(tree[getRoot(tree, val)], loc)
-
-  template sameLocation(val: OpValue): bool =
-    isAnalysedLoc(tree[skipConversions(tree, val)], loc)
-
-  case op
-  of opMutate, opDef:
-    if isRootOf(n):
-      # the analysed location or one derived from it is mutated
-      return alive
-
-  of opKill, opConsume:
-    if sameLocation(n):
-      # the location is killed or its value is consumed (i.e., moved somewhere
-      # else)
-      return dead
-
-  of opInvalidate:
-    discard "cannot be reasoned about here"
-
-  of opMutateGlobal:
-    when T is GlobalId:
-      # the operation mutates global state and we're analysing a global
-      result = alive
-
-  else:
-    discard
-
-func computeAlive*[T](tree: MirTree, cfg: DataFlowGraph,
-                      span: Subgraph, loc: T, op: static ComputeAliveProc[T]
-                     ): tuple[alive, escapes: bool] =
-  ## Computes whether the location is alive when `span` is exited via either
-  ## structured or unstructured control-flow. A location is considered alive
-  ## if it contains a value
-
-  # assigning to or mutating the analysed location makes it become alive,
-  # because it then stores a value. Consuming its value or using ``wasMoved``
-  # on it "kills" it (it no longer contains a value)
-
-  var exit = false
-  for opc, n in traverseFromExits(cfg, span, exit):
-    case op(tree, loc, opc, n)
-    of dead:
-      exit = true
-    of alive:
-      # the location is definitely alive when leaving the span via
-      # unstructured control-flow
-      return (true, true)
-    of unchanged:
-      discard
+        return false
 
-  # check if the location is alive at the structured exit of the span
-  for opc, n in traverseReverse(cfg, span, span.b + 1, exit):
-    case op(tree, loc, opc, n)
-    of dead:
-      exit = true
-    of alive:
-      # the location is definitely alive when leaving the span via
-      # structured control-flow
-      return (true, false)
-    of unchanged:
+    of opUse, opConsume:
       discard
 
-  result = (false, false)
+  result = true
 
 proc doesGlobalEscape*(tree: MirTree, scope: Subgraph, start: InstrPos,
                        s: GlobalId): bool =
diff --git a/compiler/mir/injecthooks.nim b/compiler/mir/injecthooks.nim
index 5fd03f8db13..f2bb6b40277 100644
--- a/compiler/mir/injecthooks.nim
+++ b/compiler/mir/injecthooks.nim
@@ -78,7 +78,7 @@ proc getOp*(g: ModuleGraph, t: PType, kind: TTypeAttachedOp): PSym =
 proc isUsedForSink(tree: MirTree, stmt: NodePosition): bool =
   ## Computes whether the definition statement is something produced for
   ## sink parameter handling.
-  assert tree[stmt].kind in {mnkDef, mnkDefUnpack}
+  assert tree[stmt].kind == mnkDef
   let def = tree.operand(stmt, 0)
   if tree[def].kind != mnkTemp:
     # only temporaries are used for sink handling
@@ -198,7 +198,7 @@ proc injectHooks*(body: MirBody, graph: ModuleGraph, env: var MirEnv,
         diags.add LocalDiag(pos: src, kind: ldkPassCopyToSink)
 
       case tree[stmt].kind
-      of mnkDef, mnkDefUnpack:
+      of mnkDef:
         # turn a ``def x = copy a.b`` into:
         #   def x
         #   =copy(name x, arg a.b)
@@ -235,7 +235,7 @@ proc injectHooks*(body: MirBody, graph: ModuleGraph, env: var MirEnv,
         typ  = tree[stmt, 0].typ
 
       if not hasDestructor(env[typ]) or
-         tree[stmt].kind in {mnkDef, mnkDefUnpack, mnkInit}:
+         tree[stmt].kind in {mnkDef, mnkInit}:
         # nothing to do if:
         # * the type has no hooks
         # * it's guaranteed that there's no value in the destination
diff --git a/compiler/mir/mirchangesets.nim b/compiler/mir/mirchangesets.nim
index c157f49ad2c..c629e725a41 100644
--- a/compiler/mir/mirchangesets.nim
+++ b/compiler/mir/mirchangesets.nim
@@ -20,6 +20,8 @@ type
     inner: TreeChangeset
     locals: PartialStore[LocalId, Local]
       ## new locals to be added on changeset application
+    nextLabel: uint32
+      ## exchanged with the builder, where it's used for allocating new IDs
 
 # ----------------------------------------
 # proxy routines
@@ -49,6 +51,13 @@ func initChangeset*(body: MirBody): Changeset =
   ## Sets up a changeset for `body`. The changeset either needs to be
   ## discarded, or applied to the same ``MirBody`` instance it was created for.
   result = Changeset(locals: fork(body.locals))
+  # compute the next ID to use for new labels:
+  for i, n in body.code.pairs:
+    case n.kind
+    of mnkLabel:
+      result.nextLabel = max(n.label.uint32 + 1, result.nextLabel)
+    else:
+      discard
 
 func initBuilder(c: var Changeset, buffer: var MirNodeSeq,
                  info: SourceId): MirBuilder =
@@ -56,10 +65,12 @@ func initBuilder(c: var Changeset, buffer: var MirNodeSeq,
   ## ``finishBuilder`` call.
   result = initBuilder(info, move buffer)
   swap(c.locals, result.locals)
+  swap(c.nextLabel, result.nextLabel)
 
 func finishBuilder(c: var Changeset, buffer: var MirNodeSeq,
                    bu: sink MirBuilder) =
   # move the ID counter and buffer back into the changeset
+  swap(c.nextLabel, bu.nextLabel)
   (buffer, c.locals) = finish(bu)
 
 template insert*(c: var Changeset, tree: MirTree, at, source: NodePosition,
diff --git a/compiler/mir/mirconstr.nim b/compiler/mir/mirconstr.nim
index bba849668f6..7b487689274 100644
--- a/compiler/mir/mirconstr.nim
+++ b/compiler/mir/mirconstr.nim
@@ -56,6 +56,8 @@ type
 
     locals*: PartialStore[LocalId, Local]
       ## new locals created with the builder
+    nextLabel*: uint32
+      ## the ID to use when allocating a new label ID
 
     # XXX: the internal fields are currently exported for the integration
     #      with changesets to work, but future refactorings should focus
@@ -230,6 +232,17 @@ template buildStmt*(bu: var MirBuilder, body: untyped) =
   let v = bu.push(body)
   bu.pop(v)
 
+template buildIf*(bu: var MirBuilder, cond, body: untyped) =
+  ## Emits the start and end of an ``if``, with `cond` providing the MIR for
+  ## the condition, and `body` providing the MIR for the body.
+  let label = bu.allocLabel()
+  bu.subTree mnkIf:
+    cond
+    bu.add MirNode(kind: mnkLabel, label: label)
+  body
+  bu.subTree mnkEndStruct:
+    bu.add MirNode(kind: mnkLabel, label: label)
+
 template buildStmt*(bu: var MirBuilder, k: MirNodeKind, body: untyped) =
   ## Similar to `buildStmt <#buildStmt,TCtx,untyped>`_, but also starts a sub-
   ## tree of kind `k`.
@@ -315,6 +328,11 @@ template allocTemp*(bu: var MirBuilder, t: TypeId, alias = false): Value =
   let id = bu.addLocal(Local(typ: t))
   allocTemp(bu, t, id, alias)
 
+func allocLabel*(bu: var MirBuilder): LabelId =
+  ## Allocates a fresh label ID.
+  result = LabelId(bu.nextLabel)
+  inc bu.nextLabel
+
 func use*(bu: var MirBuilder, val: sink Value) {.inline.} =
   ## Emits a use of `val`.
   if val.info.isSome:
@@ -394,6 +412,16 @@ func asgnMove*(bu: var MirBuilder, a, b: Value) =
     bu.use a
     bu.move b
 
+func join*(bu: var MirBuilder, label: LabelId) =
+  ## Emits a ``join`` statement with `label`.
+  bu.subTree mnkJoin:
+    bu.add MirNode(kind: mnkLabel, label: label)
+
+template buildBlock*(bu: var MirBuilder, id: LabelId, body: untyped) =
+  ## Emits `body` followed by a join statement for the given `id`.
+  body
+  bu.join id
+
 func inline*(bu: var MirBuilder, tree: MirTree, fr: NodePosition): Value =
   ## Inlines the lvalue operand for non-mutating use. This is meant to be used
   ## for materialzing immutable arguments when inlining calls / expanding
diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index 6c36f31a68d..d756701da2b 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -75,6 +75,7 @@ import
     mirbodies,
     mirconstr,
     mirenv,
+    mirgen_blocks,
     mirtrees,
     mirtypes,
     proto_mir,
@@ -95,6 +96,8 @@ import
     idioms
   ]
 
+import std/options as std_options
+
 type
   DestFlag = enum
     ## Extra information about an assignment destination. The flags are used to
@@ -111,12 +114,6 @@ type
 
     flags: set[DestFlag]
 
-  Block = object
-    ## Information about a ``block``
-    label: PSym ## the symbol of the block's label. 'nil' if the block has no
-                ## label
-    id: LabelId ## the block's internal label ID
-
   SourceProvider = object
     ## Stores the active origin and the in-progress database of origin
     ## ``PNode``s. Both are needed together in most cases, hence their bundling
@@ -149,22 +146,24 @@ type
       ## ownership of the environment
     builder: MirBuilder ## the builder for generating the MIR trees
 
-    blocks: seq[Block] ## the stack of active ``block``s. Used for looking up
-                       ## break targets
+    blocks: BlockCtx
     localsMap: Table[int, LocalId]
       ## maps symbol IDs of locals to the corresponding ``LocalId``
 
     sp: SourceProvider
 
-    numLabels: int ## provides the ID to use for the next label
     scopeDepth: int ## the current amount of scope nesting
     inLoop: int
       ## > 0 if the current statement/expression is part of a loop
+    injectDestructors: bool
+      ## whether injection of destroy operations is enabled
+    unreachable: bool
+      ## set to true when entering unreachable code (e.g., statements
+      ## immediately following a `break`). Disables:
+      ## * translation of AST
+      ## * emission of control-flow statements at block/scope end
 
     # input:
-    context: TSymKind ## what entity the input AST is part of (e.g. procedure,
-                      ## macro, module, etc.). Used to allow or change how the
-                      ## AST is interpreted in some places
     userOptions: set[TOption]
     graph: ModuleGraph
 
@@ -224,10 +223,6 @@ proc typeToMir(c: var TCtx, t: PType): TypeId =
   if t.isNil: VoidType
   else:       c.env.types.add(t)
 
-func nextLabel(c: var TCtx): LabelId =
-  result = LabelId(c.numLabels)
-  inc c.numLabels
-
 # ----------- SourceProvider API -------------
 
 template useSource(bu: var MirBuilder, sp: var SourceProvider,
@@ -283,12 +278,17 @@ template subTree(c: var TCtx, n: MirNode, body: untyped) =
 template scope(c: var TCtx, body: untyped) =
   inc c.scopeDepth
   c.builder.subTree mnkScope:
+    let prev = c.blocks.startScope()
     body
+    c.blocks.closeScope(c.builder, prev, not c.unreachable)
   dec c.scopeDepth
 
 template use(c: var TCtx, val: Value) =
   c.builder.use(val)
 
+template join(c: var TCtx, label: LabelId) =
+  c.builder.join(label)
+
 template emitByVal(c: var TCtx, val: Value) =
   ## Emits a pass-by-value argument sub-tree with `val`.
   c.builder.emitByVal(val)
@@ -365,6 +365,12 @@ proc toFloatLiteral(env: var MirEnv, n: PNode): Value =
 func strLiteral(env: var MirEnv, str: string, typ: TypeId): Value =
   literal(env.getOrIncl(str), typ)
 
+template labelNode(lbl: LabelId): MirNode =
+  MirNode(kind: mnkLabel, label: lbl)
+
+template newLabelNode(c: var TCtx): MirNode =
+  labelNode(c.builder.allocLabel())
+
 func nameNode(c: var TCtx, s: PSym): MirNode =
   let t = c.typeToMir(s.typ)
   case s.kind
@@ -394,8 +400,11 @@ template allocTemp(c: var TCtx, typ: TypeId; alias=false): Value =
   ## Allocates a new ID for a temporary and returns the name.
   c.builder.allocTemp(typ, alias)
 
+template allocLabel(c: var TCtx): LabelId =
+  c.builder.allocLabel()
+
 proc gen(c: var TCtx; n: PNode)
-proc genx(c: var TCtx; e: PMirExpr, i: int)
+proc genx(c: var TCtx; e: PMirExpr, i: int; fromMove = false)
 proc genComplexExpr(c: var TCtx, n: PNode, dest: Destination)
 
 proc genAsgn(c: var TCtx, dest: Destination, rhs: PNode)
@@ -419,6 +428,9 @@ func getTemp(c: var TCtx, typ: TypeId): Value =
       c.use result
       c.add MirNode(kind: mnkNone)
 
+template raiseExit(c: var TCtx) =
+  raiseExit(c.blocks, c.builder)
+
 template buildStmt(c: var TCtx, k: MirNodeKind, body: untyped) =
   c.builder.buildStmt(k, body)
 
@@ -430,6 +442,7 @@ template buildCheckedMagicCall(c: var TCtx, m: TMagic, t: TypeId,
   c.subTree MirNode(kind: mnkCheckedCall, typ: t):
     c.add MirNode(kind: mnkMagic, magic: m)
     body
+    raiseExit(c)
 
 template buildDefectMagicCall(c: var TCtx, m: TMagic, t: TypeId,
                               body: untyped) =
@@ -447,6 +460,24 @@ template buildDefectMagicCall(c: var TCtx, m: TMagic, t: TypeId,
   c.subTree MirNode(kind: kind, typ: t):
     c.add MirNode(kind: mnkMagic, magic: m)
     body
+    if kind == mnkCheckedCall:
+      raiseExit(c)
+
+template buildIf(c: var TCtx, cond, body: untyped) =
+  let label = c.builder.allocLabel()
+  c.buildStmt mnkIf:
+    cond
+    c.add labelNode(label)
+  body
+  c.buildStmt mnkEndStruct:
+    c.add labelNode(label)
+
+proc register(c: var TCtx, loc: Value) =
+  ## If `loc` has a destructor and destroy injection is enabled for the
+  ## current context, registers `loc` for destruction at the end of the
+  ## current scope.
+  if c.injectDestructors and c.env[loc.typ].hasDestructor():
+    c.blocks.register(loc)
 
 proc singleToValue(c: var TCtx, e: PMirExpr, i: int): Value =
   c.builder.useSource(c.sp, e[i].orig)
@@ -470,6 +501,9 @@ proc toValue(c: var TCtx, e: PMirExpr, i: int, def: MirNodeKind): Value =
         c.use result
         c.builder.pop(f)
 
+    if def == mnkDef:
+      c.register(result)
+
 proc toValue(c: var TCtx, e: PMirExpr, i: int): Value =
   ## Generates the MIR code for the given expression and turns it into a
   ## ``Value``.
@@ -569,10 +603,8 @@ proc genAndOr(c: var TCtx, n: PNode, dest: Destination) =
       c.buildMagicCall mNot, BoolType:
         c.emitByVal v
 
-  c.subTree mnkIf:
-    c.use v
-    c.subTree mnkStmtList:
-      genAsgn(c, dest, n[2]) # the right-hand side
+  c.buildIf (c.use v;):
+    genAsgn(c, dest, n[2]) # the right-hand side
 
 proc genFieldCheck(c: var TCtx, access: Value, call: PNode, inverted: bool,
                    field: string) =
@@ -773,6 +805,12 @@ proc genCall(c: var TCtx, n: PNode) =
                     effects: effects):
     genCallee(c, n[0])
     genArgs(c, n)
+    if kind == mnkCheckedCall:
+      raiseExit(c)
+
+  # code following the call of a .noreturn routine is unreachable:
+  if n[0].kind == nkSym and sfNoReturn in n[0].sym.flags:
+    c.unreachable = true
 
 proc genMacroCallArgs(c: var TCtx, n: PNode, kind: TSymKind, fntyp: PType) =
   ## Generates the arguments for a macro/template call expression. `n` is
@@ -834,35 +872,47 @@ proc genInSetOp(c: var TCtx, n: PNode) =
       a   = genRd(c, x[1])
       b   = genRd(c, x[2])
 
-    c.buildStmt mnkIf:
-      # condition: ``a <= x:``
-      c.wrapAndUse(BoolType):
-        c.buildMagicCall leOp, BoolType:
-          c.emitByVal a
-          c.emitByVal val
-      # the outer body:
-      c.subTree mnkStmtList:
+    c.builder.buildStmt:
+      let
+        label1 = c.allocLabel()
+        label2 = c.allocLabel()
+
+      c.subTree mnkIf:
+        # condition: ``a <= x:``
+        c.wrapAndUse(BoolType):
+          c.buildMagicCall leOp, BoolType:
+            c.emitByVal a
+            c.emitByVal val
+        c.add labelNode(label1)
+
+      c.subTree mnkIf:
         # condition: ``x <= b:``
-        c.subTree mnkIf:
-          c.wrapAndUse(BoolType):
-            c.buildMagicCall leOp, BoolType:
-              c.emitByVal val
-              c.emitByVal b
-          c.subTree mnkStmtList:
-            var sv: Value
-            if se.kind == nkCurly and not isDeepConstExpr(se):
-              sv = c.allocTemp(c.typeToMir(se.typ))
-              c.subTree mnkDef:
-                c.use sv
-                genSetConstr(c, se)
-            else:
-              sv = genRd(c, se)
-
-            c.subTree mnkInit:
-              c.use res
-              c.buildMagicCall mInSet, BoolType:
-                c.emitByVal sv
-                c.emitByVal val
+        c.wrapAndUse(BoolType):
+          c.buildMagicCall leOp, BoolType:
+            c.emitByVal val
+            c.emitByVal b
+        c.add labelNode(label2)
+
+      var sv: Value
+      if se.kind == nkCurly and not isDeepConstExpr(se):
+        sv = c.allocTemp(c.typeToMir(se.typ))
+        c.subTree mnkDef:
+          c.use sv
+          genSetConstr(c, se)
+      else:
+        sv = genRd(c, se)
+
+      c.subTree mnkInit:
+        c.use res
+        c.buildMagicCall mInSet, BoolType:
+          c.emitByVal sv
+          c.emitByVal val
+
+      # close the if statements:
+      c.subTree mnkEndStruct:
+        c.add labelNode(label2)
+      c.subTree mnkEndStruct:
+        c.add labelNode(label1)
 
     c.use res
   else:
@@ -1029,6 +1079,7 @@ proc genMagic(c: var TCtx, n: PNode; m: TMagic) =
       c.buildTree mnkCheckedCall, rtyp:
         c.genCallee(n[0])
         arg n[1]
+        raiseExit(c)
     else:
       genCall(c, n)
 
@@ -1136,6 +1187,7 @@ proc genMagic(c: var TCtx, n: PNode; m: TMagic) =
                         effects: {geMutateGlobal}):
         # we can use the internal signature
         genMacroCallArgs(c, n, skMacro, callee.sym.internal)
+        raiseExit(c)
     else:
       unreachable()
 
@@ -1218,7 +1270,12 @@ proc genRaise(c: var TCtx, n: PNode) =
     # ``sink`` parameter
     var e = exprToPmir(c, n[0], true, false)
     wantConsumeable(e)
-    let tmp = toValue(c, e, e.high)
+    # we cannot use ``toValue`` here, since the temporary must not be
+    # registered for destruction -- it's moved into the `raise` operation
+    let tmp = c.wrapTemp c.typeToMir(e[^1].typ):
+      assert e[^1].kind == pirMat
+      # skip the 'materialize' node
+      genx(c, e, e.high - 1, fromMove=true)
 
     # emit the preparation code:
     let
@@ -1237,17 +1294,25 @@ proc genRaise(c: var TCtx, n: PNode) =
     # emit the raise statement:
     c.buildStmt mnkRaise:
       c.use tmp
+      raiseExit(c)
   else:
     # a re-raise statement
     c.buildStmt mnkRaise:
       c.add MirNode(kind: mnkNone)
+      raiseExit(c)
+
+  # code following a raise statement is unreachable:
+  c.unreachable = true
 
 proc genReturn(c: var TCtx, n: PNode) =
   assert n.kind == nkReturnStmt
   if n[0].kind != nkEmpty:
     gen(c, n[0])
 
-  c.add MirNode(kind: mnkReturn)
+  c.buildStmt mnkGoto:
+    blockExit(c.blocks, c.builder, 0)
+
+  c.unreachable = true
 
 proc genAsgnSource(c: var TCtx, e: PNode, status: set[DestFlag]) =
   ## Generates the MIR code for the right-hand side of an assignment.
@@ -1270,15 +1335,6 @@ proc genAsgnSource(c: var TCtx, e: PNode, status: set[DestFlag]) =
 
   genx(c, e, e.high)
 
-proc genAsgn(c: var TCtx, dest: Destination, rhs: PNode) =
-  assert dest.isSome
-  let kind =
-    if dfEmpty in dest.flags: mnkInit
-    else:                     mnkAsgn
-  c.buildStmt kind:
-    c.use dest.val
-    c.genAsgnSource(rhs, dest.flags)
-
 proc unwrap(c: var TCtx, n: PNode): PNode =
   ## If `n` is a statement-list expression, generates the code for all
   ## statements and returns the unwrapped expression. The unchanged `n` is
@@ -1292,6 +1348,19 @@ proc unwrap(c: var TCtx, n: PNode): PNode =
     result = result.lastSon
     assert result.kind != nkStmtListExpr
 
+proc genAsgn(c: var TCtx, dest: Destination, rhs: PNode) =
+  assert dest.isSome
+  let kind =
+    if dfEmpty in dest.flags: mnkInit
+    else:                     mnkAsgn
+
+  let rhs = unwrap(c, rhs)
+  # the right-hand expression might not return, making the assignment dead code
+  if not c.unreachable:
+    c.buildStmt kind:
+      c.use dest.val
+      c.genAsgnSource(rhs, dest.flags)
+
 proc genAsgn(c: var TCtx, isFirst, sink: bool, lhs, rhs: PNode) =
   ## Generates the code for an assignment. `isFirst` indicates if this is the
   ## first assignment to the location named by `lhs`.
@@ -1306,6 +1375,10 @@ proc genAsgn(c: var TCtx, isFirst, sink: bool, lhs, rhs: PNode) =
     lhs = unwrap(c, lhs)
     sink = sink and not isCursor(lhs)
 
+  if c.unreachable:
+    # the left-hand expression terminates -> the assignment is dead code
+    return
+
   case rhs.kind
   of ComplexExprs:
     # optimization: forward the destination. For example:
@@ -1373,6 +1446,9 @@ proc genLocDef(c: var TCtx, n: PNode, val: PNode) =
       else:
         c.add MirNode(kind: mnkNone)
 
+    if sfCursor notin s.flags:
+      c.register(genLocation(c, n))
+
 proc genLocInit(c: var TCtx, symNode: PNode, initExpr: PNode) =
   ## Generates the code for a location definition. `sym` is the symbol of the
   ## location and `initExpr` the initializer expression
@@ -1419,7 +1495,7 @@ proc genVarTuple(c: var TCtx, n: PNode) =
   else:
     # generate the definition for the temporary:
     let val = c.allocTemp(c.typeToMir(initExpr.typ))
-    c.buildStmt mnkDefUnpack:
+    c.buildStmt mnkDef:
       c.use val
       # ensure that the temporary owns the tuple value:
       genAsgnSource(c, initExpr, {dfEmpty, dfOwns})
@@ -1445,6 +1521,9 @@ proc genVarTuple(c: var TCtx, n: PNode) =
                             position: i.uint32):
             c.use val
 
+    # it's guaranteed that all elements are moved out of the tuple, no
+    # destruction is needed
+
 proc genVarSection(c: var TCtx, n: PNode) =
   for a in n:
     case a.kind
@@ -1488,34 +1567,41 @@ proc genVarSection(c: var TCtx, n: PNode) =
 proc genWhile(c: var TCtx, n: PNode) =
   ## Generates the code for a ``nkWhile`` node.
   assert isTrue(n[0]), "`n` wasn't properly transformed"
-  c.subTree MirNode(kind: mnkRepeat):
-    c.scope:
-      inc c.inLoop
-      c.gen(n[1])
-      dec c.inLoop
+  let label = c.allocLabel()
+  c.subTree mnkLoopJoin:
+    c.add labelNode(label)
+  c.scope:
+    inc c.inLoop
+    c.gen(n[1])
+    dec c.inLoop
+  c.subTree mnkLoop:
+    c.add labelNode(label)
+  # a while loop has no structured exit:
+  c.unreachable = true
+
+proc closeBlock(c: var TCtx) =
+  if c.blocks.closeBlock(c.builder):
+    c.unreachable = false
+
+template withBlock(c: var TCtx, k: BlockKind, body: untyped) =
+  c.blocks.add Block(kind: k)
+  body
+  c.closeBlock()
+
+template withBlock(c: var TCtx, k: BlockKind, lbl: LabelId, body: untyped) =
+  c.blocks.add Block(kind: k, id: some lbl)
+  body
+  c.closeBlock()
 
 proc genBlock(c: var TCtx, n: PNode, dest: Destination) =
-  ## Generates and emits the MIR code for a ``block`` expression or statement
-  if sfUsed notin n[0].sym.flags:
-    # if the label is never used, it means that the block is only used for
-    # scoping. Omit emitting an ``mnkBlock`` and just use a scope
-    c.scope: c.genWithDest(n[1], dest)
-    return
-
-  let id = nextLabel(c)
-
-  # push the block to the stack:
-  var oldLen = c.blocks.len
-  c.blocks.add Block(label: n[0].sym, id: id)
+  ## Generates and emits the MIR code for a ``block`` expression or statement.
+  ## A block translates to a scope and, optionally, a join.
+  c.blocks.add Block(kind: bkBlock, label: n[0].sym)
 
   # generate the body:
-  c.subTree MirNode(kind: mnkBlock, label: id):
-    c.scope:
-      c.genWithDest(n[1], dest)
-
-  # pop the block:
-  assert c.blocks.len == oldLen + 1
-  c.blocks.setLen(oldLen)
+  c.scope:
+    c.genWithDest(n[1], dest)
+  c.closeBlock()
 
 proc genBranch(c: var TCtx, n: PNode, dest: Destination) =
   ## Generates the body of a branch. Here, a branch refers to either an
@@ -1528,6 +1614,21 @@ proc genBranch(c: var TCtx, n: PNode, dest: Destination) =
   else:
     gen(c, n)
 
+proc leaveBlock(c: var TCtx) =
+  ## Emits a goto for jumping to the exit of the first enclosing block, but
+  ## only if not in an unreachable context.
+  if c.unreachable:
+    return # omit the leave actions if not reachable
+
+  if c.scopeDepth > 0:
+    # only emit the early scope exit if still within a scope
+    earlyExit(c.blocks, c.builder)
+
+  c.subTree mnkGoto:
+    blockExit(c.blocks, c.builder, closest(c.blocks))
+
+  c.unreachable = true # code following a goto is unreachable
+
 proc genIf(c: var TCtx, n: PNode, dest: Destination) =
   ## Generates the code for an ``if`` statement (``nkIf(Stmt|Expr)``). It's
   ## translated to the ``mnkIf`` MIR construct (which can be seen as a
@@ -1566,31 +1667,30 @@ proc genIf(c: var TCtx, n: PNode, dest: Destination) =
     ## Generates the code for a single ``nkElif(Branch|Expr)``
     c.scope:
       let v = genUse(c, branch[0])
-      c.subTree mnkIf:
-        c.use v
+      c.buildIf (c.use v;):
         c.scope:
           genBranch(c, branch.lastSon, dest)
           extra
 
+      # if the start of the branch was reachable, then so is the code
+      # following the branch
+      c.unreachable = false
+
   if n.len == 1:
-    # an ``if`` statement/expression with a single branch. Don't emit the
-    # unnecessary 'block' and 'break'
+    # an ``if`` statement/expression with a single branch. Don't wrap in a
+    # block
     genElifBranch(n[0]):
       discard
 
   else:
     # a multi-clause ``if`` statement/expression
-    let label = nextLabel(c)
-    c.subTree MirNode(kind: mnkBlock, label: label):
-      c.subTree mnkStmtList:
+    c.withBlock bkBlock: # <- the exit to jump to at the end of each branch
+      if true:
         for it in n.items:
           case it.kind
           of nkElifBranch, nkElifExpr:
             genElifBranch(it):
-              # don't emit the 'break' if the branch doesn't have a structured
-              # exit
-              if not endsInNoReturn(it.lastSon):
-                c.add MirNode(kind: mnkBreak, label: label)
+              leaveBlock(c)
 
           of nkElse, nkElseExpr:
             c.scope:
@@ -1601,18 +1701,17 @@ proc genIf(c: var TCtx, n: PNode, dest: Destination) =
             unreachable(it.kind)
 
 proc genCase(c: var TCtx, n: PNode, dest: Destination) =
-  ## Generates the MIR code for an ``nkCaseStmt`` node. Since the ``mnkCase``
-  ## MIR construct works in a very similar way, the translation logic is
-  ## straightforward
+  ## Generates the MIR code for an ``nkCaseStmt`` node.
   assert isEmptyType(n.typ) == not dest.isSome
 
   let v = genUse(c, n[0])
-  c.add MirNode(kind: mnkCase, len: uint32(n.len - 1))
+  c.add MirNode(kind: mnkCase, len: uint32(n.len))
   c.use v
 
-  # iterate of/else branches:
+  let firstLabel = c.builder.nextLabel
+  # first step: emit the dispatcher
   for (_, branch) in branches(n):
-    c.add MirNode(kind: mnkBranch, len: uint32(branch.len - 1))
+    c.add MirNode(kind: mnkBranch, len: uint32(branch.len))
 
     case branch.kind
     of nkElse:
@@ -1629,19 +1728,33 @@ proc genCase(c: var TCtx, n: PNode, dest: Destination) =
     else:
       unreachable(branch.kind)
 
-    # the branch's body:
-    c.scope:
-      genBranch(c, branch.lastSon, dest)
-
+    c.add newLabelNode(c) # the jump target
     c.add endNode(mnkBranch)
 
   c.add endNode(mnkCase)
 
-proc genExceptBranch(c: var TCtx, n: PNode, dest: Destination) =
+  # second step: emit the branch bodies
+  c.withBlock bkBlock:
+    for (i, branch) in branches(n):
+      c.join LabelId(firstLabel + uint32(i))
+      c.unreachable = false # every branch starts as reachable again
+      c.scope:
+        genBranch(c, branch.lastSon, dest)
+        leaveBlock(c)
+
+proc genExceptBranch(c: var TCtx, n: PNode, label: LabelId,
+                     next: Option[LabelId], dest: Destination) =
   assert n.kind == nkExceptBranch
   c.builder.useSource(c.sp, n)
+  let withFilter = n.len > 1
+
+  # the except branch is reachable:
+  c.unreachable = false
+
+  c.subTree MirNode(kind: mnkExcept,
+                    len: uint32(1 + (n.len - 1) + ord(withFilter))):
+    c.add labelNode(label) # name of the except
 
-  c.subTree MirNode(kind: mnkBranch, len: uint32(n.len - 1)):
     # emit the exception types the branch covers:
     for _, tn in branchLabels(n):
       case tn.kind
@@ -1656,36 +1769,96 @@ proc genExceptBranch(c: var TCtx, n: PNode, dest: Destination) =
       else:
         unreachable()
 
-    # generate the body of the branch:
+    if withFilter:
+      # exception handlers with filters fork to another handler on mismatch
+      if next.isSome:
+        # try the next handler from the current try statement
+        c.add labelNode(next.unsafeGet)
+      else:
+        # continue raising
+        raiseExit(c)
+
+  # generate the body of the except branch:
+  c.withBlock bkExcept, label:
     c.scope:
       genBranch(c, n.lastSon, dest)
+      leaveBlock(c)
+
+  c.subTree mnkEndStruct:
+    c.add labelNode(label)
+
+proc genExcept(c: var TCtx, n: PNode, len: int, dest: Destination) =
+  let tryBlock = c.blocks.pop()
+  if tryBlock.id.isNone:
+    # the exception handlers are never entered, omit them
+    return
+
+  var next = tryBlock.id.unsafeGet()
+    ## the label of the next handler
+
+  for i in 1..<len:
+    let curr = next
+    if i + 1 < len:
+      # there's another except branch in the try
+      next = c.allocLabel()
+      c.genExceptBranch(n[i], curr, some next, dest)
+    else:
+      # this is the last branch
+      c.genExceptBranch(n[i], curr, none LabelId, dest)
+
+proc genFinally(c: var TCtx, n: PNode) =
+  let blk = c.blocks.pop()
+  if blk.id.isNone:
+    # the finally is never entered, omit it
+    return
+
+  c.unreachable = false # the finally is reachable
+  c.builder.useSource(c.sp, n)
+  c.subTree mnkFinally:
+    c.add labelNode(blk.id.unsafeGet)
+
+  # translate the body:
+  c.withBlock bkFinally, blk.id.unsafeGet:
+    c.scope:
+      c.gen(n[^1])
+
+  # the continue statement is always necessary, even if the body has no
+  # structured exit
+  c.subTree MirNode(kind: mnkContinue, len: uint32(1 + blk.exits.len)):
+    c.add labelNode(blk.id.unsafeGet)
+    for it in blk.exits.items:
+      c.add labelNode(it)
 
 proc genTry(c: var TCtx, n: PNode, dest: Destination) =
   let
     hasFinally = n.lastSon.kind == nkFinally
     hasExcept = n[1].kind == nkExceptBranch
 
-  c.add MirNode(kind: mnkTry, len: uint32(ord(hasFinally) + ord(hasExcept)))
+  # the anonymous block to provide the exit:
+  c.blocks.add Block(kind: bkBlock)
+
+  if hasFinally:
+    # the finally clause also applies to the except clauses, so it's
+    # pushed first
+    c.blocks.add Block(kind: bkTryFinally)
+
+  if hasExcept:
+    c.blocks.add Block(kind: bkTryExcept)
+
+  # the body of the try:
   c.scope:
     c.genBranch(n[0], dest)
-
-  let len =
-    if hasFinally: n.len-1
-    else: n.len
-    ## the number of sub-nodes excluding ``nkFinally``
+    leaveBlock(c)
 
   if hasExcept:
-    c.subTree MirNode(kind: mnkExcept, len: uint32(len-1)):
-      for i in 1..<len:
-        genExceptBranch(c, n[i], dest)
+    genExcept(c, n, n.len - ord(hasFinally), dest)
 
   if hasFinally:
-    c.builder.useSource(c.sp, n.lastSon)
-    c.subTree MirNode(kind: mnkFinally):
-      c.scope:
-        c.gen(n.lastSon[0])
+    genFinally(c, n[^1])
 
-  c.add endNode(mnkTry)
+  # presume unreachable, closing the block will correct the presumption
+  c.unreachable = true
+  c.closeBlock()
 
 proc genAsmOrEmitStmt(c: var TCtx, kind: range[mnkAsm..mnkEmit], n: PNode) =
   ## Generates and emits the MIR code for an emit directive or ``asm``
@@ -1733,14 +1906,14 @@ proc toConstant(c: var TCtx, n: PNode): Value =
   let con = toConstId c.env.data.getOrPut(constDataToMir(c.env, n))
   toValue(con, c.typeToMir(n.typ))
 
-proc genx(c: var TCtx, e: PMirExpr, i: int) =
+proc genx(c: var TCtx, e: PMirExpr, i: int; fromMove = false) =
   ## Translates the proto-MIR expression to MIR code and emits it into the
   ## current front buffer.
   let n {.cursor.} = e[i]
   c.builder.useSource(c.sp, n.orig)
 
-  template recurse() =
-    genx(c, e, i - 1)
+  template recurse(fromMove = false) =
+    genx(c, e, i - 1, fromMove)
 
   proc viewOp(kind: MirNodeKind, typ: PType): MirNodeKind {.nimcall.} =
     # pick the correct kind based on the var-ness
@@ -1795,7 +1968,8 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
       recurse()
   of pirLvalueConv:
     c.buildOp mnkPathConv, typ:
-      recurse()
+      # moves are propagated through lvalue conversions
+      recurse(fromMove)
   of pirCheckedArrayAccess, pirCheckedSeqAccess:
     let
       arr = toValue(c, e, i - 1)
@@ -1821,7 +1995,7 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
     let
       val = toValue(c, e, i - 1)
 
-    c.buildStmt mnkIf:
+    c.buildIf:
       # the ``x != nil`` condtion:
       c.wrapAndUse(BoolType):
         c.buildMagicCall mNot, BoolType:
@@ -1829,8 +2003,9 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
             c.wrapAndUse(BoolType):
               c.buildMagicCall mIsNil, BoolType:
                 c.emitByVal val
+    do:
       # the check:
-      c.subTree mnkScope:
+      c.buildStmt mnkScope:
         c.subTree mnkVoid:
           c.buildDefectMagicCall mChckObj, VoidType:
             c.emitByVal val
@@ -1921,7 +2096,20 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
       for i in 0..<orig.len-1:
         gen(c, orig[i])
 
-    recurse()
+    if c.unreachable:
+      # don't translate the expression if it's unreachable. The callsite still
+      # expects some expression, and thus a default-initialized temporary is
+      # used. Do note that the code is unreachable, and the assignment is thus
+      # never evaluated -- it's just there to uphold the callsite's syntactic
+      # expectations
+      # XXX: ideally, non-terminating statement list expressions should
+      #      have the trailing expression cut off and be turned into
+      #      ``nkStmtList`` nodes at an earlier stage
+      c.wrapAndUse typ:
+        c.buildMagicCall mDefault, typ:
+          discard
+    else:
+      recurse()
   of pirComplex:
     # attempting to generate the code for a complex expression without a
     # destination specified -> assign the value resulting from it to a
@@ -1932,13 +2120,14 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
       genComplexExpr(c, n.orig):
         Destination(isSome: true, val: tmp, flags: {dfOwns, dfEmpty})
 
+    # the temporary is registered for destruction by the ``pirMat`` handling
     c.use tmp
   of pirCopy:
     c.buildOp mnkCopy, typ:
       recurse()
   of pirMove:
     c.buildOp mnkMove, typ:
-      recurse()
+      recurse(fromMove = true)
   of pirSink, pirDestructiveMove:
     # a destructive move is currently not translated into a move + wasMoved,
     # but rather into a sink, which is then, if necessary, later turned into
@@ -1946,6 +2135,11 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
     c.buildOp mnkSink, typ:
       recurse()
   of pirMat, pirMatCursor:
+    template needsDestroy(): bool =
+      # the materialized temporary needs to be destroyed if owning and not
+      # immediately moved afterwards
+      n.kind == pirMat and not fromMove
+
     let f = c.builder.push: recurse()
     # only materialize a temporary if the expression is not already a
     # temporary introduced by the PMIR-to-MIR translation
@@ -1955,6 +2149,15 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
         c.subTree (if n.kind == pirMat: mnkDef else: mnkDefCursor):
           c.use tmp
           c.builder.pop(f)
+
+      if needsDestroy():
+        c.register(tmp)
+      c.use tmp
+    elif needsDestroy():
+      # nothing to materialize (the input is already a temporary), but the
+      # temporary still needs to be registered for destruction
+      let tmp = c.builder.popSingle(f)
+      c.register(tmp)
       c.use tmp
   of pirMatLvalue:
     let tmp = c.allocTemp(typ, true)
@@ -1966,6 +2169,9 @@ proc genx(c: var TCtx, e: PMirExpr, i: int) =
 
 proc gen(c: var TCtx, n: PNode) =
   ## Generates and emits the MIR code for the statement `n`
+  if c.unreachable:
+    return
+
   c.builder.useSource(c.sp, n)
 
   # because of ``.discardable`` calls, we can't require `n` to be of void
@@ -1998,18 +2204,10 @@ proc gen(c: var TCtx, n: PNode) =
   of nkPragmaBlock:
     gen(c, n.lastSon)
   of nkBreakStmt:
-    var id: LabelId
-    block search:
-      let sym = n[0].sym
-      # find the block with the matching label and use its ``LabelId``:
-      for b in c.blocks.items:
-        if b.label.id == sym.id:
-          id = b.id
-          break search
-
-      unreachable "break target missing"
-
-    c.add MirNode(kind: mnkBreak, label: id)
+    c.buildStmt mnkGoto:
+      blockExit(c.blocks, c.builder, findBlock(c.blocks, n[0].sym))
+
+    c.unreachable = true # code following a break is unreachable
   of nkVarSection, nkLetSection:
     genVarSection(c, n)
   of nkAsgn:
@@ -2051,7 +2249,12 @@ proc gen(c: var TCtx, n: PNode) =
           c.builder.pop(f)
   of nkDiscardStmt:
     if n[0].kind != nkEmpty:
-      let e = exprToPmir(c, unwrap(c, n[0]), false, false)
+      let n = unwrap(c, n[0])
+      if c.unreachable:
+        # don't translate the expression
+        return
+
+      let e = exprToPmir(c, n, false, false)
       case classify(e)
       of Rvalue:
         discard toValue(c, e, e.high, mnkDefCursor)
@@ -2116,14 +2319,26 @@ proc genWithDest(c: var TCtx, n: PNode; dest: Destination) =
   else:
     gen(c, n)
 
+proc initCtx(graph: ModuleGraph, config: TranslationConfig, owner: PSym,
+             env: sink MirEnv): TCtx =
+  result = TCtx(graph: graph, config: config, env: move env)
+  if owner != nil:
+    result.userOptions = owner.options
+    result.injectDestructors =
+      sfInjectDestructors in owner.flags and
+      sfGeneratedOp notin owner.flags and
+      goIsCompileTime notin result.config.options
+  else:
+    # default to injecting destructors
+    result.injectDestructors = goIsCompileTime notin result.config.options
+
 proc generateAssignment*(graph: ModuleGraph, env: var MirEnv,
                    config: TranslationConfig, n: PNode,
                    builder: var MirBuilder, source: var SourceMap) =
   ## Translates an `nkIdentDefs` AST into MIR and emits the result into
   ## `builder`'s currently selected buffer.
   assert n.kind == nkIdentDefs and n.len == 3
-  var c = TCtx(context: skUnknown, graph: graph, config: config,
-               env: move env)
+  var c = initCtx(graph, config, nil, move env)
   # treat the code as top-level code so that no 'def' is generated for
   # assignments to globals
   c.scopeDepth = 1
@@ -2174,55 +2389,53 @@ proc generateCode*(graph: ModuleGraph, env: var MirEnv, owner: PSym,
   #      might no longer be present after the lambdalifting pass
   #assert nfTransf in body.flags, "transformed AST is expected as input"
 
-  var c = TCtx(context: owner.kind, graph: graph, config: config,
-               userOptions: owner.options, env: move env)
+  var c = initCtx(graph, config, owner, move env)
   c.sp.active = (body, c.sp.map.add(body))
 
-  c.scopeDepth = 1
-  c.add MirNode(kind: mnkScope)
-  if sfNeverRaises in owner.flags:
-    c.add MirNode(kind: mnkTry, len: 1)
-    c.add MirNode(kind: mnkStmtList)
-
-  if owner.kind in routineKinds:
-    # the procedure backing a macro has its own internal signature; use that
-    # beyond this point
-    let signature =
-      if owner.kind == skMacro:
-        owner.internal
-      else:
-        owner.typ
-
-    addParams(c, owner, signature)
-    # add a 'def' for each ``sink`` parameter. This simplifies further
-    # processing and analysis
-    let params = signature.n
-    for i in 1..<params.len:
-      let s = params[i].sym
-      if s.typ.isSinkTypeForParam():
-        c.subTree mnkDef:
-          c.add nameNode(c, s)
-          c.add MirNode(kind: mnkNone)
-  else:
-    # reserve the result slot:
-    discard c.addLocal(Local())
-
-  gen(c, body)
-
-  if sfNeverRaises in owner.flags:
-    # if it's enforced that the procedure never raises, exceptions escaping
-    # the procedure terminate the program. This is achieved by wrapping the
-    # body in a catch-all exception handler
-    c.add endNode(mnkStmtList)
-    c.subTree MirNode(kind: mnkExcept, len: 1):
-      c.subTree mnkBranch:
-        c.subTree mnkVoid:
-          let p = c.graph.getCompilerProc("nimUnhandledException")
-          c.builder.buildCall c.env.procedures.add(p), VoidType:
-            discard
-    c.add endNode(mnkTry)
+  c.withBlock bkBlock: # the target for return statements
+    if sfNeverRaises in owner.flags:
+      # it needs to be ensured that no exceptions leave the body
+      c.blocks.add Block(kind: bkTryExcept)
 
-  c.add endNode(mnkScope)
+    c.scope:
+      if owner.kind in routineKinds:
+        # the procedure backing a macro has its own internal signature; use that
+        # beyond this point
+        let signature =
+          if owner.kind == skMacro:
+            owner.internal
+          else:
+            owner.typ
+
+        addParams(c, owner, signature)
+        # add a 'def' for each ``sink`` parameter. This simplifies further
+        # processing and analysis
+        let params = signature.n
+        for i in 1..<params.len:
+          let s = params[i].sym
+          if s.typ.isSinkTypeForParam():
+            c.subTree mnkDef:
+              c.add nameNode(c, s)
+              c.add MirNode(kind: mnkNone)
+            # the sink parameter requires destruction:
+            c.register(genLocation(c, params[i]))
+      else:
+        # reserve the result slot:
+        discard c.addLocal(Local())
+
+      gen(c, body)
+
+    if sfNeverRaises in owner.flags and (let b = c.blocks.pop(); b.id.isSome):
+      leaveBlock(c) # jump over the handler
+      # emit the handler for panicking on escaping exceptions:
+      c.subTree MirNode(kind: mnkExcept, len: 1):
+        c.add labelNode(b.id.unsafeGet)
+      c.subTree mnkVoid:
+        let p = c.graph.getCompilerProc("nimUnhandledException")
+        c.builder.buildCall c.env.procedures.add(p), VoidType:
+          discard
+      c.subTree mnkEndStruct:
+        c.add labelNode(b.id.unsafeGet)
 
   env = c.env
 
@@ -2235,26 +2448,27 @@ proc exprToMir*(graph: ModuleGraph, env: var MirEnv,
   ## Only meant to be used by `vmjit <#vmjit>`_. Produces a MIR body for a
   ## standalone expression. The result of the expression is assigned to the
   ## special local with ID 0.
-  var c = TCtx(context: skUnknown, graph: graph, config: config, env: move env)
+  var c = initCtx(graph, config, nil, move env)
   c.sp.active = (e, c.sp.map.add(e))
 
   let
     rtyp = c.typeToMir(e.typ)
     res = c.addLocal(Local(typ: rtyp)) # the result variable
-  c.scope:
-    c.buildStmt mnkDef:
-      c.use toValue(mnkLocal, res, rtyp)
-      if e.typ.kind == tyTypeDesc:
-        # FIXME: this shouldn't happen, but type expressions are sometimes
-        #        evaluated with the VM, such as a ``typeof(T.x)`` appearing as
-        #        a field type within a generic object definition. While it
-        #        makes sense to allow evaluating type expression with the VM,
-        #        in simple situtations like the example above, it's simpler,
-        #        faster, and more intuitive to either evaluate them directly
-        #        when analyzing the type expression, or during ``semfold``
-        c.use genTypeExpr(c, e)
-      else:
-        c.genAsgnSource(e, {dfOwns, dfEmpty})
+  c.withBlock bkBlock:
+    c.scope:
+      c.buildStmt mnkDef:
+        c.use toValue(mnkLocal, res, rtyp)
+        if e.typ.kind == tyTypeDesc:
+          # FIXME: this shouldn't happen, but type expressions are sometimes
+          #        evaluated with the VM, such as a ``typeof(T.x)`` appearing as
+          #        a field type within a generic object definition. While it
+          #        makes sense to allow evaluating type expression with the VM,
+          #        in simple situations like the example above, it's simpler,
+          #        faster, and more intuitive to either evaluate them directly
+          #        when analyzing the type expression, or during ``semfold``
+          c.use genTypeExpr(c, e)
+        else:
+          c.genAsgnSource(e, {dfOwns, dfEmpty})
 
   env = move c.env
 
diff --git a/compiler/mir/mirgen_blocks.nim b/compiler/mir/mirgen_blocks.nim
new file mode 100644
index 00000000000..b32b1363b7c
--- /dev/null
+++ b/compiler/mir/mirgen_blocks.nim
@@ -0,0 +1,297 @@
+## Subordinate module to `mirgen <#mirgen>`_. Implements the block and scope
+## management required for translating the AST's high-level control-flow
+## constructs to the MIR's goto-based ones. Injecting ``mnkDestroy``
+## operations is also implemented here, integrated with the scope management.
+
+import
+  std/[
+    options
+  ],
+  compiler/ast/[
+    ast_types
+  ],
+  compiler/mir/[
+    mirconstr,
+    mirtrees
+  ],
+  compiler/utils/[
+    idioms
+  ]
+
+type
+  BlockKind* = enum
+    bkBlock
+    bkScope
+    bkTryExcept
+    bkTryFinally
+    bkFinally
+    bkExcept
+
+  Block* = object
+    ## Information about a block-like structure. This not only includes |NimSkull|
+    ## ``block``s, but also try, finally, etc.
+    id*: Option[LabelId]
+      ## the block's label. Initialized on-demand, meaning that 'none'
+      ## indicates that the block is unused
+    case kind*: BlockKind
+    of bkBlock:
+      label*: PSym
+        ## the symbol of the block's label. nil if it's an internal block
+    of bkScope:
+      numRegistered: int
+        ## number of entities registered for the scope in the to-destroy list
+      scopeExits: seq[LabelId]
+        ## unordered set of follow-up targets
+    of bkTryFinally:
+      doesntExit*: bool
+        ## whether structured control-flow doesn't reach the end of the finally
+      exits*: seq[LabelId]
+        ## unordered set of follow-up targets
+    of bkTryExcept, bkFinally, bkExcept:
+      discard
+
+  BlockCtx* = object
+    ## Per-procedure block-related state.
+    blocks: seq[Block]
+      ## stack of enclosing try, finally, etc. blocks
+    toDestroy: seq[tuple[entity: Value, label: Option[LabelId]]]
+      ## all locals/globals/temporaries that need destruction, together
+      ## with the label of the finally that the destroy operation is part
+      ## of. Only the items where the `label` changes have an initialized
+      ## label
+    currScope: int
+      ## block index of the current scope
+
+# shorten some common parameter declarations:
+using
+  c: var BlockCtx
+  bu: var MirBuilder
+
+proc requestLabel(bu; b: var Block): LabelId =
+  if b.id.isNone:
+    b.id = some bu.allocLabel()
+  result = b.id.unsafeGet
+
+proc labelNode*(label: LabelId): MirNode =
+  MirNode(kind: mnkLabel, label: label)
+
+proc emitDestroy(bu; val: Value) =
+  bu.subTree mnkDestroy:
+    bu.use val
+
+proc emitFinalizerLabels(c; bu; locs: Slice[int]) =
+  ## Emits the labels for all scope finalizers required for cleaning up the
+  ## registered entities in `locs`.
+  # destruction happens in reverse, so iterate from high to low
+  for i in countdown(locs.b, locs.a):
+    if c.toDestroy[i].label.isSome:
+      bu.add labelNode(c.toDestroy[i].label.unsafeGet)
+
+proc blockLeaveActions(c; bu; targetBlock: int): bool =
+  ## Emits the actions for leaving the blocks up until (but not including)
+  ## `targetBlock`. Returns false when there's an intercepting
+  ## ``finally`` clause that doesn't exit (meaning that `targetBlock` won't
+  ## be reached), true otherwise.
+  proc incl[T](s: var seq[T], it: T) {.inline.} =
+    if it notin s:
+      s.add it
+
+  proc inclExit(b: var Block, it: LabelId) {.inline.} =
+    case b.kind
+    of bkTryFinally: b.exits.incl it
+    of bkScope:      b.scopeExits.incl it
+    else: unreachable()
+
+  var
+    last = c.toDestroy.high
+    previous = -1
+
+  for i in countdown(c.blocks.high, targetBlock + 1):
+    let b {.cursor.} = c.blocks[i]
+    case b.kind
+    of bkBlock, bkTryExcept:
+      discard "nothing to do"
+    of bkExcept, bkFinally:
+      # needs a leave action
+      bu.add MirNode(kind: mnkLeave, label: b.id.get)
+    of bkScope:
+      if b.numRegistered > 0:
+        # there are some locations that require cleanup
+        if c.toDestroy[last].label.isNone:
+          c.toDestroy[last].label = some bu.allocLabel()
+
+        if previous != -1:
+          c.blocks[previous].inclExit c.toDestroy[last].label.unsafeGet
+
+        previous = i
+        # emit the labels for all scope finalizers that need to be run
+        emitFinalizerLabels(c, bu, (last-b.numRegistered+1)..last)
+
+        last -= b.numRegistered
+    of bkTryFinally:
+      let label = bu.requestLabel(c.blocks[i])
+      # register as outgoing edge of the preceding finally (if any):
+      if previous != -1:
+        c.blocks[previous].inclExit label
+
+      previous = i
+
+      # enter the finally clause:
+      bu.add labelNode(label)
+      if b.doesntExit:
+        # structured control-flow doesn't leave the finally; the finally is
+        # the final jump target
+        return false
+
+  if targetBlock >= 0 and previous != -1 and
+     c.blocks[targetBlock].kind in {bkBlock, bkTryExcept}:
+    # register the target as the follow-up for the previous finally
+    c.blocks[previous].inclExit bu.requestLabel(c.blocks[targetBlock])
+
+  result = true
+
+template add*(c: var BlockCtx; b: Block) =
+  c.blocks.add b
+
+template pop*(c: var BlockCtx): Block =
+  c.blocks.pop()
+
+proc closest*(c: BlockCtx): int =
+  ## Returns the index of the closest block.
+  result = c.blocks.high
+  while result >= 0 and c.blocks[result].kind != bkBlock:
+    dec result
+  assert result >= 0, "no enclosing block?"
+
+proc findBlock*(c: BlockCtx, label: PSym): int =
+  ## Returns the index of the block with label `label`.
+  var i = c.blocks.high
+  while i >= 0 and (c.blocks[i].kind != bkBlock or c.blocks[i].label != label):
+    dec i
+  assert i >= 0, "no enclosing block?"
+  result = i
+
+proc blockExit*(c; bu; targetBlock: int) =
+  ## Emits the jump target description for a jump to `targetBlock`.
+  # XXX: a target list is only necessary if there's more than one jump
+  #      target
+  bu.subTree mnkTargetList:
+    if blockLeaveActions(c, bu, targetBlock):
+      bu.add labelNode(bu.requestLabel(c.blocks[targetBlock]))
+
+proc raiseExit*(c; bu) =
+  ## Emits the jump target description for a jump to the nearest enclosing
+  ## exception handler.
+  var i = c.blocks.high
+  while i >= 0 and c.blocks[i].kind != bkTryExcept:
+    dec i
+
+  bu.subTree mnkTargetList:
+    if blockLeaveActions(c, bu, i):
+      if i == -1:
+        # nothing handles the exception within the current procedure
+        bu.add MirNode(kind: mnkResume)
+      else:
+        bu.add labelNode(bu.requestLabel(c.blocks[i]))
+
+proc closeBlock*(c; bu): bool =
+  ## Finishes the current block. If required for the block (because it is a
+  ## ``block`` and broken out of), emits a join and returns true, false
+  ## otherwise.
+  let blk = c.blocks.pop()
+  # if there's no label, the exit of the block is never jumped to
+  # and the join can be omitted
+  if blk.kind == bkBlock and blk.id.isSome:
+    bu.join blk.id.unsafeGet
+    result = true
+
+func register*(c; loc: Value) =
+  ## Registers `loc` for destruction at the end of the current scope.
+  ## Destruction happens in the reverse order the locations are registered in.
+  inc c.blocks[c.currScope].numRegistered
+  c.toDestroy.add (loc, none LabelId)
+
+proc startScope*(c): int =
+  ## Starts a new scope and returns the index of the previous one.
+  result = c.currScope
+  c.blocks.add Block(kind: bkScope)
+  c.currScope = c.blocks.high
+
+proc earlyExit*(c; bu) =
+  ## Emits the destroy operations for when structured control-flow reaches the
+  ## current scope's end. All entities for which a destroy operation is
+  ## emitted are unregistered already.
+  let start = c.toDestroy.len - c.blocks[c.currScope].numRegistered
+  var i = c.toDestroy.high
+
+  while i >= start and c.toDestroy[i].label.isNone:
+    bu.emitDestroy(c.toDestroy[i].entity)
+    dec i
+
+  # unregister the entities for which a destroy operation was emitted:
+  c.blocks[c.currScope].numRegistered = i - start + 1
+  c.toDestroy.setLen(i + 1)
+
+proc closeScope*(c; bu; nextScope: int, hasStructuredExit: bool) =
+  ## Pops the scope from the stack and emits the scope exit actions.
+  ## `hasStructuredExit` tells whether structured control-flow reaches
+  ## the end of the scope, affecting what the exit looks like.
+  ##
+  ## `nextScope` is the scope index returned by the previous
+  ## `startScope <#startScope,BlockCtx>`_ call.
+  # emit all destroy operations that don't need a finally
+  earlyExit(c, bu)
+
+  var scope = c.blocks.pop()
+  assert scope.kind == bkScope
+
+  let start = c.toDestroy.len - scope.numRegistered
+
+  var next = none LabelId
+  if start < c.toDestroy.len and hasStructuredExit:
+    # there are destroy operations that need a finally. A goto is required
+    # for visiting them
+    next = some bu.allocLabel()
+    bu.subTree mnkGoto:
+      bu.subTree mnkTargetList:
+        emitFinalizerLabels(c, bu, start..c.toDestroy.high)
+        bu.add labelNode(next.unsafeGet)
+
+    scope.scopeExits.add next.unsafeGet
+
+  # emit all finally sections for the scope. Since not all entities requiring
+  # destruction necessarily start their existence at the start of the scope,
+  # multiple sections may be required
+  var curr = none LabelId
+  for i in countdown(c.toDestroy.high, start):
+    # if a to-destroy entry has a label, it marks the start of a new finally
+    if c.toDestroy[i].label.isSome:
+      if curr.isSome:
+        # finish the previous finally by emitting the corresponding 'continue':
+        bu.subTree MirNode(kind: mnkContinue, len: 2):
+          bu.add labelNode(curr.unsafeGet)
+          # a finally section that's not the last one always continues with
+          # the next finally
+          bu.add labelNode(c.toDestroy[i].label.unsafeGet)
+
+      curr = c.toDestroy[i].label
+      bu.subTree mnkFinally:
+        bu.add labelNode(curr.unsafeGet)
+
+    bu.emitDestroy(c.toDestroy[i].entity)
+
+  if curr.isSome:
+    # finish the final finally. `scopeExits` stores all possible follow-up
+    # targets for the finally
+    bu.subTree MirNode(kind: mnkContinue, len: uint32(1 + scope.scopeExits.len)):
+      bu.add labelNode(curr.unsafeGet)
+      for it in scope.scopeExits.items:
+        bu.add labelNode(it)
+
+  if next.isSome:
+    # the join point for the structured scope exit
+    bu.join next.unsafeGet
+
+  # unregister all entities registered with the scope:
+  c.toDestroy.setLen(start)
+  c.currScope = nextScope
diff --git a/compiler/mir/mirpasses.nim b/compiler/mir/mirpasses.nim
index 41b82eadc50..8a75a1ef898 100644
--- a/compiler/mir/mirpasses.nim
+++ b/compiler/mir/mirpasses.nim
@@ -294,7 +294,7 @@ proc eliminateTemporaries(tree: MirTree, types: TypeEnv,
           # the searched-for temporary is used and there was no mutation of
           # `p` so far -> not modified
           return NodePosition(n)
-      of opConsume, opDef, opMutate, opKill, opInvalidate:
+      of opConsume, opDef, opMutate, opKill, opInvalidate, opDestroy:
         if (tree[n].kind == mnkTemp and tree[n].local == e) or
            overlaps(p, typ, n):
           # either the searched-for temporary is mutated or consumed itself,
@@ -417,7 +417,7 @@ proc injectResultInit(tree: MirTree, resultTyp: TypeId, changes: var Changeset)
           # path
           s.exit = true
 
-      of opUse, opConsume, opMutate, opInvalidate:
+      of opUse, opConsume, opMutate, opInvalidate, opDestroy:
         if isResult(tree, getRoot(tree, n)):
           # the result variable is read from or modified before it was
           # initialized
@@ -456,13 +456,12 @@ proc injectProfilerCalls(tree: MirTree, graph: ModuleGraph, env: var MirEnv,
       bu.buildCall prcId, VoidType:
         discard "no arguments"
 
-  for i in search(tree, {mnkEnd}):
-    if tree[i].start == mnkRepeat:
-      # insert the call before the end node:
-      changes.insert(tree, i - 1, i, bu):
-        bu.subTree mnkVoid:
-          bu.buildCall prcId, VoidType:
-            discard "no arguments"
+  for i in search(tree, {mnkLoop}):
+    # insert the call before the loop end:
+    changes.insert(tree, i - 1, i, bu):
+      bu.subTree mnkVoid:
+        bu.buildCall prcId, VoidType:
+          discard "no arguments"
 
 proc lowerNew(tree: MirTree, graph: ModuleGraph, env: var MirEnv,
               changes: var Changeset) =
@@ -533,7 +532,7 @@ proc lowerNew(tree: MirTree, graph: ModuleGraph, env: var MirEnv,
 
       var tmp: Value
       changes.insert(tree, stmt, call, bu):
-        if numArgs(tree, call) == 2:
+        if numArgs(tree, call) == 1:
           # the unsafe new-with-size version
           let size = bu.inline(tree, NodePosition tree.argument(call, 0))
           # not the whole memory is necessarily initialized by the default
diff --git a/compiler/mir/mirtrees.nim b/compiler/mir/mirtrees.nim
index 18be9c1b946..dbd9efe2576 100644
--- a/compiler/mir/mirtrees.nim
+++ b/compiler/mir/mirtrees.nim
@@ -46,7 +46,8 @@ template indexLike*(_: typedesc[SourceId]) = discard
 
 type
   LabelId* = distinct uint32
-    ## ID of a label, used to identify a block (``mnkBlock``).
+    ## ID of a label, used to identify the control-flow destinations and
+    ## constructs.
 
   MirNodeKind* = enum
     ## Users of ``MirNodeKind`` should not depend on the absolute or relative
@@ -67,6 +68,7 @@ type
               ## ``lent T`` local
 
     mnkField  ## declarative node only allowed in special contexts
+    mnkLabel  ## name of a label
 
     mnkNilLit  ## nil literal
     mnkIntLit  ## reference to signed integer literal
@@ -83,15 +85,17 @@ type
     mnkMagic  ## only allowed in a callee position. Refers to a magic
               ## procedure
 
+    mnkResume    ## special action in a target list that means "resume
+                 ## exception handling in caller"
+    mnkLeave     ## a leave action within a target list
+    mnkTargetList## describes the actions to perform prior to jumping, as well
+                 ## as the final jump
+
     mnkDef       ## marks the start of existence of a local, global, procedure,
                  ## or temporary. Supports an optional intial value (except for
                  ## procedure definitions)
     mnkDefCursor ## marks the start of existence of a non-owning location
-    # future direction: remove this distinction and perform all related decision
-    # making (e.g., injecting destructors) requiring knowledge of locations'
-    # ownership in ``mirgen``. There's only going to be the ``Def`` kind
-    mnkDefUnpack ## intermediate hack required by destructor injection. Don't
-                 ## use
+
     mnkBind      ## introduces an alias that may be used for read/write
                  ## access, but not for direct assignments. The source
                  ## expression must not be empty
@@ -169,10 +173,8 @@ type
     # unsigned integers
 
     mnkRaise  ## if the operand is an ``mnkNone`` node, reraises the
-              ## currently active exception. Otherwise, set the operand value
-              ## as the active exception (via a move). Control-flow is
-              ## transfered to the closest exception handler. If none exists,
-              ## the program terminates
+              ## currently active exception. Otherwise, consumes the operand
+              ## and sets it as the active exception
 
     mnkTag    ## must only appear as the immediate subnode to a ``mnkName``
               ## tree. Describes what kind of mutation is applied to the
@@ -211,39 +213,25 @@ type
               ## * syntactic statement node for representing void calls
               ## * statement acting as a use of the given lvalue
 
-    mnkStmtList ## a sequence of statements, grouped together as a single
-                ## statement
     mnkScope  ## the only way to introduce a scope. Scopes can be nested and
               ## dictate the lifetime of the locals that are directly enclosed
               ## by them
 
+    mnkGoto   ## unconditional jump
     mnkIf     ## depending on the run-time value of `x`, transfers control-
               ## flow to either the start or the end of the spanned code
-    mnkCase   ## dispatches to one the its branches based on the run-time
+    mnkCase   ## dispatches to one of its branches based on the run-time
               ## value of the operand
-    mnkRepeat ## repeats the body indefinitely
-    mnkTry    ## associates one one or more statements (the first sub-node)
-              ## with: an exception handler, a finalizer, or both
-    mnkExcept ## defines and attaches an exception handler to a ``try`` block.
-              ## Only one handler can be attached to a ``try`` block
-    mnkFinally## defines a finalizer in the context of a ``try`` construct. All
-              ## control-flow that either leaves the body of the ``try`` and
-              ## does not target the exception handler (if one is present) or
-              ## that leaves the exception handler is redirected to inside the
-              ## finalizer first. Once control-flow reaches the end of a
-              ## finalizer, it is transferred to the original destination. Only
-              ## one finalizer can be attached to a ``try`` block
-    mnkBlock  ## attaches a label to a span of code. If control-flow reaches
-              ## this statement, it is transferred to the start of the body.
-              ## Once control-flow reaches the end of a ``block``, it is
-              ## transferred to the next statement/operation following the
-              ## block
-    mnkBreak  ## transfers control-flow to the statement/operation following
-              ## after the ``block`` with the given label
-    mnkReturn ## if the code-fragment represents the body of a procedure,
-              ## transfers control-flow back to the caller
-
-    mnkBranch ## defines a branch of an ``mnkExcept`` or ``mnkCase``
+    mnkBranch ## a branch in a ``mnkCase`` dispatcher
+    mnkLoop   ## unconditional jump to the associated-with loop start
+
+    mnkJoin   ## join point for gotos and branches
+    mnkLoopJoin## join point for loops. Represents the start of a loop
+    mnkExcept ## starts an exception handler
+    mnkFinally## starts a finally section. Must be paired with exactly one
+              ## ``mnkContinue`` that follows
+    mnkContinue## marks the end of a finally section
+    mnkEndStruct ## marks the end of an if or except
 
     mnkDestroy## destroys the value stored in the given location, leaving the
               ## location in an undefined state
@@ -297,11 +285,10 @@ type
       position*: uint32 ## the 0-based position of the field
     of mnkCall, mnkCheckedCall:
       effects*: set[GeneralEffect]
+    of mnkLabel, mnkLeave:
+      label*: LabelId
     of mnkMagic:
       magic*: TMagic
-    of mnkBlock, mnkBreak:
-      label*: LabelId ## for a block, the label that identifies the block;
-                      ## for a break, the label of the block to break out of
     of mnkEnd:
       start*: MirNodeKind ## the kind of the corresponding start node
     of mnkTag:
@@ -328,11 +315,11 @@ const
   AllNodeKinds* = {low(MirNodeKind)..high(MirNodeKind)}
     ## Convenience set containing all existing node kinds
 
-  DefNodes* = {mnkDef, mnkDefCursor, mnkDefUnpack, mnkBind, mnkBindMut}
+  DefNodes* = {mnkDef, mnkDefCursor, mnkBind, mnkBindMut}
     ## Node kinds that represent definition statements (i.e. something that
     ## introduces a named entity)
 
-  AtomNodes* = {mnkNone..mnkType, mnkMagic, mnkBreak, mnkReturn}
+  AtomNodes* = {mnkNone..mnkLeave}
     ## Nodes that don't support sub nodes.
 
   SubTreeNodes* = AllNodeKinds - AtomNodes - {mnkEnd}
@@ -353,6 +340,8 @@ const
     ## Assignment modifiers. Nodes that can only appear directly in the source
     ## slot of assignments.
 
+  LabelNodes* = {mnkLabel, mnkLeave}
+
   LiteralDataNodes* = {mnkNilLit, mnkIntLit, mnkUIntLit, mnkFloatLit,
                        mnkStrLit, mnkAstLit}
 
@@ -362,16 +351,17 @@ const
                       mnkEnd} + LiteralDataNodes
     ## Nodes that can appear in the MIR subset used for constant expressions.
 
+  StmtNodes* = {mnkScope, mnkGoto, mnkIf, mnkCase, mnkLoop, mnkJoin,
+                mnkLoopJoin, mnkExcept, mnkFinally, mnkContinue, mnkEndStruct,
+                mnkInit, mnkAsgn, mnkSwitch, mnkVoid, mnkRaise, mnkDestroy,
+                mnkEmit, mnkAsm} + DefNodes
+    ## Nodes that are treated like statements, in terms of syntax.
+
   # --- semantics-focused sets:
 
-  Atoms* = {mnkNone .. mnkType} - {mnkField, mnkProc}
+  Atoms* = {mnkNone .. mnkType} - {mnkField, mnkProc, mnkLabel}
     ## Nodes that may be appear in atom-expecting slots.
 
-  StmtNodes* = {mnkScope, mnkStmtList, mnkIf, mnkCase, mnkRepeat, mnkTry,
-                mnkBlock, mnkBreak, mnkReturn, mnkRaise, mnkInit,
-                mnkAsgn, mnkSwitch, mnkVoid, mnkRaise, mnkDestroy, mnkEmit,
-                mnkAsm} + DefNodes
-
   UnaryOps*  = {mnkNeg}
     ## All unary operators
   BinaryOps* = {mnkAdd, mnkSub, mnkMul, mnkDiv, mnkModI}
@@ -566,13 +556,22 @@ func findParent*(tree: MirTree, start: NodePosition,
   while tree[result].kind != kind:
     result = parent(tree, result)
 
-func numArgs*(tree: MirTree, n: NodePosition): int =
-  ## Computes the number of arguments in the call tree.
+func len*(tree: MirTree, n: NodePosition): int =
+  ## Counts the direct child nodes of the sub-tree node at `n`.
   var n = n + 1
   while tree[n].kind != mnkEnd:
     inc result
     n = tree.sibling(n)
 
+func numArgs*(tree: MirTree, n: NodePosition): int =
+  ## Returns how many *call arguments* the call tree at `n` has. The callee
+  ## and everything following the last argument node are not counted.
+  assert tree[n].kind in CallKinds
+  var arg = sibling(tree, n + 1) # the node following the callee
+  while tree[arg].kind in ArgumentNodes:
+    result += 1
+    arg = sibling(tree, arg)
+
 func operand*(tree: MirTree, op: OpValue|NodePosition): OpValue =
   ## Returns the index (``OpValue``) of the operand for the single-input node
   ## at `op`.
@@ -620,7 +619,9 @@ iterator arguments*(tree: MirTree, n: NodePosition): (ArgKinds, OpValue) =
   ## Returns the argument kinds together with the operand node (or tag tree).
   assert tree[n].kind in CallKinds
   var i = tree.sibling(n + 1) # skip the callee
-  while tree[i].kind != mnkEnd:
+  # XXX: iterating until no more argument nodes are found is a temporary
+  #      workaround until call nodes store their number of sub-nodes
+  while tree[i].kind in ArgumentNodes:
     yield (ArgKinds(tree[i].kind), tree.operand(i))
     i = tree.sibling(i)
 
diff --git a/compiler/mir/proto_mir.nim b/compiler/mir/proto_mir.nim
index 8586d296461..13e8982c2e5 100644
--- a/compiler/mir/proto_mir.nim
+++ b/compiler/mir/proto_mir.nim
@@ -344,6 +344,11 @@ func ownershipOp(e: seq[ProtoItem], i: int): ProtoItemKind =
     # cannot be part of an lvalue expression sequence
     unreachable(e[i].kind)
 
+func materialize(e: var seq[ProtoItem], kind: ProtoItemKind) =
+  ## Appends a `kind` item to `e`, unless `e` already ends in one.
+  if e[^1].kind != kind:
+    e.add kind
+
 func wantOwning*(e: var seq[ProtoItem], forceTemp: bool) =
   ## Makes sure `e` produces an owning value. If `forceTemp` is true, a
   ## temporary is materialized even if the expression would already produce
@@ -351,8 +356,7 @@ func wantOwning*(e: var seq[ProtoItem], forceTemp: bool) =
   case classify(e, e.high)
   of Rvalue:
     # rvalue expressions cannot be copied from directly
-    if e[^1].kind != pirMatCursor:
-      e.add pirMatCursor
+    materialize(e, pirMatCursor)
     e.add pirCopy
   of OwnedRvalue:
     var i = e.high
@@ -383,14 +387,12 @@ func wantConsumeable*(e: var seq[ProtoItem]) =
   ## value).
   case classify(e, e.high)
   of Rvalue:
-    if e[^1].kind != pirMatCursor:
-      e.add pirMatCursor
+    materialize(e, pirMatCursor)
     e.add pirCopy
     e.add pirMat
   of OwnedRvalue:
-    if e[^1].kind != pirMat:
-      # requires an owning temporary
-      e.add pirMat
+    # requires an owning temporary
+    materialize(e, pirMat)
   of Lvalue:
     e.add ownershipOp(e, e.high)
     e.add pirMat
@@ -408,9 +410,9 @@ proc wantPure*(e: var seq[ProtoItem]) =
     if not isPure(e, e.high):
       e.add pirMatCursor
   of Rvalue:
-    e.add pirMatCursor
+    materialize(e, pirMatCursor)
   of OwnedRvalue:
-    e.add pirMat
+    materialize(e, pirMat)
 
 proc wantValue*(e: var seq[ProtoItem]) =
   ## Makes sure `e` is a literal value or lvalue expression.
@@ -418,16 +420,16 @@ proc wantValue*(e: var seq[ProtoItem]) =
   of Lvalue, Literal:
     discard "nothin to do"
   of Rvalue:
-    e.add pirMatCursor
+    materialize(e, pirMatCursor)
   of OwnedRvalue:
-    e.add pirMat
+    materialize(e, pirMat)
 
 proc wantShallow*(e: var seq[ProtoItem]) =
   ## Makes sure `e` is something that can be assigned to a non-owning
   ## destination.
   if classify(e, e.high) == OwnedRvalue:
     # commit to a temporary
-    e.add pirMat
+    materialize(e, pirMat)
 
 proc wantStable*(e: var seq[ProtoItem]) =
   ## Makes sure `e` is a stable lvalue expression. Rvalues and literal values
@@ -437,9 +439,9 @@ proc wantStable*(e: var seq[ProtoItem]) =
     if not isStable(e, e.high):
       e.add pirMatLvalue
   of OwnedRvalue:
-    e.add pirMat
+    materialize(e, pirMat)
   of Rvalue, Literal:
-    e.add pirMatCursor
+    materialize(e, pirMatCursor)
 
 # ---- translation routines ----
 
diff --git a/compiler/mir/rtchecks.nim b/compiler/mir/rtchecks.nim
index 54d830fd8ec..7268ef3a0f7 100644
--- a/compiler/mir/rtchecks.nim
+++ b/compiler/mir/rtchecks.nim
@@ -48,8 +48,7 @@ template subTree(bu; k: MirNodeKind, t: TypeId, body: untyped) =
     body
 
 template buildIf(bu; cond: Value, body: untyped) =
-  bu.subTree mnkIf:
-    bu.use cond
+  bu.buildIf (;bu.use(cond)):
     bu.subTree mnkScope:
       body
 
@@ -58,8 +57,7 @@ template buildIfNot(bu; cond: Value, body: untyped) =
     bu.buildMagicCall mNot, BoolType:
       bu.emitByVal cond
 
-  bu.subTree mnkIf:
-    bu.use c
+  bu.buildIf(c):
     body
 
 template emitCall(bu; tree; call; prc: ProcedureId, arguments: untyped) =
@@ -70,6 +68,10 @@ template emitCall(bu; tree; call; prc: ProcedureId, arguments: untyped) =
       bu.add procNode(prc) # callee
       arguments # custom arguments
 
+      if tree[call].kind == mnkCheckedCall:
+        # copy the jump target
+        bu.emitFrom(tree, tree.previous(findEnd(tree, call)))
+
 proc addCompilerProc(env; graph; name: string): ProcedureId =
   env.procedures.add(graph.getCompilerProc(name))
 
diff --git a/compiler/mir/utils.nim b/compiler/mir/utils.nim
index d0963a050af..293b7a02246 100644
--- a/compiler/mir/utils.nim
+++ b/compiler/mir/utils.nim
@@ -59,9 +59,9 @@ func `$`(n: MirNode): string =
   of mnkMagic:
     result.add " magic: "
     result.add $n.magic
-  of mnkBlock, mnkBreak:
-    result.add " block: "
-    result.add $ord(n.label)
+  of mnkLabel, mnkLeave:
+    result.add " label: "
+    result.addInt n.label.uint32
   of mnkEnd:
     result.add " start: "
     result.add $n.start
@@ -144,6 +144,9 @@ func next(tree: MirTree, i: var int): lent MirNode =
   result = tree[i]
   inc i
 
+proc error(result: var string, n: MirNode) =
+  result.add("<unexpected: "); result.add($n.kind); result.add(">")
+
 func idToStr[I](result: var string, id: I, open: string) =
   result.add open
   result.addInt id.uint32
@@ -201,6 +204,10 @@ proc addTypedNumber(result: var string, bits: BiggestInt, typ: PType) =
   else:
     result.add "<invalid literal>"
 
+func add(result: var string, id: LabelId) =
+  ## Appends the label's textual form: an 'L' followed by the ID's number.
+  result.add('L'); result.addInt(uint32(id))
+
 proc singleToStr(n: MirNode, result: var string, c: RenderCtx) =
   case n.kind
   of mnkParam:
@@ -253,8 +260,8 @@ proc singleToStr(n: MirNode, result: var string, c: RenderCtx) =
     result.add "type("
     typeToStr(result, n.typ, c.env)
     result.add ")"
-  of AllNodeKinds - Atoms - mnkProc:
-    result.add "<error: " & $n.kind & ">"
+  of AllNodeKinds - Atoms - mnkProc + {mnkResume, mnkLeave}:
+    result.error(n)
 
 proc singleToStr(tree: MirTree, i: var int, result: var string, c: RenderCtx) =
   singleToStr(next(tree, i), result, c)
@@ -311,7 +318,7 @@ proc valueToStr(nodes: MirTree, i: var int, result: var string, c: RenderCtx) =
   of AtomNodes:
     singleToStr(n, result, c)
   else:
-    result.add "<error: " & $n.kind & ">"
+    result.error(n)
 
 proc calleeToStr(tree: MirTree, i: var int, result: var string, c: RenderCtx) =
   case tree[i].kind
@@ -331,7 +338,7 @@ proc argToStr(tree: MirTree, i: var int, result: var string, c: RenderCtx) =
   of mnkName:    result.add "name "
   of mnkConsume: result.add "consume "
   of AllNodeKinds - ArgumentNodes:
-    result.add "<error: " & $n.kind & ">"
+    result.error(n)
 
   if tree[i].kind == mnkTag:
     discard next(tree, i)
@@ -345,6 +352,39 @@ proc argToStr(tree: MirTree, i: var int, result: var string, c: RenderCtx) =
 template argToStr() =
   argToStr(treeParam(), i, result, c)
 
+proc labelToStr(nodes: MirTree, i: var int, result: var string) =
+  ## Consumes the node at `i` and renders it as a label. Any node that isn't
+  ## a ``mnkLabel`` is rendered as an error marker instead.
+  let node {.cursor.} = next(nodes, i)
+  case node.kind
+  of mnkLabel: result.add node.label
+  else:        result.error(node)
+
+proc targetToStr(nodes: MirTree, i: var int, result: var string) =
+  ## Renders the jump target at `i`: either a lone label, or a target list as
+  ## a bracketed, comma-separated sequence. `i` is moved past what was read.
+  var node {.cursor.} = next(nodes, i)
+  case node.kind
+  of mnkLabel:
+    result.add node.label
+  of mnkTargetList:
+    result.add "["
+    var first = true
+    while (node = next(nodes, i); node.kind != mnkEnd):
+      if not first: result.add ", "
+      first = false
+      case node.kind
+      of mnkLabel:  result.add node.label
+      of mnkLeave:  result.add "Leave(L" & $node.label.int & ")"
+      of mnkResume: result.add "Resume"
+      else:         result.error(node)
+    result.add "]"
+  else:
+    result.error(node)
+
+template targetToStr() =
+  targetToStr(nodes, i, result) # uses the call site's `nodes`, `i`, `result`
+
 proc exprToStr(nodes: MirTree, i: var int, result: var string, c: RenderCtx) =
   template tree(start: string, body: untyped) =
     result.add start
@@ -432,9 +472,16 @@ proc exprToStr(nodes: MirTree, i: var int, result: var string, c: RenderCtx) =
     tree "":
       calleeToStr(nodes, i, result, c)
       result.add "("
-      commaSeparated:
+      # arguments:
+      let first = i
+      while nodes[i].kind in ArgumentNodes:
+        if i > first:
+          result.add ", "
         argToStr()
-      result.add ") (raises)"
+
+      # jump target:
+      result.add ") -> "
+      targetToStr()
   of UnaryOps:
     const Map = [mnkNeg: "-"]
     let kind = nodes[i].kind
@@ -459,7 +506,7 @@ proc exprToStr(nodes: MirTree, i: var int, result: var string, c: RenderCtx) =
       valueToStr()
   else:
     # TODO: make this branch exhaustive
-    result.add "<error: " & $nodes[i].kind & ">"
+    result.error(nodes[i])
     inc i
 
 template exprToStr() =
@@ -475,22 +522,13 @@ proc renderNameWithType(tree: MirTree, i: var int, result: var string,
 proc renderList(tree: MirTree, i: var int, indent: int, result: var string,
                 c: RenderCtx)
 
-template renderList(indent: int) =
-  mixin renderList
-  renderList(treeParam(), i, indent, result, c)
-
-template stmtToStr(indent: int) =
-  mixin stmtToStr
-  stmtToStr(treeParam(), i, indent, result, c)
-
-proc stmtToStr(nodes: MirTree, i: var int, indent: int, result: var string,
+proc stmtToStr(nodes: MirTree, i: var int, indent: var int, result: var string,
                c: RenderCtx) =
   template tree(str: string, body: untyped) =
     result.add repeat("  ", indent)
     result.add str
     body
 
-  var indent = indent
   template tab(body: untyped) =
     ## Runs `body` with the indentation increased by 1.
     inc indent
@@ -499,7 +537,7 @@ proc stmtToStr(nodes: MirTree, i: var int, indent: int, result: var string,
 
   let n {.cursor.} = next(nodes, i)
   case n.kind
-  of mnkDef, mnkDefUnpack:
+  of mnkDef:
     tree "def ":
       renderNameWithType(nodes, i, result, c)
       if nodes[i].kind != mnkNone:
@@ -538,54 +576,65 @@ proc stmtToStr(nodes: MirTree, i: var int, indent: int, result: var string,
       result.add " := "
       exprToStr()
     result.add "\n"
-  of mnkStmtList:
-    renderList(indent)
-  of mnkTry:
-    tree "try:\n":
-      tab:
-        stmtToStr(indent)
-      renderList(indent)
   of mnkExcept:
-    tree "except\n":
-      renderList(indent)
+    tree "except (":
+      labelToStr(nodes, i, result)
+      result.add ")"
+      # render the filter types:
+      for j in 1..<n.len-1:
+        if j == 1:
+          result.add " "
+        else:
+          result.add ", "
+        singleToStr()
+      # render the next handler target:
+      if n.len > 1:
+        result.add " else "
+        targetToStr()
+      result.add ":\n"
+
+    inc indent
   of mnkFinally:
-    tree "finally:\n":
-      tab:
-        stmtToStr(indent)
+    tree "finally (":
+      labelToStr(nodes, i, result)
+      result.add "):\n"
+
+    inc indent
   of mnkScope:
     tree "scope:\n":
       tab:
-        renderList(indent)
+        renderList(nodes, i, indent, result, c)
   of mnkIf:
     tree "if ":
       valueToStr()
+      inc i # ignore the label
       result.add ":\n"
-      tab:
-        renderList(indent)
+
+    inc indent
   of mnkCase:
     tree "case ":
       valueToStr()
       result.add "\n"
-      # use ``renderList`` for simplicity, even though it allows for
-      # structures that are invalid
-      renderList(indent)
-  of mnkBranch:
-    tree "of ":
-      for j in 0..<n.len:
-        if j > 0:
-          result.add ", "
-        singleToStr()
-      result.add ":\n"
-      tab:
-        renderList(indent)
-  of mnkBlock:
-    tree "block L" & $n.label.int & ":\n":
-      tab:
-        renderList(indent)
-  of mnkRepeat:
-    tree "while true:\n":
-      tab:
-        renderList(indent)
+      # render the branches:
+      for _ in 1..<n.len:
+        let b {.cursor.} = next(nodes, i)
+        case b.kind
+        of mnkBranch:
+          tree "of ":
+            # render the values:
+            for j in 0..<b.len-1:
+              if j > 0:
+                result.add ", "
+              singleToStr()
+            # render the jump destination:
+            result.add ": goto "
+            labelToStr(nodes, i, result)
+            result.add "\n"
+          inc i # skip the end node
+        else:
+          # make no attempt at error correction
+          result.error(b)
+
   of mnkAsm, mnkEmit:
     tree (if n.kind == mnkAsm: "asm " else: "emit "):
       var first = true
@@ -607,27 +656,50 @@ proc stmtToStr(nodes: MirTree, i: var int, indent: int, result: var string,
   of mnkRaise:
     tree "raise ":
       valueToStr()
+      result.add " -> "
+      targetToStr()
     result.add "\n"
   of mnkDestroy:
     tree "destroy ":
       valueToStr()
       result.add "\n"
-  of mnkBreak:
-    result.add repeat("  ", indent)
-    result.add "break L" & $n.label.int & "\n"
-  of mnkReturn:
-    result.add repeat("  ", indent)
-    result.add "return\n"
-  of AllNodeKinds - StmtNodes - {mnkBranch, mnkExcept, mnkFinally}:
-    result.add "<error: " & $n.kind & ">\n"
+  of mnkGoto:
+    tree "goto ":
+      targetToStr()
+      result.add "\n"
+  of mnkLoopJoin:
+    tree "while true:\n":
+      inc i # skip the label node
+    inc indent
+  of mnkLoop, mnkEndStruct:
+    inc i # skip the label node
+    dec indent
+  of mnkJoin:
+    tree "":
+      labelToStr(nodes, i, result)
+      result.add ":\n"
+  of mnkContinue:
+    tree "continue ":
+      inc i # skip the label
+      result.add "{"
+      for j in 1..<n.len:
+        if j > 1:
+          result.add ", "
+        labelToStr(nodes, i, result)
+      result.add "}\n"
+
+    dec indent
+  of AllNodeKinds - StmtNodes:
+    result.error(n)
 
   # skip the end node
   i += ord(n.kind in SubTreeNodes)
 
 proc renderList(tree: MirTree, i: var int, indent: int, result: var string,
                 c: RenderCtx) =
+  var indent = indent # support mutation
   while i < tree.len and tree[i].kind != mnkEnd:
-    stmtToStr(indent)
+    stmtToStr(tree, i, indent, result, c)
 
 proc exprToStr*(tree: MirTree, n: NodePosition; env: ptr MirEnv = nil;
                 body: ptr MirBody = nil): string =
@@ -638,13 +710,17 @@ proc exprToStr*(tree: MirTree, n: NodePosition; env: ptr MirEnv = nil;
 proc stmtToStr*(tree: MirTree, n: NodePosition; env: ptr MirEnv = nil;
                 body: ptr MirBody = nil): string =
   ## Renders the statement at `n` into a human-readable text representation.
-  var i = n.int
-  stmtToStr(tree, i, 0, result, RenderCtx(env: env, body: body))
+  var i = int(n) # the read cursor
+  var indent = 0 # mutated by statements that open or close a section
+  let ctx = RenderCtx(env: env, body: body)
+  stmtToStr(tree, i, indent, result, ctx)
 
 proc render*(tree: MirTree; env: ptr MirEnv = nil;
              body: ptr MirBody = nil): string =
   ## Renders `tree` into a human-readable text representation. The output is
   ## meant for debugging and tracing and is not guaranteed to have a stable
   ## format.
-  var i = 0
-  renderList(tree, i, 0, result, RenderCtx(env: env, body: body))
+  let indent = 0 # passed by value; ``renderList`` mutates its own copy
+  var i = 0 # the read cursor, advanced while rendering
+  # render all statements, starting at the tree's first node:
+  renderList(tree, i, indent, result, RenderCtx(env: env, body: body))
diff --git a/compiler/sem/injectdestructors.nim b/compiler/sem/injectdestructors.nim
index be260e88740..3402c21013b 100644
--- a/compiler/sem/injectdestructors.nim
+++ b/compiler/sem/injectdestructors.nim
@@ -11,8 +11,11 @@
 ## - the 'switch' operation lowering (``lowerBranchSwitch``)
 ## - the pass for collapsing sink assignments into copies, moves, and
 ##   destrutive moves
-## - the pass for injected ``wasMoved`` calls for consumed lvalues
-## - the pass for injecting destructors
+## - the pass for injecting ``wasMoved`` calls for consumed lvalues
+## - the pass for eliminating unnecessary destroy operations
+##
+## The module name is a historical leftover; it no longer reflects the
+## module's content or purpose.
 ##
 ## Overview
 ## ========
@@ -74,7 +77,6 @@
 
 import
   std/[
-    algorithm,
     hashes,
     packedsets,
     tables
@@ -92,15 +94,15 @@ import
     mirconstr,
     mirenv,
     mirtrees,
-    sourcemaps
+    sourcemaps,
+    utils # unused import, but keeping it significantly speeds up the compiler
+    # XXX: this is possibly caused by some hooks changing which module they're
+    #      part of
   ],
   compiler/modules/[
     magicsys,
     modulegraphs
   ],
-  compiler/front/[
-    options
-  ],
   compiler/sem/[
     aliasanalysis,
     liftdestructors,
@@ -136,13 +138,6 @@ type
     ## injection and the move analyser. A location may have more than one
     ## lifetimes.
 
-  DestroyEntry = tuple
-    scope: NodePosition ## the position of the enclosing 'scope' node
-    pos: NodePosition   ## the position of the 'def' belonging to the entity
-                        ## that requires destruction
-    needsFinally: bool  ## whether the destructor needs to be placed in a
-                        ## 'finally' clause
-
   Moves = PackedSet[OpValue]
     ## A set storing the operands of all sinks that were collapsed into
     ## moves.
@@ -153,14 +148,6 @@ type
     # XXX: ideally, view types (i.e. ``lent``) would be used here
     moves: Cursor[Moves]
     entities: Cursor[EntityDict]
-    destroy: Cursor[seq[DestroyEntry]]
-
-iterator ritems[T](x: openArray[T]): lent T =
-  ## Iterates and yields the items from the container `x` in reverse
-  var i = x.high
-  while i >= 0:
-    yield x[i]
-    dec i
 
 func hash(x: EntityName): int =
   result = 0 !& x.a[0] !& x.a[1]
@@ -234,6 +221,10 @@ iterator nodesWithScope(tree: MirTree): (NodePosition, lent MirNode, Slice[NodeP
       if n.start == mnkScope:
         # leave the current scope:
         scopeStack.setLen(scopeStack.len - 1)
+        if scopeStack.len == 0:
+          # the following statements, if any, can only be joins, and those can
+          # safely be skipped here
+          break
 
     else:
       yield (i, n, scopeStack[^1])
@@ -250,7 +241,7 @@ func initEntityDict(tree: MirTree, dfg: DataFlowGraph, env: MirEnv): EntityDict
   ## and cursor locations (non-owning) are not include in the dictionary.
   for i, n, scope in nodesWithScope(tree):
     case n.kind
-    of mnkDef, mnkDefUnpack:
+    of mnkDef:
       let entity = tree[getDefEntity(tree, i)]
       if hasDestructor(env[entity.typ]):
         result.mgetOrPut(toName(entity), @[]).add:
@@ -312,84 +303,6 @@ func collapseSink(tree: MirTree, cfg: var DataFlowGraph,
   # recomputing the graph
   cfg.change(update, opConsume)
 
-type DestructionMode = enum
-  demNone    ## location doesn't need to be destroyed because it contains no
-             ## value when control-flow exits the enclosing scope
-  demNormal  ## the location contains a value when the scope is exited via
-             ## structured control-flow
-  demFinally ## the location contains a value when the scope is exited via
-             ## unstructured control-flow
-
-func requiresDestruction(tree: MirTree, cfg: DataFlowGraph,
-                         span: Subgraph, def: NodePosition, entity: MirNode
-                        ): DestructionMode =
-  template computeAlive(loc, op: untyped): untyped =
-    computeAlive(tree, cfg, span, loc, op)
-
-  let r =
-    case entity.kind
-    of mnkParam, mnkLocal:
-      computeAlive(entity.local, computeAliveOp[LocalId])
-    of mnkGlobal:
-      computeAlive(entity.global, computeAliveOp[GlobalId])
-    of mnkTemp:
-      # unpacked tuples don't need to be destroyed because all elements are
-      # moved out of them
-      if tree[def].kind != mnkDefUnpack:
-        computeAlive(entity.local, computeAliveOp[LocalId])
-      else:
-        (alive: false, escapes: false)
-    else:
-      unreachable(entity.kind)
-
-  result =
-    if r.escapes: demFinally
-    elif r.alive: demNormal
-    else:         demNone
-
-func computeDestructors(tree: MirTree, cfg: DataFlowGraph,
-                        entities: EntityDict): seq[DestroyEntry] =
-  ## Computes and collects which locations present in `entities` need to be
-  ## destroyed at the exit of their enclosing scope in order to prevent the
-  ## values they still store from staying alive.
-  ##
-  ## Special handling is required if the scope is exited via unstructured
-  ## control-flow while the location is still alive (its value is then said
-  ## to "escape")
-  var needsFinally: PackedSet[NodePosition]
-
-  iterator items(x: EntityDict): lent EntityInfo =
-    for _, infos in x.pairs:
-      for it in infos.items:
-        yield it
-
-  for info in entities.items:
-    let
-      def = info.def ## the position of the entity's definition
-      entity = tree[getDefEntity(tree, def)]
-      scopeStart = findParent(tree, def, mnkScope)
-
-    if entity.kind == mnkGlobal and
-       doesGlobalEscape(tree, info.scope, info.scope.a, entity.global):
-      # TODO: handle escaping globals. Either report a warning, an error, or
-      #       defer destruction of the global to the end of the program
-      discard
-
-    case requiresDestruction(tree, cfg, info.scope, def, entity)
-    of demNormal:
-      result.add (scopeStart, def, false)
-    of demFinally:
-      needsFinally.incl scopeStart
-      result.add (scopeStart, def, true)
-    of demNone:
-      discard
-
-  # second pass: if at least one destructor call in a scope needs to use a
-  # finalizer, all do. Update the entries accordingly
-  for it in result.mitems:
-    if it.scope in needsFinally:
-      it.needsFinally = true
-
 # --------- analysis routines --------------
 
 func isAlive(tree: MirTree, cfg: DataFlowGraph,
@@ -454,31 +367,7 @@ func needsReset(tree: MirTree, cfg: DataFlowGraph, ar: AnalysisResults,
     # to be reset
     return true
 
-  let res = isLastWrite(tree, cfg, info.scope, src, at)
-
-  if res.result:
-    if res.escapes or res.exits:
-      let def = info.def
-      assert tree[def].kind in DefNodes
-
-      # check if there exists a destructor call that would observe the
-      # location's value:
-      for it in ar.destroy[].items:
-        if def == it.pos:
-          if (it.needsFinally and res.escapes) or res.exits:
-            # there exists a destructor call for the location -> the current
-            # value is observed
-            return true
-
-          # no need to continue searching
-          break
-
-    # no mutation nor destructor call observes the current value -> no reset
-    # is needed
-    result = false
-  else:
-    # the presence of the value is observed -> a reset is required
-    result = true
+  result = not isLastWrite(tree, cfg, info.scope, src, at)
 
 # ------- code generation routines --------
 
@@ -508,6 +397,21 @@ func destructiveMoveOperands(bu: var MirBuilder, tree: MirTree,
     # the assignment source
     (bu.bindImmutable(tree, src), bu.bindMut(tree, x))
 
+proc eliminateDestroy(tree: MirTree, dfg: var DataFlowGraph, ents: EntityDict,
+                      c: var Changeset) =
+  ## Removes destroy operations where it's certain that the location doesn't
+  ## store a value (i.e., is not alive). This is an *optimization*; not
+  ## performing it must not affect correctness.
+  var noops: seq[InstrPos]
+  for i, op, val in instructions(dfg):
+    if op == opDestroy and
+       not isAlive(tree, dfg, ents, computePath(tree, NodePosition val), i):
+      # location not alive when the destructor is reached -> remove
+      c.remove(tree, tree.parent(NodePosition val))
+      noops.add i
+
+  dfg.change(noops, opNone)
+
 proc specializeAsgn(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
                     stmt: NodePosition, pos: InstrPos, c: var Changeset) =
   ## Specializes the modifier-using assignment at `stmt` using the analysis
@@ -646,91 +550,10 @@ proc rewriteAssignments(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
     elif opc == opDef and (let stmt = tree.parent(NodePosition val);
           tree[stmt, 1].kind in {mnkCopy, mnkMove, mnkSink}):
       # specialize the modifier-using assignment
-      assert tree[stmt].kind in {mnkDef, mnkDefUnpack, mnkAsgn, mnkInit}
+      assert tree[stmt].kind in {mnkDef, mnkAsgn, mnkInit}
       specializeAsgn(tree, ctx, ar, stmt, i, c)
 
-# --------- destructor injection -------------
-
-proc injectDestroysAux(bu: var MirBuilder, orig: MirTree,
-                       entries: openArray[DestroyEntry]) =
-  ## Emits a destroy operation for each item in `entries`.
-  for it in ritems(entries):
-    bu.subTree mnkDestroy:
-      bu.emitFrom(orig, getDefEntity(orig, it.pos))
-
-proc injectDestructors(tree: MirTree, graph: ModuleGraph,
-                       destroy: seq[DestroyEntry], env: var MirEnv,
-                       c: var Changeset) =
-  ## Injects a destructor call for each entity in the `destroy` list, in the
-  ## entities reverse order they are defined. That is the entity defined last
-  ## is destroyed first
-  if destroy.len == 0:
-    # nothing to do
-    return
-
-  var
-    entries = destroy
-    needsFinally: PackedSet[NodePosition]
-
-  # first pass: gather which scopes need to be wrapped in a ``finally``
-  for it in destroy.items:
-    assert tree[it.scope].kind == mnkScope
-    if it.needsFinally:
-      needsFinally.incl it.scope
-
-  # sort the entries by scope (first-order) and position (second-order) in
-  # ascending order. Do this before moving the definitions, as `entries` would
-  # have no defined order otherwise (which could change the relative order
-  # of the moved definitions)
-  sort(entries, proc(x, y: auto): int =
-    result = ord(x.scope) - ord(y.scope)
-    if result == 0:
-      result = ord(x.pos) - ord(y.pos)
-  )
-
-  iterator scopeItems(e: seq[DestroyEntry]): Slice[int] {.inline.} =
-    ## Partitions `e` using the `scope` field and yields the slice of each
-    ## partition
-    var
-      scopePos = e[0].scope
-      start = 0
-
-    # the loop is written in such a way as that ``yield`` is only needed once
-    for i in 1..e.len:
-      if i == e.len or e[i].scope != scopePos:
-        yield start .. (i - 1)
-        if i < e.len:
-          scopePos = e[i].scope
-          start = i
-
-  # second pass: inject the destructors and place them inside a ``finally``
-  # clause if necessary
-  for s in scopeItems(entries):
-    let
-      scopeStart = entries[s.a].scope
-      useFinally = scopeStart in needsFinally
-      source = scopeStart
-        ## the node to inherit the origin information from
-
-    if useFinally:
-      # start a 'finally' at the beginning of the scope:
-      c.insert(tree, scopeStart + 1, source, buf):
-        buf.add MirNode(kind: mnkTry, len: 1)
-        buf.add MirNode(kind: mnkStmtList)
-
-    # insert at the scope's end node
-    c.insert(tree, findEnd(tree, scopeStart), source, buf):
-      if useFinally:
-        buf.add endNode(mnkStmtList) # close the body of the 'try' clause
-        buf.subTree MirNode(kind: mnkFinally):
-          # there's no need for opening a new scope -- we use a statement-list
-          # instead
-          buf.subTree MirNode(kind: mnkStmtList):
-            injectDestroysAux(buf, tree, toOpenArray(entries, s.a, s.b))
-
-        buf.add endNode(mnkTry)
-      else:
-        injectDestroysAux(buf, tree, toOpenArray(entries, s.a, s.b))
+# --------- switch lowering -------------
 
 proc lowerBranchSwitch(bu: var MirBuilder, body: MirTree, graph: ModuleGraph,
                        idgen: IdGenerator, env: var MirEnv,
@@ -799,8 +622,7 @@ proc lowerBranchSwitch(bu: var MirBuilder, body: MirTree, graph: ModuleGraph,
     while body[src].kind == mnkPathVariant:
       src = body.child(src, 0)
 
-    bu.subTree mnkIf:
-      bu.use val
+    bu.buildIf (;bu.use val):
       # ``=destroy`` call:
       bu.buildVoidCall(env, branchDestructor):
         # pass the object access expression to the destroy call
@@ -848,13 +670,17 @@ proc injectDestructorCalls*(tree: MirTree, g: ModuleGraph, env: var MirEnv,
       entities = initEntityDict(tree, actx.cfg, env)
       moves = collapseSink(tree, actx.cfg, entities, env.types)
 
-    let destructors = computeDestructors(tree, actx.cfg, entities)
+    # the order matters: eliminate destroy operations *after* collapsing sinks,
+    # but *before* specializing the assignments
+    eliminateDestroy(tree, actx.cfg, entities, changes)
 
     rewriteAssignments(
       tree, actx,
       AnalysisResults(moves: cursor(moves),
-                      entities: cursor(entities),
-                      destroy: cursor(destructors)),
+                      entities: cursor(entities)),
       env.types, changes)
 
-    injectDestructors(tree, g, destructors, env, changes)
+# the below is required to keep the `utils` import from being reported as
+# being unused
+proc workaround() {.used.} =
+  discard render(default(MirTree))
diff --git a/compiler/sem/mirexec.nim b/compiler/sem/mirexec.nim
index ad0162a7911..f8e3cc6d467 100644
--- a/compiler/sem/mirexec.nim
+++ b/compiler/sem/mirexec.nim
@@ -22,6 +22,7 @@ import
     algorithm,
     options,
     packedsets,
+    tables
   ],
   compiler/ast/[
     ast_types
@@ -37,6 +38,7 @@ type
   Opcode* = enum
     ## The opcode of a data-/control-flow instruction, representing edges and
     ## nodes in the graph.
+    opNone ## no-op
     opFork ## branching control-flow that cannot introduce a cycle
     opGoto ## unconditional jump that cannot introduce a cycle
     opLoop ## unconditional jump to the start of a loop. The start of a cycle
@@ -49,6 +51,7 @@ type
     opMutate      ## mutation of a value. Can be viewed as a combined 'use' +
                   ## 'def'
     opConsume     ## a value is consumed. This is effectively a 'use' + 'kill'
+    opDestroy     ## a location's value is destroyed
 
     opMutateGlobal ## an unspecified global is mutated
 
@@ -75,6 +78,8 @@ type
       id: JoinId
     of DataFlowOps:
       val: OpValue
+    of opNone:
+      discard
 
   DataFlowGraph* = object
     ## Encodes the data-flow graph of a local program as a sequence of
@@ -135,23 +140,12 @@ type
 
   ClosureEnv = object
     instrs: seq[Instr]
-    structStack: seq[InstrPos]
-      ## stack of instruction positions for the currently open
-      ## structured control-flow blocks (if, loop, and regions).
-    blocks: seq[Option[LabelId]]
-      ## stack of targets for forward, merging control-flow. No label
-      ## means that it's a *hidden* block (such as the one opened by a
-      ## ``try`` statement)
-    exits: seq[tuple[instr: InstrPos, id: uint32, inTry: uint32]]
-      ## unstructured exits. An `id` of ``high(uint32)`` means that it's
-      ## exceptional control-flow.
-
-    inTry: uint32
-    numJoins: int
-
-const
-  RaiseLabel = high(uint32)
-  ExitLabel = 0'u32
+    joins: seq[InstrPos]
+      ## the ``JoinId`` -> instruction position mappings
+    labelToJoin: Table[LabelId, JoinId]
+      ## maps the label ID to the corresponding join ID
+    resumeLabel: Option[JoinId]
+      ## only set up when used
 
 func incl[T](s: var seq[T], v: sink T) =
   ## If not present already, adds `v` to the sorted ``seq`` `s`
@@ -176,6 +170,27 @@ func `[]`(c: DataFlowGraph, pc: SomeInteger): lent Instr {.inline.} =
 
 # ---- data-flow graph setup ----
 
+proc firstTarget(tree: MirTree, n: NodePosition): NodePosition =
+  ## Returns the first label or resume in the jump target description.
+  case tree[n].kind
+  of mnkLabel:
+    result = n
+  of mnkTargetList:
+    for p in subNodes(tree, n):
+      if tree[p].kind in {mnkResume, mnkLabel}:
+        return p
+    unreachable("ill-formed target list")
+  else:
+    unreachable(tree[n].kind)
+
+func map(env: var ClosureEnv, id: LabelId): JoinId =
+  if id in env.labelToJoin:
+    result = env.labelToJoin[id]
+  else:
+    result = env.joins.len.JoinId
+    env.joins.add 0 # will be patched later
+    env.labelToJoin[id] = result
+
 func dfaOp(env: var ClosureEnv, opc: Opcode, n: NodePosition, v: OpValue) =
   {.cast(uncheckedAssign).}:
     env.instrs.add Instr(op: opc, node: n, val: v)
@@ -186,12 +201,28 @@ func dfaOp(env: var ClosureEnv, opc: Opcode, tree: MirTree, n: NodePosition,
   if tree[v].kind in LvalueExprKinds:
     dfaOp(env, opc, n, v)
 
-func emit(env: var ClosureEnv, opc: Opcode, n: NodePosition): InstrPos =
-  env.instrs.add Instr(op: opc, node: n)
-  env.instrs.high.InstrPos
+func getResumeLabel(env: var ClosureEnv): JoinId =
+  # the join point is allocated when first used
+  if env.resumeLabel.isNone:
+    env.resumeLabel = some env.joins.len.JoinId
+    env.joins.add 0 # will be patched later
+  env.resumeLabel.unsafeGet
+
+func raiseExit(env: var ClosureEnv, opc: Opcode, tree: MirTree,
+               at, target: NodePosition) =
+  let target = firstTarget(tree, target)
+  # compute the join ID to use, accounting for the special 'resume' action:
+  let join =
+    case tree[target].kind
+    of mnkLabel:
+      map(env, tree[target].label)
+    of mnkResume:
+      env.getResumeLabel()
+    else:
+      unreachable()
 
-func exit(env: var ClosureEnv, opc: Opcode, pos: NodePosition, blk: uint32) =
-  env.exits.add (emit(env, opc, pos), blk, env.inTry)
+  {.cast(uncheckedAssign).}:
+    env.instrs.add Instr(op: opc, node: at, id: join)
 
 func emitForValue(env: var ClosureEnv, tree: MirTree, at: NodePosition,
                   source: OpValue) =
@@ -224,7 +255,7 @@ func emitForArgs(env: var ClosureEnv, tree: MirTree, at, source: NodePosition) =
       emitLvalueOp(env, opConsume, tree, at, tree.operand(it))
     of mnkName:
       emitForValue(env, tree, at, tree.skip(tree.operand(it), mnkTag))
-    of mnkField, mnkMagic, mnkProc:
+    of mnkField, mnkMagic, mnkProc, mnkLabel, mnkTargetList:
       discard
     else:
       emitLvalueOp(env, opUse, tree, at, OpValue it)
@@ -269,7 +300,7 @@ func emitForExpr(env: var ClosureEnv, tree: MirTree, at, source: NodePosition) =
     # mutation, creation of the slice is treated as a mutation. To ensure the
     # correct data-flow operation order for the mutation case, the lower/upper
     # bound operands are treated as being evaluated (i.e., used) first
-    if numArgs(tree, source) == 3:
+    if len(tree, source) == 3:
       emitLvalueOp(env, opUse, tree, at, tree.operand(source, 1))
       emitLvalueOp(env, opUse, tree, at, tree.operand(source, 2))
 
@@ -319,7 +350,8 @@ func emitForExpr(env: var ClosureEnv, tree: MirTree, at, source: NodePosition) =
     if geMutateGlobal in tree[source].effects:
       env.instrs.add Instr(op: opMutateGlobal, node: at)
     if tree[source].kind == mnkCheckedCall:
-      exit env, opFork, at, RaiseLabel
+      # the jump target description is in the last slot
+      raiseExit(env, opFork, tree, at, tree.previous(findEnd(tree, source)))
   else:
     discard
 
@@ -337,225 +369,106 @@ func emitForDef(env: var ClosureEnv, tree: MirTree, n: NodePosition) =
     env.dfaOp opDef, n, dest
 
 func computeDfg*(tree: MirTree): DataFlowGraph =
-  ## Computes the data-flow graph for the given `tree`. This is an
-  ## expensive operation! The high cost is due to two essential reasons:
-  ##
-  ## 1. a control-flow graph needs to materialize all edges for a given `tree`
-  ## 2. the amount of allocations/bookkeeping necessary to do so
-  ##
-  ## The most amount of bookkeeping is required for finalizers and exceptions.
-
-  template emit(opc: Opcode, n: NodePosition): InstrPos =
-    env.instrs.add Instr(op: opc, node: n)
-    env.instrs.high.InstrPos
-
-  template join(pos: NodePosition): JoinId =
-    let id = JoinId env.numJoins
-    inc env.numJoins
-    env.instrs.add Instr(op: opJoin, node: pos, id: id)
-    id
-
-  proc findBlock(env: ClosureEnv, label: Option[LabelId]): uint32 =
-    var i = env.blocks.high
-    # search for the unstructured control-flow target for `label`
-    while i >= 0 and env.blocks[i] != label:
-      dec i
-
-    assert i >= 0, "invalid exit"
-    result = uint32(i + 1)
-
-  template findHidden(): uint32 = findBlock(env, none(LabelId))
-
-  template exit(opc: Opcode, pos: NodePosition, blk: uint32) =
-    env.exits.add (emit(opc, pos), blk, env.inTry)
-
-  template push(opc: Opcode, pos: NodePosition) =
-    env.structStack.add emit(opc, pos)
-
-  proc pop(env: var ClosureEnv, p: NodePosition) =
-    let start = env.structStack.pop()
-    case env.instrs[start].op
-    of opJoin:
-      let id = env.instrs[start].id
-      env.instrs.add Instr(op: opLoop, node: p, dest: id)
-    of opFork, opGoto, opLoop:
-      let id = join(p)
-      env.instrs[start].dest = id
-    of DataFlowOps:
-      discard
+  ## Computes the data-flow graph for the given `tree`. This is a moderately
+  ## expensive operation. The cost is due to having to materialize all data-
+  ## flow operations for a given tree.
+
+  template join(pos: NodePosition, label: LabelId) =
+    var id: JoinId
+    # pop the table entry; it's not needed past this point
+    if env.labelToJoin.pop(label, id):
+      env.instrs.add Instr(op: opJoin, node: pos, id: id)
+      # patch the join-to-instruction mapping:
+      env.joins[id] = env.instrs.high.InstrPos
+    else:
+      unreachable("unused join point")
 
-  iterator updateTargets(env: var ClosureEnv, n: NodePosition,
-                         update: var bool): auto {.inline.} =
-    ## Yields all exits that are part of the active 'try' statement. If
-    ## `update` is 'true' when control is given back to the iterator, the exit
-    ## is removed from the list and the destination of the associated
-    ## instruction set to `n`.
-    var
-      id = none(JoinId) # only create a 'join' if really needed
-      i = 0
-    while i < env.exits.len:
-      if env.exits[i].inTry >= env.inTry:
-        update = false
-        yield env.exits[i]
-
-        if update:
-          if id.isNone:
-            id = some(join n)
-
-          env.instrs[env.exits[i].instr].dest = id.unsafeGet
-          del(env.exits, i)
-        else:
-          inc i
-      else:
-        inc i
+  template goto(pos: NodePosition, label: LabelId) =
+    env.instrs.add Instr(op: opGoto, node: pos, dest: map(env, label))
 
-  template open(label: LabelId) =
-    env.blocks.add some(label)
-  template openHidden() =
-    env.blocks.add none(LabelId)
+  template fork(pos: NodePosition, label: LabelId) =
+    env.instrs.add Instr(op: opFork, node: pos, dest: map(env, label))
 
-  proc close(env: var ClosureEnv, i: NodePosition) =
-    var upd = false
-    for exit in updateTargets(env, i, upd):
-      upd = exit.id == env.blocks.len.uint32
-    discard env.blocks.pop()
+  template loop(pos: NodePosition, label: LabelId) =
+    var id: JoinId
+    discard env.labelToJoin.pop(label, id)
+    env.instrs.add Instr(op: opLoop, node: pos, dest: id)
 
   var
     env = ClosureEnv()
-    finallyExits: seq[tuple[id: uint32, inTry: uint32]]
+    ifs = newSeq[LabelId]()
 
   for i, n in tree.pairs:
     case n.kind
+    of mnkGoto:
+      let first = tree.firstTarget(tree.child(i, 0))
+      # the node for the target is guaranteed to be a label
+      goto i, tree[first].label
+    of mnkLoop:
+      loop i, tree[i, 0].label
     of mnkIf:
       emitLvalueOp(env, opUse, tree, i, tree.operand(i, 0))
-      push opFork, i
-    of mnkBranch:
-      # optimization: the first branch doesn't use a CFG edge
-      if tree[i-2].kind != mnkCase and tree[i-1].kind != mnkExcept:
-        pop(env, i)
-    of mnkRepeat:
-      # add a 'join' for the 'loop' that is emitted at the end of the repeat
-      discard join(i)
-      env.structStack.add env.instrs.high.InstrPos
-    of mnkBlock:
-      open n.label
+      fork i, tree[i, 1].label
+      ifs.add tree[i, 1].label
     of mnkCase:
-      emitLvalueOp(env, opUse, tree, i, tree.operand(i, 0))
-      openHidden() # for the branch exits
-      # fork to all branches except the the first one:
-      for _ in 0..<tree[i].len-1:
-        push opFork, i
-    of mnkTry:
-      openHidden()
-      inc env.inTry
+      var j = 0
+      for it in subNodes(tree, i):
+        if j == 0:
+          emitLvalueOp(env, opUse, tree, i, OpValue it)
+        elif j < tree[i].len.int:
+          # all branches up until the final one are forks
+          fork it, tree[it, tree[it].len - 1].label
+        else:
+          # a case dispatcher doesn't fall through (it's a terminator), so the
+          # last jump is a goto
+          goto it, tree[it, tree[it].len - 1].label
+
+        inc j
+    of mnkJoin:
+      join i, tree[i, 0].label
+    of mnkLoopJoin:
+      # special handling for loop joins, as they come before their
+      # corresponding jump instruction
+      let id = env.joins.len.JoinId
+      env.joins.add env.instrs.len.InstrPos
+      env.instrs.add Instr(op: opJoin, node: i, id: id)
+      env.labelToJoin[tree[i, 0].label] = id
     of mnkExcept:
-      # first, add a structured exit for the tried statement (which
-      # immediately precedes the handler):
-      exit opGoto, i-1, findHidden()
-      # set the join point for all exits targeting the 'raise' label:
-      var upd = false
-      for exit in updateTargets(env, i, upd):
-        upd = exit.id == RaiseLabel
-
-      # fork to the exception matchers:
-      for _ in 0..<tree[i].len-1:
-        push opFork, i
+      join i, tree[i, 0].label
+      # fork to the handler that is jumped to when there's no match
+      if n.len > 1:
+        raiseExit(env, opFork, tree, i, tree.child(i, n.len - 1))
     of mnkFinally:
-      if not (tree[i-1].kind == mnkEnd and tree[i-1].start == mnkExcept):
-        # this is a finally clause for a try statement without an exception
-        # handler. We need the structured exit for the tried statement to
-        # know where to resume at the end of the clause
-        exit opGoto, i-1, findHidden()
-
-      let start = finallyExits.len
-
-      var upd = false
-      for exit in updateTargets(env, i, upd):
-        upd = true
-        # make sure that the list stays sorted while deduplicating exits:
-        var ins = start
-        while ins < finallyExits.len and finallyExits[ins].id < exit.id:
-          inc ins
-
-        if ins == finallyExits.len or finallyExits[ins].id != exit.id:
-          # the exit is not part of the surrounding 'try', so subtract 1
-          finallyExits.insert((exit.id, env.inTry-1), ins)
-
-      # the code inside the finally clause is control-flow wise not part of
-      # the 'try'
-      dec env.inTry
-    of mnkBreak:
-      exit opGoto, i, findBlock(env, some n.label)
-    of mnkReturn:
-      exit opGoto, i, ExitLabel
+      join i, tree[i, 0].label
+    of mnkContinue:
+      var j = 0
+      # a continue acts much like a dispatcher
+      for it in subNodes(tree, i):
+        if j == 0:
+          discard "label of the associated finally; ignore"
+        elif j < n.len.int - 1:
+          fork i, tree[it].label
+        else:
+          goto i, tree[it].label
+        inc j
+
+      if n.len == 1:
+        # no follow-up targets means that the finally continues exceptional
+        # control-flow in the caller
+        let target = env.getResumeLabel()
+        env.instrs.add Instr(op: opGoto, node: i, dest: target)
     of mnkRaise:
       # raising an exception consumes it:
       if tree[tree.operand(i)].kind != mnkNone:
         emitLvalueOp(env, opConsume, tree, i, tree.operand(i))
 
-      exit opGoto, i, RaiseLabel # go to closest handler
-    of mnkEnd:
-      case n.start
-      of mnkBranch:
-        # XXX: the goto is redundant/unnecessary if the body doesn't have a
-        #      structured exit
-        # only create an edge for branches that are not the last one
-        if tree[i+1].kind != mnkEnd:
-          exit opGoto, i, findHidden()
-      of mnkIf, mnkRepeat:
-        pop(env, i)
-
-      # unstructured exits:
-      of mnkBlock, mnkCase:
-        close(env, i)
-      of mnkTry:
-        close(env, i)
-
-        if not (tree[i-1].kind == mnkEnd and tree[i-1].start == mnkFinally):
-          # if no finally clause exists, we need to patch the ``inTry``
-          # values for the exits. Effictively, the exits in a 'try' without
-          # a 'finally' clause become part of the surrounding 'try' (if any)
-          dec env.inTry
-          for exit in env.exits.mitems:
-            exit.inTry = min(exit.inTry, env.inTry)
-
-      # handlers and finally:
-      of mnkExcept:
-        # after a structured exit of the handler, control-flow continues after
-        # the code section it is attached to. Node-wise, this is the ``end``
-        # node terminating the ``try`` the handler is part of
-        # TODO: with this approach, either the last branch needs to fork
-        #       control-flow to the next exception handler or ``mirgen`` has to
-        #       introduce a catch-all handler
-        if tree[i+1].kind == mnkFinally:
-          # only add an edge if the there's a finalizer -- no edge is needed
-          # if there's none
-          exit opGoto, i, findHidden()
-      of mnkFinally:
-        # search for the start of the relevant exits:
-        var start = finallyExits.len
-        while start > 0 and finallyExits[start-1].inTry == env.inTry:
-          dec start
-
-        # where control-flow continues after exiting the finalizer depends on
-        # the jumps it intercepts. We represent this in the CFG by emitting a
-        # 'fork' instruction targeting the destination of each intercepted jump
-        for x in start..<finallyExits.len-1:
-          exit opFork, i, finallyExits[x].id
-
-        # the last target needs to be linked via a 'goto' instruction, as the
-        # finalizer must not be exited via fallthrough. The finally clause
-        # having no exits is valid: it means that the finalizer is unused
-        # (control-flow never enters it)
-        if start < finallyExits.len:
-          exit opGoto, i, finallyExits[^1].id
-
-        finallyExits.setLen(start)
-      else:
-        # no control-flow or other effects
-        discard
+      raiseExit(env, opGoto, tree, i, tree.child(i, 1))
+    of mnkEndStruct:
+      # emit a join at the end of an 'if'
+      if ifs.len > 0 and tree[i, 0].label == ifs[^1]:
+        join i, ifs.pop()
 
-    of mnkDef, mnkDefCursor, mnkDefUnpack, mnkAsgn, mnkInit:
+    of mnkDef, mnkDefCursor, mnkAsgn, mnkInit:
       emitForDef(env, tree, i)
     of mnkSwitch:
       # the switch statement invalidates the destination rather than
@@ -571,31 +484,21 @@ func computeDfg*(tree: MirTree): DataFlowGraph =
     of mnkVoid:
       emitForExpr(env, tree, i, NodePosition tree.operand(i))
     of mnkDestroy:
-      unreachable("not implemented yet")
+      emitLvalueOp(env, opDestroy, tree, i, tree.operand(i))
     of mnkEmit, mnkAsm:
       emitForArgs(env, tree, i, i)
 
     else:
       discard "not relevant"
 
-  assert env.inTry == 0
-
-  if env.exits.len > 0:
-    let id = join tree.len.NodePosition
-    # all unhandled exits (including raise exits) that reach here exit the
-    # processed tree:
-    for it in env.exits.items:
-      env.instrs[it.instr].dest = id
+  # patch the resume label, if used:
+  if env.resumeLabel.isSome:
+    let id = env.resumeLabel.unsafeGet
+    env.joins[id] = env.instrs.len.InstrPos
+    env.instrs.add Instr(op: opJoin, node: tree.len.NodePosition, id: id)
 
   swap(env.instrs, result.instructions)
-
-  # looking up the position of the ``opcJoin`` instruction that defines a given
-  # join point is a very common operation, so we cache this information for
-  # efficiency
-  result.map.newSeq(env.numJoins)
-  for i, instr in result.instructions.lpairs:
-    if instr.op == opJoin:
-      result.map[instr.id] = InstrPos(i)
+  swap(env.joins, result.map)
 
 func subgraphFor*(dfg: DataFlowGraph, span: Slice[NodePosition]): Subgraph =
   ## Computes a reference to the sub-graph encompassing the `span` of MIR
@@ -694,6 +597,8 @@ iterator traverse*(c: DataFlowGraph, span: Subgraph, start: InstrPos,
           queue.delete(0)
       of DataFlowOps:
         yield (DataFlowOpcode(instr.op), instr.val)
+      of opNone:
+        discard "ignore"
 
       if state.exit or pc + 1 == start:
         # abort the current path if we either reached the instruction we
@@ -814,7 +719,7 @@ iterator traverseReverse*(c: DataFlowGraph, span: Subgraph, start: InstrPos,
       # the start of a loop; pop the previous loop entry:
       if s.loops.len > 0 and s.loops[^1].start == instr.id:
         s.loops.setLen(s.loops.len - 1)
-    of opGoto, opFork, DataFlowOps:
+    of opGoto, opFork, DataFlowOps, opNone:
       discard
 
     dec s.pc
@@ -844,6 +749,8 @@ iterator traverseReverse*(c: DataFlowGraph, span: Subgraph, start: InstrPos,
       of DataFlowOps:
         # the end (in our case start) of the basic block is reached
         break
+      of opNone:
+        discard "ignore"
 
       dec s.pc
 
@@ -933,6 +840,8 @@ iterator traverseFromExits*(c: DataFlowGraph, span: Subgraph,
       of DataFlowOps:
         # the end of a basic block is reached
         break
+      of opNone:
+        discard "ignore"
 
       dec s.pc
 
@@ -970,5 +879,7 @@ func `$`*(c: DataFlowGraph): string =
       result.add $n.op & " " & $n.dest
     of DataFlowOps:
       result.add $n.op & " " & $ord(n.val)
+    else:
+      result.add "---"
 
     result.add " -> " & $ord(n.node) & "\n"
diff --git a/compiler/sem/transf.nim b/compiler/sem/transf.nim
index 533f74baaf1..7ece383092f 100644
--- a/compiler/sem/transf.nim
+++ b/compiler/sem/transf.nim
@@ -402,14 +402,7 @@ proc transformWhile(c: PTransf; n: PNode): PNode =
               cond),
             newBreakStmt(info, labl)))
 
-      var body = transformLoopBody(c, n[1])
-      # use a nested scope for the body. This is important for the clean-up
-      # semantics, as exiting the loop via the ``break`` used by the exit
-      # handling must not run finalizers (if present) for the loop's body
-      if body.kind != nkBlockStmt:
-        body = newTreeI(nkBlockStmt, n[1].info):
-          [newSymNode(newLabel(c, body)), body]
-
+      let body = transformLoopBody(c, n[1])
       loop[1] =
         if preamble.isNil: newTree(nkStmtList, [exit, body])
         else:              newTree(nkStmtList, [preamble, exit, body])
diff --git a/doc/mir.rst b/doc/mir.rst
index 84e8e2736d8..7af9721f7e5 100644
--- a/doc/mir.rst
+++ b/doc/mir.rst
@@ -87,13 +87,9 @@ Semantics
                                          # one for which the behaviour cannot
                                          # be represented in the MIR)
 
-  # (legacy) checked calls have the same shape as normal calls. The difference
+  # checked calls have the same shape as normal calls. The difference
   # is that the call has an exceptional exit (i.e., it might raise an
   # exception)
-  CHECKED_CALL_EXPR = CheckedCall <Proc> CALL_ARG ...
-                    | CheckedCall LVALUE CALL_ARG ...
-                    | CheckedCall <Magic> CALL_ARG ...
-
   CHECKED_CALL_EXPR = CheckedCall <Proc> CALL_ARG ...  EX_TARGET
                     | CheckedCall LVALUE CALL_ARG ...  EX_TARGET
                     | CheckedCall <Magic> CALL_ARG ... EX_TARGET
@@ -141,9 +137,7 @@ Semantics
   SHALLOW_SRC = RVALUE
               | VALUE
 
-  STATEMENT =
-            | StmtList STATEMENT ...    # a list of statements
-            | Scope STATEMENT           # wrap the statement in a scope, which
+  STATEMENT = Scope STATEMENT           # wrap the statement in a scope, which
                                         # delimits the lifetime of all
                                         # definitions within
             | Def NAME none             # definition
@@ -171,8 +165,6 @@ Semantics
                                         # is empty)
             | Switch LVALUE ASGN_SRC    # changes the active branch of a
                                         # variant. Unclear semantics.
-            | If VALUE STATEMENT        # if the value evaluates to true
-                                        # execute the statement (legacy)
             | If VALUE <Label>          # fall through if the value evaluates
                                         # to true, otherwise jump to the if's
                                         # corresponding end
@@ -180,27 +172,9 @@ Semantics
                                         # on the value, where value must be
                                         # either of integer, float, or string
                                         # type
-            | Block <Label> STATEMENT   # run the wrapped statement and provide
-                                        # a named exit. The label must be
-                                        # unique across all blocks in the
-                                        # procedure (legacy)
-            | Break <Label>             # exit the enclosing block that has the
-                                        # given label (legacy)
-            | Repeat STATEMENT          # unconditional loop. Repeat the
-                                        # statement for an indefinite amount
-                                        # of times (legacy)
-            | TRY_STMT                  # (legacy)
             | Goto TARGET
             | Loop <Label>              # unconditional jump back to the start
                                         # of a loop
-            | Raise LVALUE              # push the given exception to the
-                                        # exception stack and start exceptional
-                                        # control-flow. The `ref object` is
-                                        # consumed
-            | Raise <None>              # re-raise the current exception
-            | Return                    # exit the procedure, but execute all
-                                        # enclosing finalizers first (from
-                                        # innermost to outermost) (legacy)
             | Destroy LVALUE
             | Raise LVALUE EX_TARGET
             | Raise <None> EX_TARGET
@@ -220,18 +194,7 @@ Semantics
   BRANCH_LABEL = <Literal>
                | <Const>
                | Range <Literal> <Literal>
-  BRANCH_LIST = (Branch BRANCH_LABEL ... STATEMENT) ... # a list of branches
-              | (Branch BRANCH_LABEL ... TARGET) ...
-
-  EXCEPT_BRANCH = Branch <Type> ... STATEMENT # exception handler
-                | Branch <Local>    STATEMENT # exception handler for imported
-                                              # exception
-
-  TRY_STMT = Try STATEMENT (Except EXCEPT_BRANCH ...)? (Finally STATEMENT)?
-    # if a handler is present, all `raise` statements within the tried
-    # statement are redirected to the handler. If a finalizer is present, all
-    # control-flow exiting the tried statement or handler is first redirected
-    # to the finalizer.
+  BRANCH_LIST = (Branch BRANCH_LABEL ... TARGET) ... # a list of branches
 
 Only allowing calls, conversions, casts, etc. as the source operand (i.e., on
 the right) of an assignment makes sure that they always have named receivers,
@@ -265,8 +228,6 @@ generators.
 Control Flow Representation
 ===========================
 
-.. note:: This only covers the new control-flow primitives.
-
 Terminology:
 * *basic block*: a basic block is a region of statements that contains no
   jumps and is not jumped into
diff --git a/tests/arc/topt_cursor.nim b/tests/arc/topt_cursor.nim
index c3ea4a8d054..40026762cfa 100644
--- a/tests/arc/topt_cursor.nim
+++ b/tests/arc/topt_cursor.nim
@@ -4,21 +4,23 @@ discard """
   nimout: '''--expandArc: main
 
 scope:
-  try:
-    def_cursor x: (string, int) = <D0>
-    block L0:
-      scope:
-        if cond:
-          scope:
-            x = <D1>
-            break L0
+  def_cursor x: (string, int) = <D0>
+  scope:
+    if cond:
       scope:
-        x = <D2>
-    def_cursor _3: (string, int) = x
-    def _4: string = $(arg _3) (raises)
-    echo(arg type(array[0..0, string]), arg _4) (raises)
-  finally:
+        x = <D1>
+        goto [L1]
+  scope:
+    x = <D2>
+  L1:
+  def_cursor _3: (string, int) = x
+  def _4: string = $(arg _3) -> [Resume]
+  echo(arg type(array[0..0, string]), arg _4) -> [L2, Resume]
+  goto [L2, L3]
+  finally (L2):
     =destroy(name _4)
+    continue {L3}
+  L3:
 -- end of expandArc ------------------------
 --expandArc: sio
 
@@ -26,34 +28,36 @@ scope:
   scope:
     def_cursor filename: string = "debug.txt"
     def_cursor _3: string = filename
-    def f: File = open(arg _3, arg fmRead, arg 8000) (raises)
-    try:
+    def f: File = open(arg _3, arg fmRead, arg 8000) -> [Resume]
+    scope:
+      def res: string = newStringOfCap(arg 80)
       scope:
-        try:
-          def res: string = newStringOfCap(arg 80)
-          block L0:
+        while true:
+          scope:
+            def_cursor _6: File = f
+            def :tmp: bool = readLine(arg _6, name res) -> [L1, L2, Resume]
             scope:
-              while true:
+              def_cursor _7: bool = :tmp
+              def _8: bool = not(arg _7)
+              if _8:
                 scope:
-                  def_cursor _6: File = f
-                  def :tmp: bool = readLine(arg _6, name res) (raises)
-                  scope:
-                    def_cursor _7: bool = :tmp
-                    def _8: bool = not(arg _7)
-                    if _8:
-                      scope:
-                        break L0
-                  scope:
-                    scope:
-                      def_cursor x: string = res
-                      def_cursor _10: string = x
-                      echo(arg type(array[0..0, string]), arg _10) (raises)
-        finally:
-          =destroy(name res)
-    finally:
+                  goto [L4]
+            scope:
+              def_cursor x: string = res
+              def_cursor _10: string = x
+              echo(arg type(array[0..0, string]), arg _10) -> [L1, L2, Resume]
+      L4:
+      goto [L1, L2, L5]
+      finally (L1):
+        =destroy(name res)
+        continue {L2}
+    finally (L2):
       scope:
         def_cursor _11: File = f
-        close(arg _11) (raises)
+        close(arg _11) -> [Leave(L2), Resume]
+      continue {L5}
+    L5:
+
 -- end of expandArc ------------------------'''
 """
 
diff --git a/tests/arc/topt_no_cursor.nim b/tests/arc/topt_no_cursor.nim
index 3bc9582764c..0a86e9ccbd5 100644
--- a/tests/arc/topt_no_cursor.nim
+++ b/tests/arc/topt_no_cursor.nim
@@ -13,7 +13,7 @@ doing shady stuff...
   nimout: '''--expandArc: newTarget
 
 scope:
-  def splat: tuple[dir: string, name: string, ext: string] = splitFile(arg path) (raises)
+  def splat: tuple[dir: string, name: string, ext: string] = splitFile(arg path) -> [Resume]
   bind_mut _7: string = splat.0
   def _3: string = move _7
   wasMoved(name _7)
@@ -69,173 +69,195 @@ scope:
 --expandArc: tt
 
 scope:
-  try:
-    def_cursor it: KeyValue = x
-    def _4: seq[int]
-    =copy(name _4, arg it.0)
-    def _5: seq[int]
-    =copy(name _5, arg it.1)
-    def a: (seq[int], seq[int]) = (consume _4, consume _5)
-    def_cursor _6: (seq[int], seq[int]) = a
-    def _7: string = $(arg _6) (raises)
-    echo(arg type(array[0..0, string]), arg _7) (raises)
-  finally:
+  def_cursor it: KeyValue = x
+  def _4: seq[int]
+  =copy(name _4, arg it.0)
+  def _5: seq[int]
+  =copy(name _5, arg it.1)
+  def a: (seq[int], seq[int]) = (consume _4, consume _5)
+  def_cursor _6: (seq[int], seq[int]) = a
+  def _7: string = $(arg _6) -> [L0, Resume]
+  echo(arg type(array[0..0, string]), arg _7) -> [L1, L0, Resume]
+  goto [L1, L0, L2]
+  finally (L1):
     =destroy(name _7)
+    continue {L0}
+  finally (L0):
     =destroy(name a)
+    continue {L2}
+  L2:
 -- end of expandArc ------------------------
 --expandArc: extractConfig
 
 scope:
-  try:
-    def lan_ip: string = ""
+  def lan_ip: string = ""
+  scope:
+    def_cursor a: seq[string] = txt
+    def i: int = 0
+    def_cursor _5: seq[string] = a
+    def L: int = lengthSeq(arg _5)
     scope:
-      def_cursor a: seq[string] = txt
-      def i: int = 0
-      def_cursor _5: seq[string] = a
-      def L: int = lengthSeq(arg _5)
-      block L0:
+      while true:
         scope:
-          while true:
-            scope:
-              def_cursor _7: int = i
-              def :tmp: bool = ltI(arg _7, arg L)
-              scope:
-                def_cursor _8: bool = :tmp
-                def _9: bool = not(arg _8)
-                if _9:
-                  scope:
-                    break L0
+          def_cursor _7: int = i
+          def :tmp: bool = ltI(arg _7, arg L)
+          scope:
+            def_cursor _8: bool = :tmp
+            def _9: bool = not(arg _8)
+            if _9:
               scope:
+                goto [L2]
+          scope:
+            def_cursor _11: int = i
+            def line: lent string = borrow a[_11]
+            def_cursor _13: string = line[]
+            def splitted: seq[string] = split(arg _13, arg " ", arg -1) -> [L3, Resume]
+            scope:
+              def_cursor _14: string = splitted[0]
+              def _15: bool = eqStr(arg _14, arg "opt")
+              if _15:
                 scope:
-                  try:
-                    def_cursor _11: int = i
-                    def line: lent string = borrow a[_11]
-                    def_cursor _13: string = line[]
-                    def splitted: seq[string] = split(arg _13, arg " ", arg -1) (raises)
-                    scope:
-                      def_cursor _14: string = splitted[0]
-                      def _15: bool = eqStr(arg _14, arg "opt")
-                      if _15:
-                        scope:
-                          def_cursor _18: string = splitted[1]
-                          =copy(name lan_ip, arg _18)
-                    def_cursor _16: string = lan_ip
-                    echo(arg type(array[0..0, string]), arg _16) (raises)
-                    def_cursor _17: string = splitted[1]
-                    echo(arg type(array[0..0, string]), arg _17) (raises)
-                  finally:
-                    =destroy(name splitted)
-                i = addI(arg i, arg 1) (raises)
-  finally:
+                  def_cursor _18: string = splitted[1]
+                  =copy(name lan_ip, arg _18)
+            def_cursor _16: string = lan_ip
+            echo(arg type(array[0..0, string]), arg _16) -> [L4, L3, Resume]
+            def_cursor _17: string = splitted[1]
+            echo(arg type(array[0..0, string]), arg _17) -> [L4, L3, Resume]
+            goto [L4, L6]
+            finally (L4):
+              =destroy(name splitted)
+              continue {L3, L6}
+            L6:
+          i = addI(arg i, arg 1) -> [L3, Resume]
+    L2:
+  goto [L3, L7]
+  finally (L3):
     =destroy(name lan_ip)
+    continue {L7}
+  L7:
 --expandArc: mergeShadowScope
 
 scope:
-  try:
-    def shadowScope: Scope
-    =copy(name shadowScope, arg c[].currentScope)
-    rawCloseScope(arg c) (raises)
+  def shadowScope: Scope
+  =copy(name shadowScope, arg c[].currentScope)
+  rawCloseScope(arg c) -> [L0, Resume]
+  scope:
+    def_cursor _4: Scope = shadowScope
+    def_cursor a: seq[Symbol] = _4[].symbols
+    def i: int = 0
+    def_cursor _7: seq[Symbol] = a
+    def L: int = lengthSeq(arg _7)
     scope:
-      def_cursor _4: Scope = shadowScope
-      def_cursor a: seq[Symbol] = _4[].symbols
-      def i: int = 0
-      def_cursor _7: seq[Symbol] = a
-      def L: int = lengthSeq(arg _7)
-      block L0:
+      while true:
         scope:
-          while true:
-            scope:
-              def_cursor _9: int = i
-              def :tmp: bool = ltI(arg _9, arg L)
-              scope:
-                def_cursor _10: bool = :tmp
-                def _11: bool = not(arg _10)
-                if _11:
-                  scope:
-                    break L0
+          def_cursor _9: int = i
+          def :tmp: bool = ltI(arg _9, arg L)
+          scope:
+            def_cursor _10: bool = :tmp
+            def _11: bool = not(arg _10)
+            if _11:
               scope:
-                scope:
-                  def_cursor _13: int = i
-                  def sym: lent Symbol = borrow a[_13]
-                  def _14: Symbol
-                  =copy(name _14, arg sym[])
-                  addInterfaceDecl(arg c, consume _14) (raises)
-                i = addI(arg i, arg 1) (raises)
-  finally:
+                goto [L3]
+          scope:
+            def_cursor _13: int = i
+            def sym: lent Symbol = borrow a[_13]
+            def _14: Symbol
+            =copy(name _14, arg sym[])
+            addInterfaceDecl(arg c, consume _14) -> [L4, L0, Resume]
+            goto [L4, L5]
+            finally (L4):
+              continue {L0, L5}
+            L5:
+          i = addI(arg i, arg 1) -> [L0, Resume]
+    L3:
+  goto [L0, L6]
+  finally (L0):
     =destroy(name shadowScope)
+    continue {L6}
+  L6:
 -- end of expandArc ------------------------
 --expandArc: treturn
 
 scope:
-  try:
-    def x: sink string
-    scope:
-      def_cursor _2: sink string = x
-      def _3: int = lengthStr(arg _2)
-      def _4: bool = eqI(arg _3, arg 2)
-      if _4:
-        scope:
-          result := move x
-          wasMoved(name x)
-          return
-    def_cursor _5: sink string = x
-    def _6: int = lengthStr(arg _5)
-    def _7: string = $(arg _6) (raises)
-    echo(arg type(array[0..0, string]), arg _7) (raises)
-  finally:
+  def x: sink string
+  scope:
+    def_cursor _2: sink string = x
+    def _3: int = lengthStr(arg _2)
+    def _4: bool = eqI(arg _3, arg 2)
+    if _4:
+      scope:
+        result := move x
+        wasMoved(name x)
+        goto [L1, L2]
+  def_cursor _5: sink string = x
+  def _6: int = lengthStr(arg _5)
+  def _7: string = $(arg _6) -> [L1, Resume]
+  echo(arg type(array[0..0, string]), arg _7) -> [L3, L1, Resume]
+  goto [L3, L1, L4]
+  finally (L3):
     =destroy(name _7)
+    continue {L1}
+  finally (L1):
     =destroy(name x)
+    continue {L2, L4}
+  L4:
+L2:
 
 -- end of expandArc ------------------------
 --expandArc: check
 
 scope:
-  try:
-    def_cursor _2: string = this[].value
-    this[].isValid = fileExists(arg _2) (raises)
-    def _4: tuple[dir: string, front: string]
-    block L0:
+  def_cursor _2: string = this[].value
+  this[].isValid = fileExists(arg _2) -> [Resume]
+  def _4: tuple[dir: string, front: string]
+  scope:
+    def_cursor _5: string = this[].value
+    def _6: bool = dirExists(arg _5) -> [Resume]
+    if _6:
       scope:
-        def_cursor _5: string = this[].value
-        def _6: bool = dirExists(arg _5) (raises)
-        if _6:
-          scope:
-            def _7: string
-            =copy(name _7, arg this[].value)
-            _4 := (consume _7, consume "")
-            break L0
+        def _7: string
+        =copy(name _7, arg this[].value)
+        _4 := (consume _7, consume "")
+        goto [L1]
+  scope:
+    def_cursor _8: string = this[].value
+    def _9: string = parentDir(arg _8) -> [Resume]
+    def _10: string
+    =copy(name _10, arg this[].value)
+    def _11: tuple[head: string, tail: string] = splitPath(consume _10) -> [L2, Resume]
+    bind_mut _19: string = _11.1
+    def _12: string = move _19
+    wasMoved(name _19)
+    _4 := (consume _9, consume _12)
+    wasMoved(name _9)
+    =destroy(name _11)
+    goto [L2, L3]
+    finally (L2):
+      =destroy(name _9)
+      continue {L3}
+    L3:
+  L1:
+  def par: tuple[dir: string, front: string] = move _4
+  scope:
+    def_cursor _13: string = par.0
+    def _14: bool = dirExists(arg _13) -> [L4, Resume]
+    if _14:
       scope:
-        try:
-          def_cursor _8: string = this[].value
-          def _9: string = parentDir(arg _8) (raises)
-          def _10: string
-          =copy(name _10, arg this[].value)
-          def _11: tuple[head: string, tail: string] = splitPath(consume _10) (raises)
-          bind_mut _19: string = _11.1
-          def _12: string = move _19
-          wasMoved(name _19)
-          _4 := (consume _9, consume _12)
-          wasMoved(name _9)
-        finally:
-          =destroy(name _11)
-          =destroy(name _9)
-    def par: tuple[dir: string, front: string] = move _4
-    block L1:
-      scope:
-        def_cursor _13: string = par.0
-        def _14: bool = dirExists(arg _13) (raises)
-        if _14:
-          scope:
-            def_cursor _15: string = par.0
-            def_cursor _16: string = par.1
-            def _17: seq[string] = getSubDirs(arg _15, arg _16) (raises)
-            =sink(name this[].matchDirs, arg _17)
-            break L1
-      scope:
-        def _18: seq[string] = @[]
-        =sink(name this[].matchDirs, arg _18)
-  finally:
+        def_cursor _15: string = par.0
+        def_cursor _16: string = par.1
+        def _17: seq[string] = getSubDirs(arg _15, arg _16) -> [L4, Resume]
+        =sink(name this[].matchDirs, arg _17)
+        goto [L6]
+  scope:
+    def _18: seq[string] = @[]
+    =sink(name this[].matchDirs, arg _18)
+  L6:
+  goto [L4, L7]
+  finally (L4):
     =destroy(name par)
+    continue {L7}
+  L7:
+
 -- end of expandArc ------------------------'''
 """
 
diff --git a/tests/arc/topt_refcursors.nim b/tests/arc/topt_refcursors.nim
index 6544c1ca6dc..4ad516800f4 100644
--- a/tests/arc/topt_refcursors.nim
+++ b/tests/arc/topt_refcursors.nim
@@ -5,46 +5,44 @@ discard """
 
 scope:
   def_cursor it: Node = root
-  block L0:
-    scope:
-      while true:
+  scope:
+    while true:
+      scope:
+        def_cursor _4: Node = it
+        def _5: bool = eqRef(arg _4, arg nil)
+        def :tmp: bool = not(arg _5)
         scope:
-          def_cursor _4: Node = it
-          def _5: bool = eqRef(arg _4, arg nil)
-          def :tmp: bool = not(arg _5)
-          scope:
-            def_cursor _6: bool = :tmp
-            def _7: bool = not(arg _6)
-            if _7:
-              scope:
-                break L0
-          scope:
-            def_cursor _8: Node = it
-            def_cursor _9: string = _8[].s
-            echo(arg type(array[0..0, string]), arg _9) (raises)
-            def_cursor _10: Node = it
-            it = _10[].ri
+          def_cursor _6: bool = :tmp
+          def _7: bool = not(arg _6)
+          if _7:
+            scope:
+              goto [L2]
+        def_cursor _8: Node = it
+        def_cursor _9: string = _8[].s
+        echo(arg type(array[0..0, string]), arg _9) -> [Resume]
+        def_cursor _10: Node = it
+        it = _10[].ri
+  L2:
   def_cursor jt: Node = root
-  block L1:
-    scope:
-      while true:
+  scope:
+    while true:
+      scope:
+        def_cursor _13: Node = jt
+        def _14: bool = eqRef(arg _13, arg nil)
+        def :tmp: bool = not(arg _14)
         scope:
-          def_cursor _13: Node = jt
-          def _14: bool = eqRef(arg _13, arg nil)
-          def :tmp: bool = not(arg _14)
-          scope:
-            def_cursor _15: bool = :tmp
-            def _16: bool = not(arg _15)
-            if _16:
-              scope:
-                break L1
-          scope:
-            def_cursor _18: Node = jt
-            def_cursor ri: Node = _18[].ri
-            def_cursor _19: Node = jt
-            def_cursor _20: string = _19[].s
-            echo(arg type(array[0..0, string]), arg _20) (raises)
-            jt = ri
+          def_cursor _15: bool = :tmp
+          def _16: bool = not(arg _15)
+          if _16:
+            scope:
+              goto [L5]
+        def_cursor _18: Node = jt
+        def_cursor ri: Node = _18[].ri
+        def_cursor _19: Node = jt
+        def_cursor _20: string = _19[].s
+        echo(arg type(array[0..0, string]), arg _20) -> [Resume]
+        jt = ri
+  L5:
 -- end of expandArc ------------------------'''
 """
 
diff --git a/tests/arc/topt_wasmoved_destroy_pairs.nim b/tests/arc/topt_wasmoved_destroy_pairs.nim
index 42587fe13a7..4475c61e52f 100644
--- a/tests/arc/topt_wasmoved_destroy_pairs.nim
+++ b/tests/arc/topt_wasmoved_destroy_pairs.nim
@@ -6,93 +6,103 @@ discard """
 scope:
   def a: seq[seq[int]]
   def b: seq[seq[int]]
-  def x: seq[int] = f() (raises)
-  block L0:
-    scope:
-      if cond:
-        scope:
-          def _5: seq[int] = move x
-          add(name a, consume _5)
-          break L0
-    scope:
-      def _6: seq[int] = move x
-      add(name b, consume _6)
-  =destroy(name b)
-  =destroy(name a)
+  def x: seq[int] = f() -> [L0, Resume]
+  scope:
+    if cond:
+      scope:
+        def _5: seq[int] = move x
+        add(name a, consume _5)
+        goto [L2]
+  scope:
+    def _6: seq[int] = move x
+    add(name b, consume _6)
+  goto [L0, L3]
+  finally (L0):
+    =destroy(name b)
+    =destroy(name a)
+    continue {L3}
+  L3:
 -- end of expandArc ------------------------
 --expandArc: tfor
 
 scope:
-  try:
-    def a: seq[seq[int]]
-    def b: seq[seq[int]]
-    def x: seq[int] = f() (raises)
+  def a: seq[seq[int]]
+  def b: seq[seq[int]]
+  def x: seq[int] = f() -> [L0, Resume]
+  scope:
+    def a: int = 0
+    def b: int = 4
+    def i: int = copy a
     scope:
-      def a: int = 0
-      def b: int = 4
-      def i: int = copy a
-      block L0:
+      while true:
         scope:
-          while true:
-            scope:
-              def_cursor _9: int = i
-              def :tmp: bool = ltI(arg _9, arg b)
-              scope:
-                def_cursor _10: bool = :tmp
-                def _11: bool = not(arg _10)
-                if _11:
-                  scope:
-                    break L0
+          def_cursor _9: int = i
+          def :tmp: bool = ltI(arg _9, arg b)
+          scope:
+            def_cursor _10: bool = :tmp
+            def _11: bool = not(arg _10)
+            if _11:
               scope:
-                scope:
-                  def_cursor i: int = i
-                  scope:
-                    def _13: bool = eqI(arg i, arg 2)
-                    if _13:
-                      scope:
-                        return
-                  def _14: seq[int]
-                  =copy(name _14, arg x)
-                  add(name a, consume _14)
-                i = addI(arg i, arg 1) (raises)
-    block L1:
-      scope:
-        if cond:
+                goto [L3]
           scope:
-            def _15: seq[int] = move x
-            wasMoved(name x)
-            add(name a, consume _15)
-            break L1
+            def_cursor i: int = i
+            scope:
+              def _13: bool = eqI(arg i, arg 2)
+              if _13:
+                scope:
+                  goto [L5, L0, L6]
+            def _14: seq[int]
+            =copy(name _14, arg x)
+            add(name a, consume _14)
+          i = addI(arg i, arg 1) -> [L5, L0, Resume]
+    L3:
+  scope:
+    if cond:
       scope:
-        def _16: seq[int] = move x
+        def _15: seq[int] = move x
         wasMoved(name x)
-        add(name b, consume _16)
-  finally:
+        add(name a, consume _15)
+        goto [L8]
+  scope:
+    def _16: seq[int] = move x
+    wasMoved(name x)
+    add(name b, consume _16)
+  L8:
+  goto [L5, L0, L9]
+  finally (L5):
     =destroy(name x)
+    continue {L0}
+  finally (L0):
     =destroy(name b)
     =destroy(name a)
+    continue {L6, L9}
+  L9:
+L6:
 -- end of expandArc ------------------------
 --expandArc: texit
 scope:
-  try:
-    def str: string
-    def x: string = boolToStr(arg cond)
-    scope:
-      if cond:
-        scope:
-          return
-    def _4: string = boolToStr(arg cond)
-    str := move _4
-    scope:
-      def _5: bool = not(arg cond)
-      if _5:
-        scope:
-          result := move str
-          wasMoved(name str)
-          return
-  finally:
+  def str: string
+  def x: string = boolToStr(arg cond)
+  scope:
+    if cond:
+      scope:
+        goto [L1, L2]
+  def _4: string = boolToStr(arg cond)
+  str := move _4
+  scope:
+    def _5: bool = not(arg cond)
+    if _5:
+      scope:
+        result := move str
+        wasMoved(name str)
+        goto [L1, L2]
+  goto [L1, L4]
+  finally (L1):
     =destroy(name x)
     =destroy(name str)
+    continue {L2, L4}
+  L4:
+L2:
 -- end of expandArc ------------------------'''
 """
 
diff --git a/tests/compiler/tmir_exec.nim b/tests/compiler/tmir_exec.nim
index d1f82019a7a..92dcaffb91f 100644
--- a/tests/compiler/tmir_exec.nim
+++ b/tests/compiler/tmir_exec.nim
@@ -141,6 +141,7 @@ func `==`(a, b: Instr): bool =
 
   result =
     case a.op
+    of opNone:                 true
     of opFork, opGoto, opLoop: a.dest == b.dest
     of opJoin:                 a.id == b.id
     of DataFlowOps:            a.node == b.node
@@ -165,37 +166,13 @@ func `==`(a, b: DataFlowGraph): bool =
         a.map[an.dest] == b.map[bn.dest]
       of opJoin:
         a.map[an.id] == b.map[bn.id]
-      of DataFlowOps:
+      of opNone, DataFlowOps:
         true
 
     if not result:
       return
 
 
-# -------------- CFG creation tests
-
-block:
-  # test CFG creation for ``while true: break``
-  let tree = @[
-    MirNode(kind: mnkStmtList),
-    MirNode(kind: mnkBlock, label: LabelId(0)),
-    MirNode(kind: mnkRepeat),
-    MirNode(kind: mnkBreak, label: LabelId(0)),
-    MirNode(kind: mnkEnd, start: mnkRepeat),
-    MirNode(kind: mnkEnd, start: mnkBlock),
-    MirNode(kind: mnkReturn),
-    MirNode(kind: mnkEnd, start: mnkStmtList)]
-  let cfg = computeDfg(tree)
-
-  doAssert cfg == parseCfg("""
-    0: join -> 2
-    goto 1  -> 3
-    loop 0  -> 4
-    1: join -> 5
-    goto 2  -> 6
-    2: join -> 8
-  """)
-
 # -------------- test for the traversal routines
 
 # TODO: also test forward traversal and backward traversal from all exits
diff --git a/tests/compiler/tmir_trees.nim b/tests/compiler/tmir_trees.nim
index 74456a2bc2c..3b91e176ad5 100644
--- a/tests/compiler/tmir_trees.nim
+++ b/tests/compiler/tmir_trees.nim
@@ -6,5 +6,5 @@ discard """
 import compiler/mir/mirtrees
 
 block last_sibling:
-  let tree = @[MirNode(kind: mnkStmtList), MirNode(kind: mnkEnd)]
+  let tree = @[MirNode(kind: mnkScope), MirNode(kind: mnkEnd)]
   doAssert sibling(tree, NodePosition 0) == NodePosition(tree.len)
diff --git a/tests/compiler/ttreechangesets.nim b/tests/compiler/ttreechangesets.nim
index 30043cbff9b..7889270e112 100644
--- a/tests/compiler/ttreechangesets.nim
+++ b/tests/compiler/ttreechangesets.nim
@@ -110,7 +110,7 @@ block insert_shared_start:
   # independent of the order in which they're recorded
   var bu: MirBuilder
   bu.add temp(0)
-  bu.subTree mnkStmtList: discard
+  bu.subTree mnkScope: discard
   bu.add temp(3)
   var (tree, _) = finish(bu)
 
@@ -136,7 +136,7 @@ block insert_shared_end:
   # *second*, independent of the order in which they're recorded
   var bu: MirBuilder
   bu.add temp(0)
-  bu.subTree mnkStmtList: discard
+  bu.subTree mnkScope: discard
   bu.add temp(3)
   var (tree, _) = finish(bu)
 
diff --git a/tests/lang_objects/destructor/tdestruction_in_unreachable.nim b/tests/lang_objects/destructor/tdestruction_in_unreachable.nim
index ab12209fb0e..8ab5348b415 100644
--- a/tests/lang_objects/destructor/tdestruction_in_unreachable.nim
+++ b/tests/lang_objects/destructor/tdestruction_in_unreachable.nim
@@ -30,9 +30,7 @@ proc test(cond: bool) =
 
 test(true)
 
-# XXX: wasDestroy must be false, but it currently isn't. Testing the inverse
-#      makes sure that the test at least compiles
-doAssert wasDestroyed, "the behaviour is correct now"
+doAssert not wasDestroyed
 
 # ------------------------------
 # test without if/else statement
@@ -52,5 +50,4 @@ proc test2(cond: bool) =
   discard o
 
 test2(true)
-# XXX: same comment as for the assertion above
-doAssert wasDestroyed, "the behaviour is correct now"
\ No newline at end of file
+doAssert not wasDestroyed
diff --git a/tests/lang_objects/destructor/timplicit_move_bug.nim b/tests/lang_objects/destructor/timplicit_move_bug.nim
new file mode 100644
index 00000000000..a4c63fb426e
--- /dev/null
+++ b/tests/lang_objects/destructor/timplicit_move_bug.nim
@@ -0,0 +1,37 @@
+discard """
+  description: '''
+    Regression test for a location's value being moved even though it's used
+    afterwards.
+    Refer to https://github.com/nim-works/nimskull/issues/1303
+  '''
+  targets: c js vm
+"""
+
+type Object = object
+  has: bool
+
+var wasDestroyed = false
+
+proc `=destroy`(x: var Object) =
+  if x.has:
+    inc wasDestroyed
+
+proc f_sink(x: sink Object) =
+  # disarm the destructor:
+  x.has = false
+
+proc test() =
+  var o = Object(has: true)
+  try:
+    try:
+      f_sink(o) # `o` must not be sunken
+      raise CatchableError.newException("")
+    except IOError:
+      # omitting the inner try made the code work as expected
+      discard "not reached"
+  except CatchableError:
+    doAssert not wasDestroyed
+    discard o # use `o`, preventing it from being moved earlier
+
+test()
+doAssert wasDestroyed
diff --git a/tests/lang_objects/destructor/tv2_cast.nim b/tests/lang_objects/destructor/tv2_cast.nim
index c54fdbad387..65e884caa7b 100644
--- a/tests/lang_objects/destructor/tv2_cast.nim
+++ b/tests/lang_objects/destructor/tv2_cast.nim
@@ -6,64 +6,72 @@ destroying O1'''
   cmd: '''nim c --gc:arc --expandArc:main --expandArc:main1 --expandArc:main2 --expandArc:main3 --hints:off --assertions:off $file'''
   nimout: '''--expandArc: main
 scope:
-  try:
-    def _2: string = newString(arg 100)
-    def_cursor _3: seq[byte] = cast _2
-    def _4: openArray[byte] = toOpenArray _3
-    def _5: seq[byte] = encode(arg _4) (raises)
-    def_cursor _6: string = cast _5
-    def data: string
-    =copy(name data, arg _6)
-  finally:
-    =destroy(name data)
-    =destroy(name _5)
+  def _2: string = newString(arg 100)
+  def_cursor _3: seq[byte] = cast _2
+  def _4: openArray[byte] = toOpenArray _3
+  def _5: seq[byte] = encode(arg _4) -> [L0, Resume]
+  def_cursor _6: string = cast _5
+  def data: string
+  =copy(name data, arg _6)
+  =destroy(name data)
+  =destroy(name _5)
+  goto [L0, L1]
+  finally (L0):
     =destroy(name _2)
+    continue {L1}
+  L1:
 -- end of expandArc ------------------------
 --expandArc: main1
 scope:
-  try:
-    def s: string = newString(arg 100)
-    def_cursor _3: string = s
-    def _4: int = lengthStr(arg _3)
-    def _5: int = subI(arg _4, arg 1) (raises)
-    chckBounds(arg s, arg 0, arg _5) (raises)
-    def _6: openArray[byte] = toOpenArray s, 0, _5
-    def _7: seq[byte] = encode(arg _6) (raises)
-    def_cursor _8: string = cast _7
-    def data: string
-    =copy(name data, arg _8)
-  finally:
-    =destroy(name data)
-    =destroy(name _7)
+  def s: string = newString(arg 100)
+  def_cursor _3: string = s
+  def _4: int = lengthStr(arg _3)
+  def _5: int = subI(arg _4, arg 1) -> [L0, Resume]
+  chckBounds(arg s, arg 0, arg _5) -> [L0, Resume]
+  def _6: openArray[byte] = toOpenArray s, 0, _5
+  def _7: seq[byte] = encode(arg _6) -> [L0, Resume]
+  def_cursor _8: string = cast _7
+  def data: string
+  =copy(name data, arg _8)
+  =destroy(name data)
+  =destroy(name _7)
+  goto [L0, L1]
+  finally (L0):
     =destroy(name s)
+    continue {L1}
+  L1:
 -- end of expandArc ------------------------
 --expandArc: main2
 scope:
-  try:
-    def s: seq[byte] = newSeq(arg 100) (raises)
-    def _3: openArray[byte] = toOpenArray s
-    def _4: seq[byte] = encode(arg _3) (raises)
-    def_cursor _5: string = cast _4
-    def data: string
-    =copy(name data, arg _5)
-  finally:
-    =destroy(name data)
-    =destroy(name _4)
+  def s: seq[byte] = newSeq(arg 100) -> [Resume]
+  def _3: openArray[byte] = toOpenArray s
+  def _4: seq[byte] = encode(arg _3) -> [L0, Resume]
+  def_cursor _5: string = cast _4
+  def data: string
+  =copy(name data, arg _5)
+  =destroy(name data)
+  =destroy(name _4)
+  goto [L0, L1]
+  finally (L0):
     =destroy(name s)
+    continue {L1}
+  L1:
 -- end of expandArc ------------------------
 --expandArc: main3
 scope:
-  try:
-    def _2: seq[byte] = newSeq(arg 100) (raises)
-    def _3: openArray[byte] = toOpenArray _2
-    def _4: seq[byte] = encode(arg _3) (raises)
-    def_cursor _5: string = cast _4
-    def data: string
-    =copy(name data, arg _5)
-  finally:
-    =destroy(name data)
-    =destroy(name _4)
+  def _2: seq[byte] = newSeq(arg 100) -> [Resume]
+  def _3: openArray[byte] = toOpenArray _2
+  def _4: seq[byte] = encode(arg _3) -> [L0, Resume]
+  def_cursor _5: string = cast _4
+  def data: string
+  =copy(name data, arg _5)
+  =destroy(name data)
+  =destroy(name _4)
+  goto [L0, L1]
+  finally (L0):
     =destroy(name _2)
+    continue {L1}
+  L1:
 -- end of expandArc ------------------------'''
 """
 
diff --git a/tests/misc/tdont_fold_procedure_cast.nim b/tests/misc/tdont_fold_procedure_cast.nim
index e34028e0ef0..8d03ddbee2f 100644
--- a/tests/misc/tdont_fold_procedure_cast.nim
+++ b/tests/misc/tdont_fold_procedure_cast.nim
@@ -11,7 +11,7 @@ scope:
   def_cursor _2: proc (x: float){.nimcall.} = cast other
   def p: proc (x: float){.nimcall.} = copy _2
   def_cursor _3: proc (x: int){.nimcall.} = cast p
-  _3(arg 1) (raises)
+  _3(arg 1) -> [Resume]
 -- end of expandArc ------------------------
   '''
   output: "1"

From bda1ace299ecda352778c2874512b3f1184d09f9 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sun, 26 May 2024 20:27:23 +0200
Subject: [PATCH 101/169] cgen: better code-gen for `seq.len` (#1321)

## Summary

Don't store the result of a `seq.len` in an additional temporary. An
optimizing C compiler can easily eliminate such temporaries, but doing
it on the NimSkull side reduces the amount of work for the C compiler.

## Details

* the temporary is a leftover from when argument expression purity
  wasn't guaranteed
* the `cgen.getIntTemp` procedure is now obsolete and thus removed
---
 compiler/backend/ccgexprs.nim | 11 +----------
 compiler/backend/cgen.nim     |  9 ---------
 2 files changed, 1 insertion(+), 19 deletions(-)

diff --git a/compiler/backend/ccgexprs.nim b/compiler/backend/ccgexprs.nim
index d1b55649f94..1c1f4b90cbf 100644
--- a/compiler/backend/ccgexprs.nim
+++ b/compiler/backend/ccgexprs.nim
@@ -1118,21 +1118,12 @@ proc genArrayLen(p: BProc, e: CgNode, d: var TLoc, op: TMagic) =
   of tyCstring:
     if op == mHigh: unaryExpr(p, e, d, "($1 ? (#nimCStrLen($1)-1) : -1)")
     else: unaryExpr(p, e, d, "($1 ? #nimCStrLen($1) : 0)")
-  of tyString:
+  of tyString, tySequence:
     var a: TLoc
     initLocExpr(p, e[1], a)
     var x = lenExpr(p, a)
     if op == mHigh: x = "($1-1)" % [x]
     putIntoDest(p, d, e, x)
-  of tySequence:
-    # we go through a temporary here because people write bullshit code.
-    var a, tmp: TLoc
-    initLocExpr(p, e[1], a)
-    getIntTemp(p, tmp)
-    var x = lenExpr(p, a)
-    if op == mHigh: x = "($1-1)" % [x]
-    lineCg(p, cpsStmts, "$1 = $2;$n", [tmp.r, x])
-    putIntoDest(p, d, e, tmp.r)
   of tyArray:
     # YYY: length(sideeffect) is optimized away incorrectly?
     if op == mHigh: putIntoDest(p, d, e, rope(lastOrd(p.config, typ)))
diff --git a/compiler/backend/cgen.nim b/compiler/backend/cgen.nim
index b7440c80ba5..02627a31d1e 100644
--- a/compiler/backend/cgen.nim
+++ b/compiler/backend/cgen.nim
@@ -484,15 +484,6 @@ proc getTemp(p: BProc, t: PType, result: var TLoc) =
         echo "ENORMOUS TEMPORARY! ", p.config $ p.lastLineInfo
       writeStackTrace()
 
-proc getIntTemp(p: BProc, result: var TLoc) =
-  inc(p.labels)
-  result.r = "T" & rope(p.labels) & "_"
-  linefmt(p, cpsLocals, "NI $1;$n", [result.r])
-  result.k = locTemp
-  result.storage = OnStack
-  result.lode = lodeTyp getSysType(p.module.g.graph, unknownLineInfo, tyInt)
-  result.flags = {}
-
 proc localVarDecl(p: BProc; n: CgNode, decl: Local): Rope =
   let loc = initLoc(locLocalVar, n, mangleLocalName(p, decl.name, n.local),
                     OnStack)

From 06eb867bc32dd5c194fca5901b0364cd4a2f4aaf Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sun, 26 May 2024 20:47:38 +0200
Subject: [PATCH 102/169] lower float overflow checks with MIR pass (#1322)

## Summary

Lower checked float arithmetic operations with an MIR pass, instead
of as part of C code generation. This is a pure refactoring, with the
goal of shrinking down the C code generator.

## Details

* the checked float arithmetic operations are turned into an unchecked
  operation + infinity check (replicating what `cgen` did)
* the lowering in `cgen` for float arithmetic is removed
---
 compiler/backend/ccgexprs.nim | 15 --------------
 compiler/mir/rtchecks.nim     | 39 +++++++++++++++++++++++++++++++++++
 2 files changed, 39 insertions(+), 15 deletions(-)

diff --git a/compiler/backend/ccgexprs.nim b/compiler/backend/ccgexprs.nim
index 1c1f4b90cbf..c78e16eb9fc 100644
--- a/compiler/backend/ccgexprs.nim
+++ b/compiler/backend/ccgexprs.nim
@@ -1377,20 +1377,6 @@ proc genStrEquals(p: BProc, e: CgNode, d: var TLoc) =
   else:
     binaryExpr(p, e, d, "#eqStrings($1, $2)")
 
-proc binaryFloatArith(p: BProc, e: CgNode, d: var TLoc, m: TMagic) =
-  if true:
-    const opr: array[mAddF64..mDivF64, string] = ["+", "-", "*", "/"]
-    var a, b: TLoc
-    assert(e[1].typ != nil)
-    assert(e[2].typ != nil)
-    initLocExpr(p, e[1], a)
-    initLocExpr(p, e[2], b)
-    putIntoDest(p, d, e, ropecg(p.module, "(($4)($2) $1 ($4)($3))",
-                              [opr[m], rdLoc(a), rdLoc(b),
-                              getSimpleTypeDesc(p.module, e[1].typ)]))
-    linefmt(p, cpsStmts, "if ($1 != 0.0 && $1*0.5 == $1) { #raiseFloatOverflow($1); $2}$n",
-            [rdLoc(d), raiseInstr(p, e.exit)])
-
 proc skipAddr(n: CgNode): CgNode =
   if n.kind == cnkHiddenAddr: n.operand
   else:                       n
@@ -1452,7 +1438,6 @@ proc genMagicExpr(p: BProc, e: CgNode, d: var TLoc, op: TMagic) =
   case op
   of mNot..mUnaryPlusF64: unaryArith(p, e, e[1], d, op)
   of mUnaryMinusI, mUnaryMinusI64: unaryArithOverflow(p, e, d, op)
-  of mAddF64..mDivF64: binaryFloatArith(p, e, d, op)
   of mShrI..mXor: binaryArith(p, e, e[1], e[2], d, op)
   of mEqProc: genEqProc(p, e, d)
   of mAddI..mPred: binaryArithOverflow(p, e, d, op)
diff --git a/compiler/mir/rtchecks.nim b/compiler/mir/rtchecks.nim
index 7268ef3a0f7..67a87127f39 100644
--- a/compiler/mir/rtchecks.nim
+++ b/compiler/mir/rtchecks.nim
@@ -293,6 +293,37 @@ proc emitObjectCheck(tree; call; graph; env; bu) =
     bu.emitCall(tree, call, env.addCompilerProc(graph, "raiseObjectConversionError")):
       discard
 
+proc emitCheckedFloatOp(tree; call; graph; env; bu): Value =
+  ## Emits the lowered version of a checked float arithmetic operation.
+  ## Checked means that the result is tested for infinity.
+  let typ = tree[call].typ
+  const Map = [mAddF64: mnkAdd, mSubF64: mnkSub, mMulF64: mnkMul, mDivF64: mnkDiv]
+  result = bu.wrapTemp typ:
+    bu.subTree Map[tree[call + 1].magic], typ:
+      bu.emitFrom(tree, NodePosition tree.argument(call, 0))
+      bu.emitFrom(tree, NodePosition tree.argument(call, 1))
+
+  # test for infinity by multiplying the result with 0.5 and comparing it
+  # against the original result. If equal and the result was not 0, the result
+  # must be +inf or -inf
+  let cond = bu.wrapTemp BoolType:
+    bu.buildMagicCall mEqF64, BoolType:
+      bu.emitByVal result
+      bu.emitByVal literal(mnkFloatLit, env.getOrIncl(0.0), typ)
+  bu.buildIfNot cond:
+    let cmp = bu.wrapTemp typ:
+      bu.subTree mnkMul, typ:
+        bu.use result
+        bu.use literal(mnkFloatLit, env.getOrIncl(0.5), typ)
+    bu.subTree mnkAsgn:
+      bu.use cond
+      bu.buildMagicCall mEqF64, BoolType:
+        bu.emitByVal result
+        bu.emitByVal cmp
+    bu.buildIf cond:
+      bu.emitCall(tree, call, env.addCompilerProc(graph, "raiseFloatOverflow")):
+        bu.emitByVal result
+
 proc lowerChecks*(body; graph; env; changes: var Changeset) =
   ## Lowers all magic calls implementing the run-time checks.
   template tree: MirTree = body.code
@@ -324,5 +355,13 @@ proc lowerChecks*(body; graph; env; changes: var Changeset) =
         let call = tree.parent(i)
         changes.replaceMulti(tree, tree.parent(call), bu):
           emitObjectCheck(tree, call, graph, env, bu)
+
+      of mAddF64, mSubF64, mMulF64, mDivF64:
+        let call = tree.parent(i)
+        var tmp: Value
+        changes.insert(tree, tree.parent(call), call, bu):
+          tmp = emitCheckedFloatOp(tree, call, graph, env, bu)
+        changes.replaceMulti(tree, call, bu):
+          bu.use tmp
       else:
         discard "not relevant"

From e807f56c66a6e65213157d9dba6a39fda8d06513 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Tue, 28 May 2024 03:04:36 +0200
Subject: [PATCH 103/169] improve code generation for `@[...]` (#1323)

## Summary

Don't use an intermediate temporary for the array construction but
instead move the items into the constructed seq directly. All backends
are affected.

## Details

`mirgen` now translates a `@[...]` expression into a `mnkSeqConstr`
tree rather than:
```
def _1 = [...] # array construction
def _2 = arrToSeq(consume _1)
```
This gets rid of the unnecessary temporary and shallow array copy.

Handling of `mArrToSeq` in the code generators is also improved /
cleaned up:
* the handling of `cnkArrayConstr` operands is removed (it's a leftover
  from before the MIR rework)
* `jsgen`: the operand to `mArrToSeq` call is guaranteed to be owned,
  so no extra copy is required
* `cgen`: the `TLoc` passed to `genArrToSeq` is always a non-empty
  loc, so the `if d.k == locNone` check is unnecessary and thus removed
---
 compiler/backend/ccgexprs.nim |  7 -------
 compiler/backend/jsgen.nim    | 11 +++--------
 compiler/mir/mirgen.nim       |  8 ++++++++
 tests/arc/topt_no_cursor.nim  | 21 ++++++++++-----------
 4 files changed, 21 insertions(+), 26 deletions(-)

diff --git a/compiler/backend/ccgexprs.nim b/compiler/backend/ccgexprs.nim
index c78e16eb9fc..a71c040cc65 100644
--- a/compiler/backend/ccgexprs.nim
+++ b/compiler/backend/ccgexprs.nim
@@ -991,13 +991,6 @@ proc genSeqConstr(p: BProc, n: CgNode, d: var TLoc) =
 
 proc genArrToSeq(p: BProc, n: CgNode, d: var TLoc) =
   var elem, a, arr: TLoc
-  if n[1].kind == cnkArrayConstr:
-    # XXX: dead code, but kept as a reminder
-    n[1].typ = n.typ
-    genSeqConstr(p, n[1], d)
-    return
-  if d.k == locNone:
-    getTemp(p, n.typ, d)
   # generate call to newSeq before adding the elements per hand:
   let L = toInt(lengthOrd(p.config, n[1].typ))
   block:
diff --git a/compiler/backend/jsgen.nim b/compiler/backend/jsgen.nim
index ad6497fb984..a30ba00aef8 100644
--- a/compiler/backend/jsgen.nim
+++ b/compiler/backend/jsgen.nim
@@ -1829,14 +1829,9 @@ proc genMagic(p: PProc, n: CgNode, r: var TCompRes) =
   of mNew: genNew(p, n, r)
   of mChr: gen(p, n[1], r)
   of mArrToSeq:
-    # only array literals doesn't need copy
-    if n[1].kind == cnkArrayConstr:
-      genJSArrayConstr(p, n[1], r)
-    else:
-      var x: TCompRes
-      gen(p, n[1], x)
-      useMagic(p, "nimCopy")
-      r.res = "nimCopy(null, $1, $2)" % [x.rdLoc, genTypeInfo(p, n.typ)]
+    # the argument is guaranteed to be moveable, it can simply be assigned to
+    # the destination
+    gen(p, n[1], r)
   of mDestroy, mTrace: discard "ignore calls to the default destructor"
   of mOrd: genOrd(p, n, r)
   of mLengthStr, mLengthSeq, mLengthOpenArray, mLengthArray:
diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index d756701da2b..7355f919467 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -1000,6 +1000,14 @@ proc genMagic(c: var TCtx, n: PNode; m: TMagic) =
         arg = arg[^1]
 
       c.emitOperandTree arg, sink=false
+  of mArrToSeq:
+    if n[1].kind == nkBracket:
+      # optimization: translate ``@[...]`` to a sequence construction
+      c.buildTree mnkSeqConstr, rtyp:
+        for it in n[1].items:
+          c.emitOperandTree it, sink=true
+    else:
+      genCall(c, n)
 
   # arithmetic operations:
   of mAddI, mSubI, mMulI, mDivI, mModI, mPred, mSucc:
diff --git a/tests/arc/topt_no_cursor.nim b/tests/arc/topt_no_cursor.nim
index 0a86e9ccbd5..492e55655c0 100644
--- a/tests/arc/topt_no_cursor.nim
+++ b/tests/arc/topt_no_cursor.nim
@@ -48,20 +48,19 @@ scope:
 --expandArc: p1
 
 scope:
-  def _2: array[0..0, int] = [consume 123]
-  def lresult: seq[int] = arrToSeq(consume _2)
+  def lresult: seq[int] = @[consume 123]
   def lvalue: seq[int]
   def lnext: string
-  def _6: seq[int] = move lresult
-  def _: (seq[int], string) = (consume _6, consume ";")
-  bind_mut _8: seq[int] = _.0
-  lvalue := move _8
+  def _5: seq[int] = move lresult
+  def _: (seq[int], string) = (consume _5, consume ";")
+  bind_mut _7: seq[int] = _.0
+  lvalue := move _7
+  wasMoved(name _7)
+  bind_mut _8: string = _.1
+  lnext := move _8
   wasMoved(name _8)
-  bind_mut _9: string = _.1
-  lnext := move _9
-  wasMoved(name _9)
-  def _7: seq[int] = move(name lvalue)
-  result.value := move _7
+  def _6: seq[int] = move(name lvalue)
+  result.value := move _6
   =destroy(name _)
   =destroy(name lnext)
   =destroy(name lvalue)

From 29dc0c775da9e2a96e022f39c037a6db15cf415d Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Tue, 28 May 2024 03:49:54 +0200
Subject: [PATCH 104/169] lower `mChckIndex` with MIR pass (#1324)

## Summary

Lower `mChckIndex` magic calls with an MIR pass, instead of as part of
C code generation. This is a pure refactoring, with the goal of
shrinking down the C code generator.

## Details

The lowering is integrated into `rtchecks`, and is a MIR port of the
lowering previously performed by `cgen.genIndexCheck` (which is now
removed), including two pre-existing bugs. The two bugs are documented
in the code, and a test (`tout_of_range_index_check.nim`) is added for
one of them.

The lowering needs to query the unsigned version of the "size type", so
the `usizeType` query is added for `TypeEnv`.

Finally, a leftover `unreachable` debug statement that triggers on
unused labels is removed from `mirexec`: it would trigger when an index
check on a `cstring` (which gets eliminated by the lowering) is the
only jump-source for a label.
---
 compiler/backend/ccgexprs.nim                 |  37 ------
 compiler/mir/mirtypes.nim                     |  16 ++-
 compiler/mir/rtchecks.nim                     | 108 ++++++++++++++++++
 compiler/sem/mirexec.nim                      |   2 +-
 .../array/tout_of_range_index_check.nim       |  29 +++++
 5 files changed, 150 insertions(+), 42 deletions(-)
 create mode 100644 tests/lang_types/array/tout_of_range_index_check.nim

diff --git a/compiler/backend/ccgexprs.nim b/compiler/backend/ccgexprs.nim
index a71c040cc65..fbf2c02d71d 100644
--- a/compiler/backend/ccgexprs.nim
+++ b/compiler/backend/ccgexprs.nim
@@ -620,38 +620,6 @@ proc genBoundsCheck(p: BProc; arr, a, b: TLoc, exit: CgNode) =
   else:
     unreachable(ty.kind)
 
-proc genIndexCheck(p: BProc; x: CgNode, arr, idx: TLoc, exit: CgNode) =
-  ## Emits the index check logic + subsequent raise operation. `x` is
-  ## the array expression the `arr` loc resulted from from.
-  let ty = arr.t.skipTypes(abstractVar + tyUserTypeClasses +
-                           {tyPtr, tyRef, tyLent, tyVar})
-  case ty.kind
-  of tyArray:
-    var first = intLiteral(firstOrd(p.config, ty))
-    if firstOrd(p.config, ty) == 0 and lastOrd(p.config, ty) >= 0:
-      linefmt(p, cpsStmts, "if ((NU)($1) > (NU)($2)){ #raiseIndexError2($1, $2); $3}$n",
-              [rdCharLoc(idx), intLiteral(lastOrd(p.config, ty)),
-               raiseInstr(p, exit)])
-    else:
-      linefmt(p, cpsStmts, "if ($1 < $2 || $1 > $3){ #raiseIndexError3($1, $2, $3); $4}$n",
-              [rdCharLoc(idx), first, intLiteral(lastOrd(p.config, ty)),
-               raiseInstr(p, exit)])
-  of tySequence, tyString:
-    linefmt(p, cpsStmts,
-            "if ((NU)($1) >= (NU)$2){ #raiseIndexError2($1,$2-1); $3}$n",
-            [rdCharLoc(idx), lenExpr(p, arr), raiseInstr(p, exit)])
-  of tyOpenArray, tyVarargs:
-    if reifiedOpenArray(p, x):
-      linefmt(p, cpsStmts, "if ((NU)($1) >= (NU)($2.Field1)){ #raiseIndexError2($1,$2.Field1-1); $3}$n",
-              [rdCharLoc(idx), rdLoc(arr), raiseInstr(p, exit)])
-    else:
-      linefmt(p, cpsStmts, "if ((NU)($1) >= (NU)($2Len_0)){ #raiseIndexError2($1,$2Len_0-1); $3}$n",
-              [rdCharLoc(idx), rdLoc(arr), raiseInstr(p, exit)])
-  of tyCstring:
-    discard "no bound checks"
-  else:
-    unreachable()
-
 proc genOpenArrayElem(p: BProc, n, x, y: CgNode, d: var TLoc) =
   var a, b: TLoc
   initLocExpr(p, x, a)
@@ -1529,11 +1497,6 @@ proc genMagicExpr(p: BProc, e: CgNode, d: var TLoc, op: TMagic) =
       typ.add "*"
 
     linefmt(p, cpsStmts, "$1 = ($2)($3);$n", [a.r, typ, rdLoc(b)])
-  of mChckIndex:
-    var arr, a: TLoc
-    initLocExpr(p, e[1], arr)
-    initLocExpr(p, e[2], a)
-    genIndexCheck(p, e[1], arr, a, e.exit)
   of mChckBounds:
     var arr, a, b: TLoc
     initLocExpr(p, e[1], arr)
diff --git a/compiler/mir/mirtypes.nim b/compiler/mir/mirtypes.nim
index 7b0f90879bf..92748c662d3 100644
--- a/compiler/mir/mirtypes.nim
+++ b/compiler/mir/mirtypes.nim
@@ -41,6 +41,8 @@ type
     types: Store[TypeId, PType]
     sizeType: TypeId
       ## the target-dependent integer type to use for size values
+    usizeType: TypeId
+      ## the target-dependent unsigned integer type to use for size values
 
 const
   VoidType*    = TypeId 0
@@ -64,7 +66,8 @@ proc initTypeEnv*(graph: ModuleGraph): TypeEnv =
   ## Returns a fully initialized type environment instance.
   result = TypeEnv(map: default(TypeTable[TypeId]),
                    types: default(Store[TypeId, PType]),
-                   sizeType: VoidType)
+                   sizeType: VoidType,
+                   usizeType: VoidType)
 
   template add(kind: TTypeKind, expect: TypeId) =
     let
@@ -96,10 +99,10 @@ proc initTypeEnv*(graph: ModuleGraph): TypeEnv =
   add(tyInt,   TypeId(ord(PointerType) + 1))
   add(tyFloat, TypeId(ord(PointerType) + 2))
 
-  result.sizeType =
+  (result.sizeType, result.usizeType) =
     case graph.config.target.intSize
-    of 1, 2, 4: Int32Type
-    of 8:       Int64Type
+    of 1, 2, 4: (Int32Type, UInt32Type)
+    of 8:       (Int64Type, UInt64Type)
     else:       unreachable()
 
 proc add*(env: var TypeEnv, t: PType): TypeId =
@@ -116,3 +119,8 @@ func sizeType*(env: TypeEnv): TypeId {.inline.} =
   ## Returns the type to use for values representing some size. This is a
   ## signed integer type of target-dependent bit-width.
   env.sizeType
+
+func usizeType*(env: TypeEnv): TypeId {.inline.} =
+  ## Returns the type to use for values representing some size. This is an
+  ## unsigned integer type of target-dependent bit-width.
+  env.usizeType
diff --git a/compiler/mir/rtchecks.nim b/compiler/mir/rtchecks.nim
index 67a87127f39..a796e169518 100644
--- a/compiler/mir/rtchecks.nim
+++ b/compiler/mir/rtchecks.nim
@@ -75,6 +75,9 @@ template emitCall(bu; tree; call; prc: ProcedureId, arguments: untyped) =
 proc addCompilerProc(env; graph; name: string): ProcedureId =
   env.procedures.add(graph.getCompilerProc(name))
 
+proc makeLiteral(env; kind: MirNodeKind, val: Int128, typ: TypeId): Value =
+  literal(kind, env.getOrIncl(val.toUInt.BiggestUInt), typ)
+
 proc getInt(env: MirEnv, n: MirNode): Int128 =
   case n.kind
   of mnkIntLit:  toInt128 env.getInt(n.number)
@@ -201,6 +204,107 @@ proc emitNanCheck(tree; call; graph; env; bu) =
     bu.emitCall(tree, call, env.addCompilerProc(graph, "raiseFloatInvalidOp")):
       discard
 
+proc emitIndexCheck(tree; call; graph; env; bu) =
+  ## Emits the lowered index check for `call`.
+  let
+    arrOperand = NodePosition tree.argument(call, 0)
+    ty = env[tree[arrOperand].typ].skipTypes(abstractInst +
+      tyUserTypeClasses + {tyLent, tyVar})
+
+  if ty.kind == tyCstring:
+    # no index check needed
+    # XXX: index checks should be omitted for cstrings when using the C
+    #      backend
+    return
+
+  let
+    idxOperand = NodePosition tree.argument(call, 1)
+    sizeType  = env.types.sizeType
+    usizeType = env.types.usizeType
+
+  if ty.kind == tyArray and (firstOrd(graph.config, ty) != Zero or
+     lastOrd(graph.config, ty) < Zero):
+    # FIXME: this branch also need to be taken when lastOrd >= high(int)
+    # we need to test against both the lower and upper bound
+    let
+      typ   = env.types.add(env[tree[arrOperand].typ][0])
+      first = env.makeLiteral(mnkIntLit, firstOrd(graph.config, ty), typ)
+      last  = env.makeLiteral(mnkIntLit, lastOrd(graph.config, ty), typ)
+
+    # FIXME: there are two problems here:
+    #        * the comparison operator is wrong for non-int types
+    #        * the comparison operands don't use the same type
+    #        As a consequence, C integer promotion rules apply, leading to
+    #        incorrect test results in some cases. The bound values need to
+    #        be converted to the index operand's type first, with boundary
+    #        checks omitted where the boundary's value cannot be represented
+    #        with the index operand's type
+
+    let cond = bu.wrapTemp BoolType:
+      bu.buildMagicCall mLtI, BoolType:
+        bu.subTree mnkArg:
+          bu.emitFrom(tree, idxOperand)
+        bu.emitByVal first
+
+    bu.buildIfNot cond:
+      bu.subTree mnkAsgn:
+        bu.use cond
+        bu.buildMagicCall mLtI, BoolType:
+          bu.emitByVal last
+          bu.subTree mnkArg:
+            bu.emitFrom(tree, idxOperand)
+
+    bu.buildIf cond:
+      bu.emitCall(tree, call, env.addCompilerProc(graph, "raiseIndexError3")):
+        bu.subTree mnkArg:
+          bu.emitFrom(tree, idxOperand)
+        bu.emitByVal first
+        bu.emitByVal last
+
+  else:
+    # if the first index is at 0 and the length is guaranteed to be in range
+    # 0..high(int), an optimization is used: the operand is coverted to a
+    # first, and then only a single comparison against the length is used.
+    # This works because a negative index operand becomes a value > high(int)
+    # after to-uint conversion
+    var len: Value
+    if ty.kind == tyArray:
+      # the length is static
+      len = env.makeLiteral(mnkUIntLit, lengthOrd(graph.config, ty), usizeType)
+    else:
+      # the length is dynamic
+      let tmp = bu.wrapTemp sizeType:
+        bu.buildMagicCall mLengthOpenArray, sizeType:
+          bu.subTree mnkArg:
+            bu.emitFrom(tree, arrOperand)
+
+      # convert the length:
+      len = bu.wrapTemp usizeType:
+        bu.subTree mnkConv, usizeType:
+          bu.use tmp
+
+    # convert the index:
+    let idx = bu.wrapTemp usizeType:
+      bu.subTree mnkConv, usizeType:
+        bu.emitFrom(tree, idxOperand)
+
+    # compare the values:
+    let cond = bu.wrapTemp BoolType:
+      bu.buildMagicCall mLeU, BoolType:
+        bu.emitByVal len
+        bu.emitByVal idx
+
+    bu.buildIf cond:
+      let val = bu.wrapTemp usizeType:
+        bu.subTree mnkSub, usizeType:
+          bu.use len
+          bu.use literal(mnkUIntLit, env.getOrIncl(1), usizeType)
+
+      bu.emitCall(tree, call, env.addCompilerProc(graph, "raiseIndexError2")):
+        bu.subTree mnkArg:
+          bu.emitFrom(tree, idxOperand)
+        bu.emitByVal val
+
 proc emitFieldCheck(tree; source: SourceMap; call; graph; env; bu) =
   ## For ``chckField(set, discr, invert, msg)`` emits the MIR equivalent of:
   ##   if not contains(set, discr):
@@ -346,6 +450,10 @@ proc lowerChecks*(body; graph; env; changes: var Changeset) =
         # make sure to take the ``mnkVoid`` wrapper into account
         changes.replaceMulti(tree, tree.parent(call), bu):
           emitNanCheck(tree, call, graph, env, bu)
+      of mChckIndex:
+        let call = tree.parent(i)
+        changes.replaceMulti(tree, tree.parent(call), bu):
+          emitIndexCheck(tree, call, graph, env, bu)
       of mChckField:
         let call = tree.parent(i)
         # make sure to take the ``mnkVoid`` wrapper into account
diff --git a/compiler/sem/mirexec.nim b/compiler/sem/mirexec.nim
index f8e3cc6d467..d18560af7e1 100644
--- a/compiler/sem/mirexec.nim
+++ b/compiler/sem/mirexec.nim
@@ -381,7 +381,7 @@ func computeDfg*(tree: MirTree): DataFlowGraph =
       # patch the join-to-instruction mapping:
       env.joins[id] = env.instrs.high.InstrPos
     else:
-      unreachable("unused join point")
+      discard "label is not used, ignore"
 
   template goto(pos: NodePosition, label: LabelId) =
     env.instrs.add Instr(op: opGoto, node: pos, dest: map(env, label))
diff --git a/tests/lang_types/array/tout_of_range_index_check.nim b/tests/lang_types/array/tout_of_range_index_check.nim
new file mode 100644
index 00000000000..3726c9e9944
--- /dev/null
+++ b/tests/lang_types/array/tout_of_range_index_check.nim
@@ -0,0 +1,29 @@
+discard """
+  description: '''
+    Ensure that accessing an array works when the index operand's type cannot
+    be safely converted to the array's index type
+  '''
+  knownIssue.c: '''
+    The boundary checks are implemented improperly, leading to the array
+    appearing to effectively be empty
+  '''
+  knownIssue.vm: '''
+    Arrays with a start index outside of -128..127 crash the code generator
+  '''
+"""
+
+proc test1(index: int): int =
+  # try with an index range that overlaps with the `int` range
+  var arr: array[uint(high(int))..(uint(high(int)) + 2), int] = [1, 2, 3]
+  # not all valid array indices can be represented by `int`
+  result = arr[index]
+
+# the index is valid, no index error must be raised
+doAssert test1(high(int)) == 1
+
+proc test2(index: uint): int =
+  var arr: array[-1..1, int] = [1, 2, 3]
+  # not all valid array indices can be represented by `uint`
+  result = arr[index]
+
+doAssert test2(1) == 3

From fec3a493287d82af6a84a47bde7f58f500d5d5d8 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Wed, 29 May 2024 18:00:18 +0200
Subject: [PATCH 105/169] fix `result` not being cleaned up when procedure
 raises (#1326)

## Summary

The `result` variable is now destroyed when the procedure exits due to
a raised exception, fixing a memory/resource leak. All backends were
affected.

Fixes https://github.com/nim-works/nimskull/issues/1305.

## Details

* the `result` is destroyed within a special try-finally that only
  intercepts exceptional control-flow
* the new `errorOnly` field designates a `bkTryFinally` as only
  intercepting exceptional control-flow
* `mirgen` handles emitting the destroy operation and injecting the
  `try`

When the `result` variable is not initialized on any control-flow paths
leading to the destroy operation, the destroy is elided by the "destroy
elimination" pass; a test (`tno_destroy_for_empty_result.nim`) is added
to ensure this works.
---
 compiler/mir/mirgen.nim                       | 34 +++++++++++++++-
 compiler/mir/mirgen_blocks.nim                |  7 ++++
 tests/arc/topt_no_cursor.nim                  | 22 +++++++----
 .../destructor/tdestroy_result_when_raise.nim | 32 +++++++++++++++
 .../tno_destroy_for_empty_result.nim          | 39 +++++++++++++++++++
 5 files changed, 125 insertions(+), 9 deletions(-)
 create mode 100644 tests/lang_objects/destructor/tdestroy_result_when_raise.nim
 create mode 100644 tests/optimization/tno_destroy_for_empty_result.nim

diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index 7355f919467..dab8aa1a403 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -2400,10 +2400,21 @@ proc generateCode*(graph: ModuleGraph, env: var MirEnv, owner: PSym,
   var c = initCtx(graph, config, owner, move env)
   c.sp.active = (body, c.sp.map.add(body))
 
+  let
+    needsTerminate = sfNeverRaises in owner.flags
+    needsCleanup = (c.injectDestructors and
+                    owner.kind in routineKinds and
+                    owner.typ[0] != nil and
+                    hasDestructor(owner.typ[0]))
+
   c.withBlock bkBlock: # the target for return statements
-    if sfNeverRaises in owner.flags:
+    if needsTerminate:
       # it needs to be ensured that no exceptions leave the body
       c.blocks.add Block(kind: bkTryExcept)
+    if needsCleanup:
+      # the result variable only needs to be cleaned up when the procedure
+      # exits via an exception
+      c.blocks.add Block(kind: bkTryFinally, errorOnly: true)
 
     c.scope:
       if owner.kind in routineKinds:
@@ -2433,8 +2444,27 @@ proc generateCode*(graph: ModuleGraph, env: var MirEnv, owner: PSym,
 
       gen(c, body)
 
-    if sfNeverRaises in owner.flags and (let b = c.blocks.pop(); b.id.isSome):
+    var isFirst = true
+
+    if needsCleanup and (let b = c.blocks.pop(); b.id.isSome):
       leaveBlock(c) # jump over the handler
+      isFirst = false
+
+      # emit the finally section for cleaning up the result variable:
+      c.subTree mnkFinally:
+        c.add labelNode(b.id.unsafeGet)
+      c.subTree mnkDestroy:
+        c.use genLocation(c, owner.ast[resultPos])
+      # note: we don't need to reset the location. Per the MIR semantics, it's
+      # guaranteed that no one can observe the result location when the
+      # procedure raises
+      c.subTree mnkContinue:
+        c.add labelNode(b.id.unsafeGet)
+
+    if needsTerminate and (let b = c.blocks.pop(); b.id.isSome):
+      if isFirst:
+        leaveBlock(c)
+
       # emit the handler for panicking on escaping exceptions:
       c.subTree MirNode(kind: mnkExcept, len: 1):
         c.add labelNode(b.id.unsafeGet)
diff --git a/compiler/mir/mirgen_blocks.nim b/compiler/mir/mirgen_blocks.nim
index b32b1363b7c..8772505049b 100644
--- a/compiler/mir/mirgen_blocks.nim
+++ b/compiler/mir/mirgen_blocks.nim
@@ -45,6 +45,8 @@ type
     of bkTryFinally:
       doesntExit*: bool
         ## whether structured control-flow doesn't reach the end of the finally
+      errorOnly*: bool
+        ## whether only exceptional control-flow is intercepted
       exits*: seq[LabelId]
         ## unordered set of follow-up targets
     of bkTryExcept, bkFinally, bkExcept:
@@ -129,6 +131,11 @@ proc blockLeaveActions(c; bu; targetBlock: int): bool =
 
         last -= b.numRegistered
     of bkTryFinally:
+      if c.blocks[i].errorOnly and targetBlock >= 0 and
+         c.blocks[targetBlock].kind != bkTryExcept:
+        # ignore the finally; it only applies to exceptional control-flow
+        continue
+
       let label = bu.requestLabel(c.blocks[i])
       # register as outgoing edge of the preceding finally (if any):
       if previous != -1:
diff --git a/tests/arc/topt_no_cursor.nim b/tests/arc/topt_no_cursor.nim
index 492e55655c0..53496c6d0b2 100644
--- a/tests/arc/topt_no_cursor.nim
+++ b/tests/arc/topt_no_cursor.nim
@@ -13,7 +13,7 @@ doing shady stuff...
   nimout: '''--expandArc: newTarget
 
 scope:
-  def splat: tuple[dir: string, name: string, ext: string] = splitFile(arg path) -> [Resume]
+  def splat: tuple[dir: string, name: string, ext: string] = splitFile(arg path) -> [L0, Resume]
   bind_mut _7: string = splat.0
   def _3: string = move _7
   wasMoved(name _7)
@@ -26,6 +26,10 @@ scope:
   def _6: Target = (consume _3, consume _4, consume _5)
   result := move _6
   =destroy(name splat)
+  goto [L1]
+finally (L0):
+  continue {}
+L1:
 -- end of expandArc ------------------------
 --expandArc: delete
 
@@ -190,16 +194,20 @@ scope:
         goto [L1, L2]
   def_cursor _5: sink string = x
   def _6: int = lengthStr(arg _5)
-  def _7: string = $(arg _6) -> [L1, Resume]
-  echo(arg type(array[0..0, string]), arg _7) -> [L3, L1, Resume]
-  goto [L3, L1, L4]
-  finally (L3):
+  def _7: string = $(arg _6) -> [L1, L3, Resume]
+  echo(arg type(array[0..0, string]), arg _7) -> [L4, L1, L3, Resume]
+  goto [L4, L1, L5]
+  finally (L4):
     =destroy(name _7)
     continue {L1}
   finally (L1):
     =destroy(name x)
-    continue {L2, L4}
-  L4:
+    continue {L2, L3, L5}
+  L5:
+goto [L2]
+finally (L3):
+  =destroy(name result)
+  continue {}
 L2:
 
 -- end of expandArc ------------------------
diff --git a/tests/lang_objects/destructor/tdestroy_result_when_raise.nim b/tests/lang_objects/destructor/tdestroy_result_when_raise.nim
new file mode 100644
index 00000000000..c8d757302b5
--- /dev/null
+++ b/tests/lang_objects/destructor/tdestroy_result_when_raise.nim
@@ -0,0 +1,32 @@
+discard """
+  description: '''
+    Ensure that the result variable is cleaned up when already initialized and
+    the procedure exits due to a `raise`
+  '''
+  targets: c js vm
+"""
+
+import mhelper
+
+proc test(doRaise: bool): Resource =
+  result = initResource()
+  if doRaise:
+    raise CatchableError.newException("")
+
+block no_raise:
+  # make sure the result isn't destroyed too early when no exception is
+  # raised
+  var v = test(false)
+  doAssert numDestroy == 0
+
+doAssert numDestroy == 1
+numDestroy = 0
+
+block do_raise:
+  try:
+    var v = test(true)
+    # `v` must not be destroyed, otherwise there'd be a double-free
+  except CatchableError:
+    discard
+
+  doAssert numDestroy == 1
diff --git a/tests/optimization/tno_destroy_for_empty_result.nim b/tests/optimization/tno_destroy_for_empty_result.nim
new file mode 100644
index 00000000000..30b07f2dd25
--- /dev/null
+++ b/tests/optimization/tno_destroy_for_empty_result.nim
@@ -0,0 +1,39 @@
+discard """
+  description: '''
+    Ensure that the destructor call for the result variable is optimized away
+    when possible
+  '''
+  matrix: "--expandArc:test --hints:off"
+  nimoutfull: true
+  nimout: '''--expandArc: test
+scope:
+  scope:
+    if x:
+      scope:
+        doRaise() -> [L1, Resume]
+  def _2: Object = ()
+  result := move _2
+goto [L2]
+finally (L1):
+  continue {}
+L2:
+
+-- end of expandArc ------------------------
+'''
+"""
+
+type Object = object
+
+proc `=destroy`(x: var Object) =
+  discard
+
+proc doRaise() =
+  raise CatchableError.newException("")
+
+proc test(x: bool): Object {.exportc.} =
+  if x:
+    # raise with a separate procedure so that the ``--expandArc`` output is
+    # shorter
+    doRaise()
+
+  result = Object()

From b847eb6f2f6cbaa9cf9e1af38adbef581a36f103 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Wed, 29 May 2024 21:20:24 +0200
Subject: [PATCH 106/169] lower integer overflow checks with MIR pass (#1325)

## Summary

Lower the integer overflow checks with an MIR pass, instead of as part
of C code generation. This is mainly a refactoring, with the goal of
shrinking down the C code generator. As a side-effect, overflow checks
are very slightly faster.

## Details

The MIR produced by the lowering is similar to what the C code
generator previously output, but with one major difference: integer
operands smaller than the target's integer size now use dedicated
compilerprocs instead of first converting to `int`, performing the
checked arithmetic, and then comparing against the integer bounds.

The main reason for this change is that it makes the lowering pass
simpler and requires less MIR code, but it also has the benefit of
producing more efficient code. Run-time behaviour is not affected.

No dedicated gcc built-ins for overflow-checked arithmetic with
`short int` (int16) and `signed char` (int8) exist, so all checked
arithmetic compilerprocs now map to the generic gcc built-ins.

---------

Co-authored-by: Saem Ghani <saemghani+github@gmail.com>
---
 compiler/backend/ccgexprs.nim |  65 ----------------
 compiler/mir/rtchecks.nim     | 141 ++++++++++++++++++++++++++++++++++
 lib/nimbase.h                 |  36 +++++----
 lib/system/integerops.nim     |  27 +++++++
 4 files changed, 190 insertions(+), 79 deletions(-)

diff --git a/compiler/backend/ccgexprs.nim b/compiler/backend/ccgexprs.nim
index fbf2c02d71d..365138bb9a8 100644
--- a/compiler/backend/ccgexprs.nim
+++ b/compiler/backend/ccgexprs.nim
@@ -280,69 +280,6 @@ template unaryExprChar(p: BProc, e: CgNode, d: var TLoc, frmt: string) =
   initLocExpr(p, e[1], a)
   putIntoDest(p, d, e, ropecg(p.module, frmt, [rdCharLoc(a)]))
 
-template binaryArithOverflowRaw(p: BProc, t: PType, a, b: TLoc;
-                            cpname: string): Rope =
-  var size = getSize(p.config, t)
-  let storage = if size < p.config.target.intSize: rope("NI")
-                else: getTypeDesc(p.module, t)
-  var result = getTempName(p.module)
-  linefmt(p, cpsLocals, "$1 $2;$n", [storage, result])
-  lineCg(p, cpsStmts, "if (#$2($3, $4, &$1)) { #raiseOverflow(); $5};$n",
-      [result, cpname, rdCharLoc(a), rdCharLoc(b), raiseInstr(p, e.exit)])
-  if size < p.config.target.intSize or t.kind in {tyRange, tyEnum}:
-    linefmt(p, cpsStmts, "if ($1 < $2 || $1 > $3){ #raiseOverflow(); $4}$n",
-            [result, intLiteral(firstOrd(p.config, t)), intLiteral(lastOrd(p.config, t)),
-            raiseInstr(p, e.exit)])
-  result
-
-proc binaryArithOverflow(p: BProc, e: CgNode, d: var TLoc, m: TMagic) =
-  const
-    prc: array[mAddI..mModI, string] = [
-      "nimAddInt", "nimSubInt",
-      "nimMulInt", "nimDivInt", "nimModInt"
-    ]
-    prc64: array[mAddI..mModI, string] = [
-      "nimAddInt64", "nimSubInt64",
-      "nimMulInt64", "nimDivInt64", "nimModInt64"
-    ]
-  var a, b: TLoc
-  assert(e[1].typ != nil)
-  assert(e[2].typ != nil)
-  initLocExpr(p, e[1], a)
-  initLocExpr(p, e[2], b)
-  # skipping 'range' is correct here as we'll generate a proper range check
-  # later via 'chckRange'
-  let t = e.typ.skipTypes(abstractRange)
-  if true:
-    # we handle div by zero here so that we know that the compilerproc's
-    # result is only for overflows.
-    if m in {mDivI, mModI}:
-      linefmt(p, cpsStmts, "if ($1 == 0){ #raiseDivByZero(); $2}$n",
-              [rdLoc(b), raiseInstr(p, e.exit)])
-
-    let res = binaryArithOverflowRaw(p, t, a, b,
-      if t.kind == tyInt64: prc64[m] else: prc[m])
-    putIntoDest(p, d, e, "($#)($#)" % [getTypeDesc(p.module, e.typ), res])
-
-proc unaryArithOverflow(p: BProc, e: CgNode, d: var TLoc, m: TMagic) =
-  var
-    a: TLoc
-    t: PType
-  assert(e[1].typ != nil)
-  initLocExpr(p, e[1], a)
-  t = skipTypes(e.typ, abstractRange)
-  linefmt(p, cpsStmts, "if ($1 == $2){ #raiseOverflow(); $3}$n",
-          [rdLoc(a), intLiteral(firstOrd(p.config, t)), raiseInstr(p, e.exit)])
-  case m
-  of mUnaryMinusI:
-    putIntoDest(p, d, e, "((NI$2)-($1))" % [rdLoc(a), rope(getSize(p.config, t) * 8)])
-  of mUnaryMinusI64:
-    putIntoDest(p, d, e, "-($1)" % [rdLoc(a)])
-  of mAbsI:
-    putIntoDest(p, d, e, "($1 > 0? ($1) : -($1))" % [rdLoc(a)])
-  else:
-    assert(false, $m)
-
 proc binaryArith(p: BProc, e, x, y: CgNode, d: var TLoc, op: TMagic) =
   var
     a, b: TLoc
@@ -1398,10 +1335,8 @@ proc genBreakState(p: BProc, n: CgNode, d: var TLoc) =
 proc genMagicExpr(p: BProc, e: CgNode, d: var TLoc, op: TMagic) =
   case op
   of mNot..mUnaryPlusF64: unaryArith(p, e, e[1], d, op)
-  of mUnaryMinusI, mUnaryMinusI64: unaryArithOverflow(p, e, d, op)
   of mShrI..mXor: binaryArith(p, e, e[1], e[2], d, op)
   of mEqProc: genEqProc(p, e, d)
-  of mAddI..mPred: binaryArithOverflow(p, e, d, op)
   of mGetTypeInfo: genGetTypeInfo(p, e, d)
   of mGetTypeInfoV2: genGetTypeInfoV2(p, e, d)
   of mConStrStr: genStrConcat(p, e, d)
diff --git a/compiler/mir/rtchecks.nim b/compiler/mir/rtchecks.nim
index a796e169518..b5f186a1d93 100644
--- a/compiler/mir/rtchecks.nim
+++ b/compiler/mir/rtchecks.nim
@@ -397,6 +397,132 @@ proc emitObjectCheck(tree; call; graph; env; bu) =
     bu.emitCall(tree, call, env.addCompilerProc(graph, "raiseObjectConversionError")):
       discard
 
+# XXX: currently cannot be moved to within ``emitCheckedBinaryIntOp`` due to a
+#      csource compiler bug
+const ArithChcks: array[mAddI..mModI, array[tyInt..tyInt64, string]] = block:
+  # compile the names of the procedure at compile-time
+  var res: array[mAddI..mModI, array[tyInt..tyInt64, string]]
+  for op, it in res.mpairs:
+    let base = case op
+      of mAddI: "nimAddInt"
+      of mSubI: "nimSubInt"
+      of mMulI: "nimMulInt"
+      of mDivI: "nimDivInt"
+      of mModI: "nimModInt"
+
+    # the inner array stores the per-width names, which is the base name
+    # suffixed with the width
+    const intKinds = [tyInt8, tyInt16, tyInt32, tyInt64]
+    for i, k in intKinds.pairs:
+      it[k] = base & $(8 shl i)
+
+    # for the moment, there's still a generic-width version
+    it[tyInt] = base
+
+  res
+
+proc emitCheckedBinaryIntOp(tree; call; graph; env; bu): Value =
+  ## Emits the lowered version of a checked binary arithmetic operation.
+  ## Usually, it looks like this:
+  ##   def _1
+  ##   def _2 = nimAddInt(arg a, arg b, name _1)
+  ##   if _2:
+  ##     raiseOverflow()
+  ##   result = _1
+  let
+    magic = tree[call + 1].magic
+    t = env[tree[call].typ].skipTypes(abstractRange)
+    x = NodePosition tree.argument(call, 0)
+    y = NodePosition tree.argument(call, 1)
+
+  # divison-by-zero is checked for separately, so that a dedicated error can
+  # be reported:
+  if magic in {mDivI, mModI}:
+    let cond = bu.wrapTemp BoolType:
+      bu.buildMagicCall mEqI, BoolType:
+        bu.subTree mnkArg:
+          bu.emitFrom(tree, y)
+        bu.emitByVal literal(mnkIntLit, env.getOrIncl(0), tree[x].typ)
+
+    bu.buildIf cond:
+      bu.emitCall(tree, call, env.addCompilerProc(graph, "raiseDivByZero")):
+        discard
+
+  result = bu.allocTemp(tree[call].typ)
+  bu.subTree mnkDef:
+    bu.use result
+    bu.add MirNode(kind: mnkNone)
+
+  let kind = t.skipTypes({tyEnum}).kind
+  if kind in {tyUInt..tyUInt64, tyBool}:
+    # enums using an unsigned integer as the underlying type can reach here
+    # (due to ``succ`` and ``pred`` lowering), and no integer overflow
+    # check is performed for them -- the same goes for the bool typ
+    # XXX: no checked operation should be emitted for bool and unsigned enum
+    #      types in the first place
+    bu.subTree mnkInit:
+      bu.use result
+      # only 'add' and 'sub' operations can reach here
+      const Map = [mAddI: mnkAdd, mSubI: mnkSub]
+      bu.subTree Map[magic], tree[call].typ:
+        bu.emitFrom(tree, x)
+        bu.emitFrom(tree, y)
+
+  else:
+    # emit a call to the checked arithmethic operation:
+    let cond = bu.wrapTemp BoolType:
+      bu.buildCall env.addCompilerProc(graph, ArithChcks[magic][kind]), BoolType:
+        bu.subTree mnkArg:
+          bu.emitFrom(tree, x)
+        bu.subTree mnkArg:
+          bu.emitFrom(tree, y)
+        bu.emitByName(result, ekReassign)
+
+    bu.buildIf cond:
+      bu.emitCall(tree, call, env.addCompilerProc(graph, "raiseOverflow")):
+        discard
+
+  # for enum types, it's checked that they stay within their valid range
+  # XXX: this is unprincipled. Range and bool types are not considered, but
+  #      without any clear reason as to why. Using range checks instead might
+  #      be a better solution
+  if t.kind == tyEnum:
+    let litKind = if isUnsigned(t): mnkUIntLit else: mnkIntLit
+    let cond = bu.wrapTemp BoolType:
+      bu.buildMagicCall mLtEnum, BoolType:
+        bu.emitByVal result
+        bu.emitByVal env.makeLiteral(litKind, firstOrd(graph.config, t),
+                                     result.typ)
+
+    bu.buildIfNot cond:
+      bu.subTree mnkAsgn:
+        bu.use cond
+        bu.buildMagicCall mLtEnum, BoolType:
+          bu.emitByVal env.makeLiteral(litKind, lastOrd(graph.config, t),
+                                       result.typ)
+          bu.emitByVal result
+
+    bu.buildIf cond:
+      bu.emitCall(tree, call, env.addCompilerProc(graph, "raiseOverflow")):
+        discard
+
+proc emitUnaryOverflowCheck(tree; call; graph; env; bu) =
+  ## Emits the overflow check for an integer negation operation:
+  ##   if x == low(x):
+  ##     raiseOverflow()
+  let
+    typ = tree[call].typ
+    min = firstOrd(graph.config, env[typ])
+    cond = bu.wrapTemp BoolType:
+      bu.buildMagicCall mEqI, BoolType:
+        bu.subTree mnkArg:
+          bu.emitFrom(tree, NodePosition tree.argument(call, 0))
+        bu.emitByVal env.makeLiteral(mnkIntLit, min, typ)
+
+  bu.buildIf cond:
+    bu.emitCall(tree, call, env.addCompilerProc(graph, "raiseOverflow")):
+      discard
+
 proc emitCheckedFloatOp(tree; call; graph; env; bu): Value =
   ## Emits the lowered version of a checked float arithmetic operation.
   ## Checked means that the result is tested for infinity.
@@ -464,6 +590,21 @@ proc lowerChecks*(body; graph; env; changes: var Changeset) =
         changes.replaceMulti(tree, tree.parent(call), bu):
           emitObjectCheck(tree, call, graph, env, bu)
 
+      of mAddI, mSubI, mMulI, mModI, mDivI:
+        let call = tree.parent(i)
+        var tmp: Value
+        changes.insert(tree, tree.parent(call), call, bu):
+          tmp = emitCheckedBinaryIntOp(tree, call, graph, env, bu)
+        changes.replaceMulti(tree, call, bu):
+          bu.use tmp
+      of mUnaryMinusI, mUnaryMinusI64:
+        let call = tree.parent(i)
+        changes.insert(tree, tree.parent(call), call, bu):
+          emitUnaryOverflowCheck(tree, call, graph, env, bu)
+        # replace with built-in negation operation:
+        changes.replaceMulti(tree, call, bu):
+          bu.subTree MirNode(kind: mnkNeg, typ: tree[call].typ):
+            bu.emitFrom(tree, NodePosition tree.argument(call, 0))
       of mAddF64, mSubF64, mMulF64, mDivF64:
         let call = tree.parent(i)
         var tmp: Value
diff --git a/lib/nimbase.h b/lib/nimbase.h
index 4720b251c5d..8b91e228d24 100644
--- a/lib/nimbase.h
+++ b/lib/nimbase.h
@@ -568,26 +568,34 @@ NIM_STATIC_ASSERT(sizeof(NI) == sizeof(void*) && NIM_INTBITS == sizeof(NI)*8, ""
 
 /* these exist to make the codegen logic simpler */
 #define nimModInt(a, b, res) (((*res) = (a) % (b)), 0)
+#define nimModInt8(a, b, res) (((*res) = (a) % (b)), 0)
+#define nimModInt16(a, b, res) (((*res) = (a) % (b)), 0)
+#define nimModInt32(a, b, res) (((*res) = (a) % (b)), 0)
 #define nimModInt64(a, b, res) (((*res) = (a) % (b)), 0)
 
 #if (!defined(_MSC_VER) || defined(__clang__)) && !defined(NIM_EmulateOverflowChecks)
   /* these exist because we cannot have .compilerProcs that are importc'ed
     by a different name */
 
-  #define nimAddInt64(a, b, res) __builtin_saddll_overflow(a, b, (long long int*)res)
-  #define nimSubInt64(a, b, res) __builtin_ssubll_overflow(a, b, (long long int*)res)
-  #define nimMulInt64(a, b, res) __builtin_smulll_overflow(a, b, (long long int*)res)
-
-  #if NIM_INTBITS == 32
-    #define nimAddInt(a, b, res) __builtin_sadd_overflow(a, b, res)
-    #define nimSubInt(a, b, res) __builtin_ssub_overflow(a, b, res)
-    #define nimMulInt(a, b, res) __builtin_smul_overflow(a, b, res)
-  #else
-    /* map it to the 'long long' variant */
-    #define nimAddInt(a, b, res) __builtin_saddll_overflow(a, b, (long long int*)res)
-    #define nimSubInt(a, b, res) __builtin_ssubll_overflow(a, b, (long long int*)res)
-    #define nimMulInt(a, b, res) __builtin_smulll_overflow(a, b, (long long int*)res)
-  #endif
+  #define nimAddInt8(a, b, res) __builtin_add_overflow(a, b, res)
+  #define nimSubInt8(a, b, res) __builtin_sub_overflow(a, b, res)
+  #define nimMulInt8(a, b, res) __builtin_mul_overflow(a, b, res)
+
+  #define nimAddInt16(a, b, res) __builtin_add_overflow(a, b, res)
+  #define nimSubInt16(a, b, res) __builtin_sub_overflow(a, b, res)
+  #define nimMulInt16(a, b, res) __builtin_mul_overflow(a, b, res)
+
+  #define nimAddInt32(a, b, res) __builtin_add_overflow(a, b, res)
+  #define nimSubInt32(a, b, res) __builtin_sub_overflow(a, b, res)
+  #define nimMulInt32(a, b, res) __builtin_mul_overflow(a, b, res)
+
+  #define nimAddInt64(a, b, res) __builtin_add_overflow(a, b, res)
+  #define nimSubInt64(a, b, res) __builtin_sub_overflow(a, b, res)
+  #define nimMulInt64(a, b, res) __builtin_mul_overflow(a, b, res)
+
+  #define nimAddInt(a, b, res) __builtin_add_overflow(a, b, res)
+  #define nimSubInt(a, b, res) __builtin_sub_overflow(a, b, res)
+  #define nimMulInt(a, b, res) __builtin_mul_overflow(a, b, res)
 #endif
 
 #define NIM_NOALIAS __restrict
diff --git a/lib/system/integerops.nim b/lib/system/integerops.nim
index d543fd3bbdb..bc09f6c1ade 100644
--- a/lib/system/integerops.nim
+++ b/lib/system/integerops.nim
@@ -26,6 +26,18 @@ when not defined(nimEmulateOverflowChecks):
   proc nimSubInt(a, b: int, res: ptr int): bool {.nimbaseH.}
   proc nimMulInt(a, b: int, res: ptr int): bool {.nimbaseH.}
 
+  proc nimAddInt8(a, b: int8, res: ptr int8): bool {.nimbaseH.}
+  proc nimSubInt8(a, b: int8, res: ptr int8): bool {.nimbaseH.}
+  proc nimMulInt8(a, b: int8, res: ptr int8): bool {.nimbaseH.}
+
+  proc nimAddInt16(a, b: int16, res: ptr int16): bool {.nimbaseH.}
+  proc nimSubInt16(a, b: int16, res: ptr int16): bool {.nimbaseH.}
+  proc nimMulInt16(a, b: int16, res: ptr int16): bool {.nimbaseH.}
+
+  proc nimAddInt32(a, b: int32, res: ptr int32): bool {.nimbaseH.}
+  proc nimSubInt32(a, b: int32, res: ptr int32): bool {.nimbaseH.}
+  proc nimMulInt32(a, b: int32, res: ptr int32): bool {.nimbaseH.}
+
   proc nimAddInt64(a, b: int64; res: ptr int64): bool {.nimbaseH.}
   proc nimSubInt64(a, b: int64; res: ptr int64): bool {.nimbaseH.}
   proc nimMulInt64(a, b: int64; res: ptr int64): bool {.nimbaseH.}
@@ -36,6 +48,9 @@ when not defined(nimEmulateOverflowChecks):
 # check for 0 to the codgen.
 proc nimModInt(a, b: int; res: ptr int): bool {.nimbaseH.}
 
+proc nimModInt8(a, b: int8; res: ptr int8): bool {.nimbaseH.}
+proc nimModInt16(a, b: int16; res: ptr int16): bool {.nimbaseH.}
+proc nimModInt32(a, b: int32; res: ptr int32): bool {.nimbaseH.}
 proc nimModInt64(a, b: int64; res: ptr int64): bool {.nimbaseH.}
 
 # Platform independent versions.
@@ -50,6 +65,9 @@ template addImplFallback(name, T, U) {.dirty.} =
         result = true
 
 addImplFallback(nimAddInt, int, uint)
+addImplFallback(nimAddInt8, int8, uint8)
+addImplFallback(nimAddInt16, int16, uint16)
+addImplFallback(nimAddInt32, int32, uint32)
 addImplFallback(nimAddInt64, int64, uint64)
 
 template subImplFallback(name, T, U) {.dirty.} =
@@ -62,6 +80,9 @@ template subImplFallback(name, T, U) {.dirty.} =
         result = true
 
 subImplFallback(nimSubInt, int, uint)
+subImplFallback(nimSubInt8, int8, uint8)
+subImplFallback(nimSubInt16, int16, uint16)
+subImplFallback(nimSubInt32, int32, uint32)
 subImplFallback(nimSubInt64, int64, uint64)
 
 template mulImplFallback(name, T, U, conv) {.dirty.} =
@@ -108,6 +129,9 @@ template mulImplFallback(name, T, U, conv) {.dirty.} =
           result = true
 
 mulImplFallback(nimMulInt, int, uint, toFloat)
+mulImplFallback(nimMulInt8, int8, uint8, toFloat)
+mulImplFallback(nimMulInt16, int16, uint16, toFloat)
+mulImplFallback(nimMulInt32, int32, uint32, toFloat)
 mulImplFallback(nimMulInt64, int64, uint64, toBiggestFloat)
 
 
@@ -120,6 +144,9 @@ template divImplFallback(name, T) {.dirty.} =
       res[] = a div b
 
 divImplFallback(nimDivInt, int)
+divImplFallback(nimDivInt8, int8)
+divImplFallback(nimDivInt16, int16)
+divImplFallback(nimDivInt32, int32)
 divImplFallback(nimDivInt64, int64)
 
 proc raiseFloatInvalidOp {.errorPrc.} =

From 876540a95b907b8de6640763270c5ce5e3c76128 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Wed, 29 May 2024 23:11:04 +0200
Subject: [PATCH 107/169] fix index check bugs affecting the C backend (#1327)

## Summary

Fix two bugs with index checks:
* accessing an `array` with a negative base index with a `uint` operand
  could result in false positive errors
* in some edge cases, array access would "wrap around", instead of an
  index error being reported; regression from
  https://github.com/nim-works/nimskull/pull/1324

Only the C backend was affected.

## Details

The MIR code produced by the `mChckIndex` lowering used different types
for the comparison operands, so the C integer promotion rules applied,
causing false positive and false negative results.

To fix the bug, the suggestion provided by the fixme is implemented,
namely that the boundary values are first converted to the index
operand's type prior to comparison.

If a boundary index value is not representable with the index operand's
type, the boundary test is omitted. Take, for example,
`array[-1..1, int]` that is indexed with a `uint` value: `uint` is
guaranteed to be >= 0, so the `-1 < idx` test can be folded away.

It's guaranteed that only one comparison can be omitted, because
otherwise the array access could statically be proven to work, and no
index check would have been emitted by `mirgen` in the first place.

### Tests

* the `tout_of_range_index_check.nim` test is enabled for the C target
* a regression test for the fixed false negative check is added
---
 compiler/mir/rtchecks.nim                     | 73 +++++++++++--------
 .../array/tout_of_range_index_check.nim       | 10 ++-
 2 files changed, 48 insertions(+), 35 deletions(-)

diff --git a/compiler/mir/rtchecks.nim b/compiler/mir/rtchecks.nim
index b5f186a1d93..3eef32f9a0c 100644
--- a/compiler/mir/rtchecks.nim
+++ b/compiler/mir/rtchecks.nim
@@ -219,40 +219,51 @@ proc emitIndexCheck(tree; call; graph; env; bu) =
 
   let
     idxOperand = NodePosition tree.argument(call, 1)
-    sizeType  = env.types.sizeType
-    usizeType = env.types.usizeType
-
-  if ty.kind == tyArray and (firstOrd(graph.config, ty) != Zero or
-     lastOrd(graph.config, ty) < Zero):
-    # FIXME: this branch also need to be taken when lastOrd >= high(int)
-    # we need to test against both the lower and upper bound
+    sizeType   = env.types.sizeType
+    usizeType  = env.types.usizeType
+    conf       = graph.config
+
+  if ty.kind == tyArray and (firstOrd(conf, ty) != Zero or
+     lengthOrd(conf, ty) > lastOrd(conf, env[sizeType])):
+    # we cannot check against just the length; the lower and upper bound need
+    # to be checked against separately
     let
-      typ   = env.types.add(env[tree[arrOperand].typ][0])
-      first = env.makeLiteral(mnkIntLit, firstOrd(graph.config, ty), typ)
-      last  = env.makeLiteral(mnkIntLit, lastOrd(graph.config, ty), typ)
-
-    # FIXME: there are two problems here:
-    #        * the comparison operator is wrong for non-int types
-    #        * the comparison operands don't use the same type
-    #        As a consequence, C integer promotion rules apply, leading to
-    #        incorrect test results in some cases. The bound values need to
-    #        be converted to the index operand's type first, with boundary
-    #        checks omitted where the boundary's value cannot be represented
-    #        with the index operand's type
-
-    let cond = bu.wrapTemp BoolType:
-      bu.buildMagicCall mLtI, BoolType:
-        bu.subTree mnkArg:
-          bu.emitFrom(tree, idxOperand)
-        bu.emitByVal first
-
-    bu.buildIfNot cond:
-      bu.subTree mnkAsgn:
-        bu.use cond
-        bu.buildMagicCall mLtI, BoolType:
-          bu.emitByVal last
+      idxTyp = env[tree[idxOperand].typ]
+      litKind = if isUnsigned(idxTyp): mnkUIntLit else: mnkIntLit
+      lo     = firstOrd(conf, ty)
+      hi     = lastOrd(conf, ty)
+      first  = env.makeLiteral(litKind, lo, tree[idxOperand].typ)
+      last   = env.makeLiteral(litKind, hi, tree[idxOperand].typ)
+      ltOp   = getMagicLessForType(idxTyp.skipTypes(abstractRange +
+                                                    tyUserTypeClasses)).lt
+
+    var cond: Value
+    if firstOrd(conf, idxTyp) < lo:
+      # lower bound needs to be checked against
+      cond = bu.wrapTemp BoolType:
+        bu.buildMagicCall ltOp, BoolType:
           bu.subTree mnkArg:
             bu.emitFrom(tree, idxOperand)
+          bu.emitByVal first
+
+    if lastOrd(conf, idxTyp) > hi:
+      # upper bound needs to be checked against
+      proc check(bu; tree; m: TMagic, src: NodePosition, val: Value) {.nimcall.} =
+        bu.buildMagicCall m, BoolType:
+          bu.emitByVal val
+          bu.subTree mnkArg:
+            bu.emitFrom(tree, src)
+
+      if firstOrd(conf, idxTyp) < lo:
+        # the upper bound only needs to be tested when the lower bound check
+        # succeeded
+        bu.buildIfNot cond:
+          bu.subTree mnkAsgn:
+            bu.use cond
+            check(bu, tree, ltOp, idxOperand, last)
+      else:
+        cond = bu.wrapTemp BoolType:
+          check(bu, tree, ltOp, idxOperand, last)
 
     bu.buildIf cond:
       bu.emitCall(tree, call, env.addCompilerProc(graph, "raiseIndexError3")):
diff --git a/tests/lang_types/array/tout_of_range_index_check.nim b/tests/lang_types/array/tout_of_range_index_check.nim
index 3726c9e9944..ab503ff10f7 100644
--- a/tests/lang_types/array/tout_of_range_index_check.nim
+++ b/tests/lang_types/array/tout_of_range_index_check.nim
@@ -3,10 +3,6 @@ discard """
     Ensure that accessing an array works when the index operand's type cannot
     be safely converted to the array's index type
   '''
-  knownIssue.c: '''
-    The boundary checks are implemented improperly, leading to the array
-    appearing to effectively be empty
-  '''
   knownIssue.vm: '''
     Arrays with a start index outside of -128..127 crash the code generator
   '''
@@ -27,3 +23,9 @@ proc test2(index: uint): int =
   result = arr[index]
 
 doAssert test2(1) == 3
+
+# regression test: make sure that an index that is valid after conversion to
+# uint gets caught by the index check
+when not defined(vm): # catching defects is not supported by the VM
+  doAssertRaises IndexDefect:
+    discard test1(low(int))

From 3618e765d3271b6ae55ec62e7bf3ad27dd89079c Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Fri, 31 May 2024 23:52:33 +0200
Subject: [PATCH 108/169] remove unnecessary `ccgutils` dependency (#1330)

## Summary

Remove an obsolete usage of `ccgIntroducedPtr` from sem, breaking an
import dependency between sem and the code generator, and allowing for
`ccgIntroducedPtr` to move back to `ccgtypes`.

## Details

It was originally possible for the arguments to a copy hook to overlap
in memory (a parameter aliasing violation), resulting in incorrect
behaviour when copying variant objects if they did.

ed126794b6af8b39960a7acc603cee1abc73da4a worked around this by checking
whether both parameters were (hidden) pointers to the same location,
skipping the copy if they were, with `ccgIntroducedPtr` used to check
whether the source parameter is passed via a pointer indirection.

This is a layering violation, and also no longer necessary, since
`injecthooks` ensures that the immutable argument doesn't refer to the
same memory location as the mutable one -- the workaround in
`liftdestructors` can thus be removed.
---
 compiler/backend/ccgtypes.nim    | 26 +++++++++++++++++++
 compiler/backend/ccgutils.nim    | 44 +-------------------------------
 compiler/sem/liftdestructors.nim | 12 ---------
 3 files changed, 27 insertions(+), 55 deletions(-)

diff --git a/compiler/backend/ccgtypes.nim b/compiler/backend/ccgtypes.nim
index 999d266f41f..69d0571f112 100644
--- a/compiler/backend/ccgtypes.nim
+++ b/compiler/backend/ccgtypes.nim
@@ -199,6 +199,32 @@ proc addAbiCheck(m: BModule, t: PType, name: Rope) =
     m.s[cfsTypeInfo].addf("NIM_STATIC_ASSERT(sizeof($1) == $2, $3);$n", [name, rope(size), msg2.rope])
     # see `testCodegenABICheck` for example error message it generates
 
+proc ccgIntroducedPtr(conf: ConfigRef; s: PSym, retType: PType): bool =
+  var pt = skipTypes(s.typ, typedescInst)
+  assert skResult != s.kind
+
+  if tfByRef in pt.flags: return true
+  elif tfByCopy in pt.flags: return false
+  case pt.kind
+  of tyObject:
+    if s.typ.sym != nil and sfForward in s.typ.sym.flags:
+      # forwarded objects are *always* passed by pointers for consistency!
+      result = true
+    elif (optByRef in s.options) or (getSize(conf, pt) > conf.target.floatSize * 3):
+      result = true           # requested anyway
+    elif (tfFinal in pt.flags) and (pt[0] == nil):
+      result = false          # no need, because no subtyping possible
+    else:
+      result = true           # ordinary objects are always passed by reference,
+                              # otherwise casting doesn't work
+  of tyTuple:
+    result = (getSize(conf, pt) > conf.target.floatSize*3) or (optByRef in s.options)
+  else:
+    result = false
+  # first parameter and return type is 'lent T'? --> use pass by pointer
+  if s.position == 0 and retType != nil and retType.kind == tyLent:
+    result = not (pt.kind in {tyVar, tyArray, tyOpenArray, tyVarargs, tyRef, tyPtr, tyPointer} or
+      pt.kind == tySet and mapSetType(conf, pt) == ctArray)
 
 proc initResultParamLoc(conf: ConfigRef; param: CgNode): TLoc =
   result = initLoc(locParam, param, "Result", OnStack)
diff --git a/compiler/backend/ccgutils.nim b/compiler/backend/ccgutils.nim
index a00f4316543..473a29eacb8 100644
--- a/compiler/backend/ccgutils.nim
+++ b/compiler/backend/ccgutils.nim
@@ -14,19 +14,13 @@ import
     hashes, strutils
   ],
   compiler/ast/[
-    ast,
-    types
+    ast
   ],
   compiler/front/[
     options
   ],
   compiler/utils/[
     platform
-  ],
-  compiler/sem/[
-  ],
-  compiler/backend/[
-    cgendata,
   ]
 
 proc hashString*(conf: ConfigRef; s: string): BiggestInt =
@@ -108,39 +102,3 @@ proc mangle*(name: string): string =
       requiresUnderscore = true
   if requiresUnderscore:
     result.add "_"
-
-proc mapSetType(conf: ConfigRef; typ: PType): TCTypeKind =
-  case int(getSize(conf, typ))
-  of 1: result = ctInt8
-  of 2: result = ctInt16
-  of 4: result = ctInt32
-  of 8: result = ctInt64
-  else: result = ctArray
-
-proc ccgIntroducedPtr*(conf: ConfigRef; s: PSym, retType: PType): bool =
-  var pt = skipTypes(s.typ, typedescInst)
-  assert skResult != s.kind
-
-  if tfByRef in pt.flags: return true
-  elif tfByCopy in pt.flags: return false
-  case pt.kind
-  of tyObject:
-    if s.typ.sym != nil and sfForward in s.typ.sym.flags:
-      # forwarded objects are *always* passed by pointers for consistency!
-      result = true
-    elif (optByRef in s.options) or (getSize(conf, pt) > conf.target.floatSize * 3):
-      result = true           # requested anyway
-    elif (tfFinal in pt.flags) and (pt[0] == nil):
-      result = false          # no need, because no subtyping possible
-    else:
-      result = true           # ordinary objects are always passed by reference,
-                              # otherwise casting doesn't work
-  of tyTuple:
-    result = (getSize(conf, pt) > conf.target.floatSize*3) or (optByRef in s.options)
-  else:
-    result = false
-  # first parameter and return type is 'lent T'? --> use pass by pointer
-  if s.position == 0 and retType != nil and retType.kind == tyLent:
-    result = not (pt.kind in {tyVar, tyArray, tyOpenArray, tyVarargs, tyRef, tyPtr, tyPointer} or
-      pt.kind == tySet and mapSetType(conf, pt) == ctArray)
-
diff --git a/compiler/sem/liftdestructors.nim b/compiler/sem/liftdestructors.nim
index 289412b5d6d..bb5e6ce798a 100644
--- a/compiler/sem/liftdestructors.nim
+++ b/compiler/sem/liftdestructors.nim
@@ -37,9 +37,6 @@ import
     semdata,
     sighashes,
     lowerings
-  ],
-  compiler/backend/[
-    ccgutils
   ]
 
 from compiler/ast/reports_sem import reportAst,
@@ -224,15 +221,6 @@ proc fillBodyObjT(c: var TLiftCtx; t: PType, body, x, y: PNode) =
     # for every field (dependent on dest.kind):
     #   `=` dest.field, src.field
     # =destroy(blob)
-    var dummy = newSym(skTemp, getIdent(c.g.cache, lowerings.genPrefix), nextSymId c.idgen, c.fn, c.info)
-    dummy.typ = y.typ
-    if ccgIntroducedPtr(c.g.config, dummy, y.typ):
-      # Because of potential aliasing when the src param is passed by ref, we need to check for equality here,
-      # because the wasMoved(dest) call would zero out src, if dest aliases src.
-      var cond = newTree(nkCall, newSymNode(c.g.getSysMagic(c.info, "==", mEqRef)),
-        newTreeIT(nkAddr, c.info, makePtrType(c.fn, x.typ, c.idgen), x), newTreeIT(nkAddr, c.info, makePtrType(c.fn, y.typ, c.idgen), y))
-      cond.typ = getSysType(c.g, x.info, tyBool)
-      body.add genIf(c, cond, newTreeI(nkReturnStmt, c.info, newNodeI(nkEmpty, c.info)))
     var temp = newSym(skTemp, getIdent(c.g.cache, lowerings.genPrefix), nextSymId c.idgen, c.fn, c.info)
     temp.typ = x.typ
     incl(temp.flags, sfFromGeneric)

From 36a314bfa20b9190693ed0c080f29f0cb41144dc Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Mon, 3 Jun 2024 19:40:51 +0200
Subject: [PATCH 109/169] mir: remove statement nesting (#1331)

## Summary

Scopes are now no longer subtrees that can have other statements nested
within them. This removes the last case of statement nesting from
the MIR, meaning that all bodies are now made up of flat statement
lists.

## Details

Statement nesting complicates tree traversal, and - more importantly -
prevents the eventual removal of the `mnkEnd` nodes. Without `mnkEnd`
nodes, the number of sub-nodes is going to be explicitly stored in the
subtree nodes, which cannot efficiently work in the `Changeset`
architecture when statements can be nested.

Construction of MIR trees is updated accordingly (`subTree` cannot be
used for wrapping statements in a scope; the `scope` template is used
instead), as well as tree traversal.
---
 compiler/backend/backends.nim      |  7 ++++---
 compiler/backend/cgirgen.nim       | 11 +++++-----
 compiler/mir/injecthooks.nim       | 11 +++++-----
 compiler/mir/mirconstr.nim         |  5 +++--
 compiler/mir/mirgen.nim            | 13 ++++++------
 compiler/mir/mirpasses.nim         |  6 +++---
 compiler/mir/mirtrees.nim          | 11 ++++++----
 compiler/mir/rtchecks.nim          |  2 +-
 compiler/mir/utils.nim             | 16 ++++-----------
 compiler/sem/injectdestructors.nim | 32 ++++++++++++++++++++----------
 doc/mir.rst                        |  3 ++-
 11 files changed, 64 insertions(+), 53 deletions(-)

diff --git a/compiler/backend/backends.nim b/compiler/backend/backends.nim
index 2893dd51e46..02e9b9dfbb9 100644
--- a/compiler/backend/backends.nim
+++ b/compiler/backend/backends.nim
@@ -283,7 +283,7 @@ func isEmpty*(tree: MirTree): bool =
   ## Returns whether `tree` contains either no nodes or only nodes that have
   ## no meaning by themselves.
   for n in tree.items:
-    if n.kind notin {mnkScope, mnkEnd}:
+    if n.kind notin {mnkScope, mnkEndScope, mnkEnd}:
       return false
 
   result = true
@@ -416,13 +416,14 @@ proc produceFragmentsForGlobals(
     # on this
     if bu.front.len == 0:
       discard bu.addLocal(Local()) # empty result slot
-      bu.add(m.add(n)): MirNode(kind: mnkScope)
+      bu.setSource(m.add(n))
+      bu.subTree mnkScope: discard
 
   func finish(bu: sink MirBuilder, m: var SourceMap, n: PNode
              ): auto {.nimcall.} =
     if bu.front.len > 0:
       bu.setSource(m.add(n))
-      bu.add endNode(mnkScope)
+      bu.subTree mnkEndScope: discard
     # we're creating a body here, so there is no list of locals yet
     result = finish(bu, default(Store[LocalId, Local]))
 
diff --git a/compiler/backend/cgirgen.nim b/compiler/backend/cgirgen.nim
index 6256c31f910..ecf2aec78c0 100644
--- a/compiler/backend/cgirgen.nim
+++ b/compiler/backend/cgirgen.nim
@@ -656,10 +656,11 @@ proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
     toList cnkEmitStmt:
       res.add valueToIr(tree, cl, cr)
   of mnkScope:
+    leave(tree, cr)
     scopeToIr(tree, env, cl, cr, stmts)
   of mnkDestroy:
     unreachable("a 'destroy' that wasn't lowered")
-  of AllNodeKinds - StmtNodes:
+  of AllNodeKinds - StmtNodes + {mnkEndScope}:
     unreachable(n.kind)
 
 proc setElementToIr(tree: MirBody, cl: var TranslateCl,
@@ -771,7 +772,7 @@ proc exprToIr(tree: MirBody, cl: var TranslateCl,
   of mnkCopy, mnkMove, mnkSink:
     # translation of assignments needs to handle all modifiers
     unreachable("loose assignment modifier")
-  of AllNodeKinds - ExprKinds - {mnkNone}:
+  of AllNodeKinds - ExprKinds - {mnkNone} + {mnkEndScope}:
     unreachable(n.kind)
 
 proc genDefFor(sym: sink CgNode): CgNode =
@@ -797,11 +798,11 @@ proc scopeToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
   cl.inUnscoped = 0
 
   # translate all statements:
-  while cr.hasNext(tree) and tree[cr].kind != mnkEnd:
+  while cr.hasNext(tree) and tree[cr].kind != mnkEndScope:
     stmtToIr(tree, env, cl, cr, stmts)
 
-  if cr.hasNext(tree) and tree[cr].kind == mnkEnd:
-    leave(tree, cr) # close the sub-tree
+  if cr.hasNext(tree) and tree[cr].kind == mnkEndScope:
+    skip(tree, cr)
 
   if cl.defs.len > prev:
     # insert all the lifted defs at the start of the scope
diff --git a/compiler/mir/injecthooks.nim b/compiler/mir/injecthooks.nim
index f2bb6b40277..ad192656f02 100644
--- a/compiler/mir/injecthooks.nim
+++ b/compiler/mir/injecthooks.nim
@@ -104,12 +104,11 @@ proc isUsedForSink(tree: MirTree, stmt: NodePosition): bool =
         break
     of mnkScope:
       inc depth
-    of mnkEnd:
-      if tree[n].kind == mnkScope:
-        dec depth
-        if depth < 0:
-          # the end of the temporary's surrounding scope is reached
-          break
+    of mnkEndScope:
+      dec depth
+      if depth < 0:
+        # the end of the temporary's surrounding scope is reached
+        break
     else:
       discard
 
diff --git a/compiler/mir/mirconstr.nim b/compiler/mir/mirconstr.nim
index 7b487689274..ea6b23213d0 100644
--- a/compiler/mir/mirconstr.nim
+++ b/compiler/mir/mirconstr.nim
@@ -312,8 +312,9 @@ template stmtList*(bu: var MirBuilder, body: untyped) =
     body
 
 template scope*(bu: var MirBuilder, body: untyped) =
-  bu.subTree MirNode(kind: mnkScope):
-    body
+  bu.subTree mnkScope: discard
+  body
+  bu.subTree mnkEndScope: discard
 
 func allocTemp(bu: MirBuilder, t: TypeId; id: LocalId, alias: bool): Value =
   ## Allocates a new temporary or alias and returns it.
diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index dab8aa1a403..521ab83b15b 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -277,7 +277,7 @@ template subTree(c: var TCtx, n: MirNode, body: untyped) =
 
 template scope(c: var TCtx, body: untyped) =
   inc c.scopeDepth
-  c.builder.subTree mnkScope:
+  c.builder.scope:
     let prev = c.blocks.startScope()
     body
     c.blocks.closeScope(c.builder, prev, not c.unreachable)
@@ -2013,11 +2013,12 @@ proc genx(c: var TCtx, e: PMirExpr, i: int; fromMove = false) =
                 c.emitByVal val
     do:
       # the check:
-      c.buildStmt mnkScope:
-        c.subTree mnkVoid:
-          c.buildDefectMagicCall mChckObj, VoidType:
-            c.emitByVal val
-            c.emitByVal typeLit(c.typeToMir(n.check))
+      c.buildStmt mnkScope: discard
+      c.buildStmt mnkVoid:
+        c.buildDefectMagicCall mChckObj, VoidType:
+          c.emitByVal val
+          c.emitByVal typeLit(c.typeToMir(n.check))
+      c.buildStmt mnkEndScope: discard
 
     c.buildOp mnkPathConv, typ:
       c.use val
diff --git a/compiler/mir/mirpasses.nim b/compiler/mir/mirpasses.nim
index 8a75a1ef898..ab68eae6970 100644
--- a/compiler/mir/mirpasses.nim
+++ b/compiler/mir/mirpasses.nim
@@ -434,7 +434,7 @@ proc injectResultInit(tree: MirTree, resultTyp: TypeId, changes: var Changeset)
 
   if requiresInit(tree):
     assert tree[0].kind == mnkScope
-    let at = tree.child(NodePosition 0, 0)
+    let at = tree.sibling(NodePosition 0)
     changes.insert(tree, at, at, bu):
       bu.subTree mnkInit:
         bu.use toValue(mnkLocal, resultId, resultTyp)
@@ -451,14 +451,14 @@ proc injectProfilerCalls(tree: MirTree, graph: ModuleGraph, env: var MirEnv,
     prcId = env.procedures.add(graph.getCompilerProc("nimProfile"))
 
   # insert the entry call within the outermost scope:
-  changes.insert(tree, tree.child(NodePosition 0, 0), NodePosition 0, bu):
+  changes.insert(tree, tree.sibling(NodePosition 0), NodePosition 0, bu):
     bu.subTree mnkVoid:
       bu.buildCall prcId, VoidType:
         discard "no arguments"
 
   for i in search(tree, {mnkLoop}):
     # insert the call before the loop end:
-    changes.insert(tree, i - 1, i, bu):
+    changes.insert(tree, i, i, bu):
       bu.subTree mnkVoid:
         bu.buildCall prcId, VoidType:
           discard "no arguments"
diff --git a/compiler/mir/mirtrees.nim b/compiler/mir/mirtrees.nim
index dbd9efe2576..dc85592c4ce 100644
--- a/compiler/mir/mirtrees.nim
+++ b/compiler/mir/mirtrees.nim
@@ -213,9 +213,12 @@ type
               ## * syntactic statement node for representing void calls
               ## * statement acting as a use of the given lvalue
 
-    mnkScope  ## the only way to introduce a scope. Scopes can be nested and
-              ## dictate the lifetime of the locals that are directly enclosed
-              ## by them
+    mnkScope  ## starts a scope. Scopes delimit the lifetime of the locals
+              ## they enclose. Can be nested, but must always be paired with
+              ## exactly one ``mnkEndScope`` statement
+    mnkEndScope## closes the current scope. Must always be paired with a
+              ## ``mnkScope`` statement
+    # future direction: both mnkScope and mnkEndScope should become atoms
 
     mnkGoto   ## unconditional jump
     mnkIf     ## depending on the run-time value of `x`, transfers control-
@@ -354,7 +357,7 @@ const
   StmtNodes* = {mnkScope, mnkGoto, mnkIf, mnkCase, mnkLoop, mnkJoin,
                 mnkLoopJoin, mnkExcept, mnkFinally, mnkContinue, mnkEndStruct,
                 mnkInit, mnkAsgn, mnkSwitch, mnkVoid, mnkRaise, mnkDestroy,
-                mnkEmit, mnkAsm} + DefNodes
+                mnkEmit, mnkAsm, mnkEndScope} + DefNodes
     ## Nodes that are treated like statements, in terms of syntax.
 
   # --- semantics-focused sets:
diff --git a/compiler/mir/rtchecks.nim b/compiler/mir/rtchecks.nim
index 3eef32f9a0c..fd718dfd4a1 100644
--- a/compiler/mir/rtchecks.nim
+++ b/compiler/mir/rtchecks.nim
@@ -49,7 +49,7 @@ template subTree(bu; k: MirNodeKind, t: TypeId, body: untyped) =
 
 template buildIf(bu; cond: Value, body: untyped) =
   bu.buildIf (;bu.use(cond)):
-    bu.subTree mnkScope:
+    bu.scope:
       body
 
 template buildIfNot(bu; cond: Value, body: untyped) =
diff --git a/compiler/mir/utils.nim b/compiler/mir/utils.nim
index 293b7a02246..214ec768d17 100644
--- a/compiler/mir/utils.nim
+++ b/compiler/mir/utils.nim
@@ -519,9 +519,6 @@ proc renderNameWithType(tree: MirTree, i: var int, result: var string,
   result.add ": "
   typeToStr(result, n.typ, c.env)
 
-proc renderList(tree: MirTree, i: var int, indent: int, result: var string,
-                c: RenderCtx)
-
 proc stmtToStr(nodes: MirTree, i: var int, indent: var int, result: var string,
                c: RenderCtx) =
   template tree(str: string, body: untyped) =
@@ -529,12 +526,6 @@ proc stmtToStr(nodes: MirTree, i: var int, indent: var int, result: var string,
     result.add str
     body
 
-  template tab(body: untyped) =
-    ## Runs `body` with the indentation increased by 1.
-    inc indent
-    body
-    dec indent
-
   let n {.cursor.} = next(nodes, i)
   case n.kind
   of mnkDef:
@@ -601,9 +592,10 @@ proc stmtToStr(nodes: MirTree, i: var int, indent: var int, result: var string,
 
     inc indent
   of mnkScope:
-    tree "scope:\n":
-      tab:
-        renderList(nodes, i, indent, result, c)
+    tree "scope:\n": discard
+    inc indent
+  of mnkEndScope:
+    dec indent # just dedent
   of mnkIf:
     tree "if ":
       valueToStr()
diff --git a/compiler/sem/injectdestructors.nim b/compiler/sem/injectdestructors.nim
index 3402c21013b..44793eaa12d 100644
--- a/compiler/sem/injectdestructors.nim
+++ b/compiler/sem/injectdestructors.nim
@@ -207,6 +207,19 @@ iterator nodesWithScope(tree: MirTree): (NodePosition, lent MirNode, Slice[NodeP
   # the logic relies on the assumption that there exists a scope around
   # every 'def'
 
+  proc findScopeEnd(tree: MirTree, start: NodePosition): NodePosition =
+    ## Searches for the position of the ``mnkEndScope`` node for the current
+    ## scope.
+    var
+      i = start
+      depth = 0
+    while depth >= 0:
+      let kind = tree[i].kind
+      depth = depth + ord(kind == mnkScope) - ord(kind == mnkEndScope)
+      inc i
+
+    result = i - 1
+
   # XXX: profiling showed that a significant amount of time is spent in
   #      ``computeSpan`` and adding elements to the `scopeStack`. An approach
   #      where a scope's span is only computed when needed might be better
@@ -215,16 +228,15 @@ iterator nodesWithScope(tree: MirTree): (NodePosition, lent MirNode, Slice[NodeP
     of mnkScope:
       # start a new scope. The start and end node/token are not included in
       # the span
-      let span = computeSpan(tree, i)
-      scopeStack.add (span.a + 1)..(span.b - 1)
-    of mnkEnd:
-      if n.start == mnkScope:
-        # leave the current scope:
-        scopeStack.setLen(scopeStack.len - 1)
-        if scopeStack.len == 0:
-          # the following statements, if any, can only be joins, and those can
-          # safely be skipped here
-          break
+      let fin = findScopeEnd(tree, i + 1)
+      scopeStack.add tree.sibling(i)..(fin-1)
+    of mnkEndScope:
+      # leave the current scope:
+      scopeStack.setLen(scopeStack.len - 1)
+      if scopeStack.len == 0:
+        # the following statements, if any, can only be joins, and those can
+        # safely be skipped here
+        break
 
     else:
       yield (i, n, scopeStack[^1])
diff --git a/doc/mir.rst b/doc/mir.rst
index 7af9721f7e5..4b5fa82e18d 100644
--- a/doc/mir.rst
+++ b/doc/mir.rst
@@ -137,9 +137,10 @@ Semantics
   SHALLOW_SRC = RVALUE
               | VALUE
 
-  STATEMENT = Scope STATEMENT           # wrap the statement in a scope, which
+  STATEMENT = Scope                     # starts a new scope, which
                                         # delimits the lifetime of all
                                         # definitions within
+            | EndScope                  # close the current scope
             | Def NAME none             # definition
             | Def NAME ASGN_SRC         # definition + initial value assignment
             | DefCursor NAME            # definition of non-owning location

From 3c4cb3f1d3b651b6ffcd7ab4ee872c2cbc94eefe Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Tue, 4 Jun 2024 08:47:39 +0200
Subject: [PATCH 110/169] transf: remove unreachable code (#1329)

## Summary

Eliminate unreachable statements and expressions during `transf`,
instead of in `mirgen`. This:
* removes some workarounds from `mirgen`
* improves the quality of unreachable code elimination
* fixes a compiler crash related to non-returning expressions

## Details

Statement lists can have trailing unreachable code, and expressions can
therefore be non-returning (e.g., `(;break; 1)`).

`mirgen` made an attempt at eliminating both, but the approach used
was indirect and didn't handle expressions well, leading to crashes for
code such as `f((;return; var x = 0; 1), x)`, because the `var x`
definition wasn't translated, but the subsequent usage of `x` was.

Removing unreachable statements/expressions is now done by an AST-based
pass that runs after early `transf` (so that iterator inlining has
taken place and the AST is less complex) but before the `closureiters`
transformation. The pass is implemented by the `unreachable_elim`
module.

Beyond fixing the crashes, this has the additional benefits that:
* the `closureiters` transformation no longer has to take unreachable
  code into account
* `mirgen` can detect `finally` clauses that have no structured exit
  and emit better code for them. The handling for the no-structured-
  exit case already existed (`doesntExit`), just the detection was
  missing
* more straightforward MIR translation, using fewer conditionals

A test for the various possible scenarios of unreachable expressions/
statements is added.
---
 compiler/mir/mirgen.nim                       | 168 +++------
 compiler/modules/modulegraphs.nim             |   4 +
 compiler/sem/transf.nim                       |   6 +-
 compiler/sem/unreachable_elim.nim             | 341 ++++++++++++++++++
 .../lang_exprs/tnon_returning_expressions.nim | 188 ++++++++++
 5 files changed, 587 insertions(+), 120 deletions(-)
 create mode 100644 compiler/sem/unreachable_elim.nim
 create mode 100644 tests/lang_exprs/tnon_returning_expressions.nim

diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index 521ab83b15b..c124df345d4 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -157,11 +157,6 @@ type
       ## > 0 if the current statement/expression is part of a loop
     injectDestructors: bool
       ## whether injection of destroy operations is enabled
-    unreachable: bool
-      ## set to true when entering unreachable code (e.g., statements
-      ## immediately following a `break`). Disables:
-      ## * translation of AST
-      ## * emission of control-flow statements at block/scope end
 
     # input:
     userOptions: set[TOption]
@@ -193,21 +188,10 @@ proc isCursor(n: PNode): bool =
   else:
     false
 
-func endsInNoReturn(n: PNode): bool =
-  ## Tests and returns whether the simple or compound statement `n` ends in a
-  ## no-return statement
-
-  # TODO: this is a patched version of ``sem.endsInNoReturn`` that also
-  #       considers ``nkPragmaBlock``. Move this procedure somewhere common and
-  #       replace ``sem.endsInNoReturn`` with it
-  const SkipSet = {nkStmtList, nkStmtListExpr, nkPragmaBlock}
-  var it {.cursor.} = n
-  while it.kind in SkipSet and it.len > 0:
-    it = it.lastSon
-
-  result = it.kind in nkLastBlockStmts or
-    (it.kind in nkCallKinds and it[0].kind == nkSym and
-     sfNoReturn in it[0].sym.flags)
+template doesReturn(n: PNode): bool =
+  ## Returns whether `n` is a statement with a structured exit.
+  mixin c
+  n.typ != c.graph.noreturnType
 
 func initDestination(v: sink Value, isFirst, sink: bool): Destination =
   var flags: set[DestFlag]
@@ -275,12 +259,15 @@ template subTree(c: var TCtx, n: MirNode, body: untyped) =
   c.builder.subTree n:
     body
 
-template scope(c: var TCtx, body: untyped) =
+template scope(c: var TCtx, exits: bool, body: untyped) =
+  ## `exits` signals whether the body of the scope has a structured control-
+  ## flow exit.
+  let e = exits
   inc c.scopeDepth
   c.builder.scope:
     let prev = c.blocks.startScope()
     body
-    c.blocks.closeScope(c.builder, prev, not c.unreachable)
+    c.blocks.closeScope(c.builder, prev, e)
   dec c.scopeDepth
 
 template use(c: var TCtx, val: Value) =
@@ -808,10 +795,6 @@ proc genCall(c: var TCtx, n: PNode) =
     if kind == mnkCheckedCall:
       raiseExit(c)
 
-  # code following the call of a .noreturn routine is unreachable:
-  if n[0].kind == nkSym and sfNoReturn in n[0].sym.flags:
-    c.unreachable = true
-
 proc genMacroCallArgs(c: var TCtx, n: PNode, kind: TSymKind, fntyp: PType) =
   ## Generates the arguments for a macro/template call expression. `n` is
   ## expected to be a ``getAst`` expression that has been transformed to the
@@ -1309,8 +1292,6 @@ proc genRaise(c: var TCtx, n: PNode) =
       c.add MirNode(kind: mnkNone)
       raiseExit(c)
 
-  # code following a raise statement is unreachable:
-  c.unreachable = true
 
 proc genReturn(c: var TCtx, n: PNode) =
   assert n.kind == nkReturnStmt
@@ -1320,8 +1301,6 @@ proc genReturn(c: var TCtx, n: PNode) =
   c.buildStmt mnkGoto:
     blockExit(c.blocks, c.builder, 0)
 
-  c.unreachable = true
-
 proc genAsgnSource(c: var TCtx, e: PNode, status: set[DestFlag]) =
   ## Generates the MIR code for the right-hand side of an assignment.
   ## `status` provides the information necessary to decide what assignment
@@ -1362,12 +1341,9 @@ proc genAsgn(c: var TCtx, dest: Destination, rhs: PNode) =
     if dfEmpty in dest.flags: mnkInit
     else:                     mnkAsgn
 
-  let rhs = unwrap(c, rhs)
-  # the right-hand expression not returning needs to be accounted for
-  if not c.unreachable:
-    c.buildStmt kind:
-      c.use dest.val
-      c.genAsgnSource(rhs, dest.flags)
+  c.buildStmt kind:
+    c.use dest.val
+    c.genAsgnSource(rhs, dest.flags)
 
 proc genAsgn(c: var TCtx, isFirst, sink: bool, lhs, rhs: PNode) =
   ## Generates the code for an assignment. `isFirst` indicates if this is the
@@ -1383,10 +1359,6 @@ proc genAsgn(c: var TCtx, isFirst, sink: bool, lhs, rhs: PNode) =
     lhs = unwrap(c, lhs)
     sink = sink and not isCursor(lhs)
 
-  if c.unreachable:
-    # the left-hand expression terminates -> the assignment is dead code
-    return
-
   case rhs.kind
   of ComplexExprs:
     # optimization: forward the destination. For example:
@@ -1578,18 +1550,15 @@ proc genWhile(c: var TCtx, n: PNode) =
   let label = c.allocLabel()
   c.subTree mnkLoopJoin:
     c.add labelNode(label)
-  c.scope:
+  c.scope(doesReturn n[1]):
     inc c.inLoop
     c.gen(n[1])
     dec c.inLoop
   c.subTree mnkLoop:
     c.add labelNode(label)
-  # a while loop has no structured exit:
-  c.unreachable = true
 
 proc closeBlock(c: var TCtx) =
-  if c.blocks.closeBlock(c.builder):
-    c.unreachable = false
+  discard c.blocks.closeBlock(c.builder)
 
 template withBlock(c: var TCtx, k: BlockKind, body: untyped) =
   c.blocks.add Block(kind: k)
@@ -1607,7 +1576,7 @@ proc genBlock(c: var TCtx, n: PNode, dest: Destination) =
   c.blocks.add Block(kind: bkBlock, label: n[0].sym)
 
   # generate the body:
-  c.scope:
+  c.scope(doesReturn(n[1])):
     c.genWithDest(n[1], dest)
   c.closeBlock()
 
@@ -1623,11 +1592,7 @@ proc genBranch(c: var TCtx, n: PNode, dest: Destination) =
     gen(c, n)
 
 proc leaveBlock(c: var TCtx) =
-  ## Emits a goto for jumping to the exit of first enclosing block, but only
-  ## if not in an unreachable context.
-  if c.unreachable:
-    return # omit the leave actions if not reachable
-
+  ## Emits a goto for jumping to the exit of first enclosing block.
   if c.scopeDepth > 0:
     # only emit the early scope exit if still within a scope
     earlyExit(c.blocks, c.builder)
@@ -1635,7 +1600,16 @@ proc leaveBlock(c: var TCtx) =
   c.subTree mnkGoto:
     blockExit(c.blocks, c.builder, closest(c.blocks))
 
-  c.unreachable = true # code following a goto is unreachable
+proc genScopedBranch(c: var TCtx, n: PNode, dest: Destination,
+                     withLeave: bool) =
+  ## Translates `n`, wrapping it in a scope. If `withLeave` is true, a jump to
+  ## the exit of the enclosing block is emitted at the end.
+  let returns = doesReturn(n)
+  c.scope(returns and not withLeave):
+    c.genBranch(n, dest)
+    # the leave is only necessary when the statement/expression returns
+    if returns and withLeave:
+      leaveBlock(c)
 
 proc genIf(c: var TCtx, n: PNode, dest: Destination) =
   ## Generates the code for an ``if`` statement (``nkIf(Stmt|Expr)``). It's
@@ -1671,24 +1645,17 @@ proc genIf(c: var TCtx, n: PNode, dest: Destination) =
   let hasValue = not isEmptyType(n.typ)
   assert hasValue == dest.isSome
 
-  template genElifBranch(branch: PNode, extra: untyped) =
+  template genElifBranch(branch: PNode, withLeave: bool) =
     ## Generates the code for a single ``nkElif(Branch|Expr)``
-    c.scope:
+    c.scope(true):
       let v = genUse(c, branch[0])
       c.buildIf (c.use v;):
-        c.scope:
-          genBranch(c, branch.lastSon, dest)
-          extra
-
-      # if the start of the branch was reachable, then so is the code
-      # following the branch
-      c.unreachable = false
+        c.genScopedBranch(branch.lastSon, dest, withLeave)
 
   if n.len == 1:
     # an ``if`` statement/expression with a single branch. Don't wrap in a
     # block
-    genElifBranch(n[0]):
-      discard
+    genElifBranch(n[0], false)
 
   else:
     # a multi-clause ``if`` statement/expression
@@ -1697,14 +1664,11 @@ proc genIf(c: var TCtx, n: PNode, dest: Destination) =
         for it in n.items:
           case it.kind
           of nkElifBranch, nkElifExpr:
-            genElifBranch(it):
-              leaveBlock(c)
+            genElifBranch(it, true)
 
           of nkElse, nkElseExpr:
-            c.scope:
-              genBranch(c, it[0], dest)
-
-            # since this is the last branch, a 'break' is not needed
+            # since this is the last branch, a jump is not needed
+            c.genScopedBranch(it[0], dest, withLeave=false)
           else:
             unreachable(it.kind)
 
@@ -1745,10 +1709,7 @@ proc genCase(c: var TCtx, n: PNode, dest: Destination) =
   c.withBlock bkBlock:
     for (i, branch) in branches(n):
       c.join LabelId(firstLabel + uint32(i))
-      c.unreachable = false # every branch starts as reachable again
-      c.scope:
-        genBranch(c, branch.lastSon, dest)
-        leaveBlock(c)
+      c.genScopedBranch(branch.lastSon, dest, withLeave=true)
 
 proc genExceptBranch(c: var TCtx, n: PNode, label: LabelId,
                      next: Option[LabelId], dest: Destination) =
@@ -1756,9 +1717,6 @@ proc genExceptBranch(c: var TCtx, n: PNode, label: LabelId,
   c.builder.useSource(c.sp, n)
   let withFilter = n.len > 1
 
-  # the except branch is reachable:
-  c.unreachable = false
-
   c.subTree MirNode(kind: mnkExcept,
                     len: uint32(1 + (n.len - 1) + ord(withFilter))):
     c.add labelNode(label) # name of the except
@@ -1788,9 +1746,7 @@ proc genExceptBranch(c: var TCtx, n: PNode, label: LabelId,
 
   # generate the body of the except branch:
   c.withBlock bkExcept, label:
-    c.scope:
-      genBranch(c, n.lastSon, dest)
-      leaveBlock(c)
+    c.genScopedBranch(n.lastSon, dest, withLeave=true)
 
   c.subTree mnkEndStruct:
     c.add labelNode(label)
@@ -1820,14 +1776,13 @@ proc genFinally(c: var TCtx, n: PNode) =
     # the finally is never entered, omit it
     return
 
-  c.unreachable = false # the finally is reachable
   c.builder.useSource(c.sp, n)
   c.subTree mnkFinally:
     c.add labelNode(blk.id.unsafeGet)
 
   # translate the body:
   c.withBlock bkFinally, blk.id.unsafeGet:
-    c.scope:
+    c.scope(not blk.doesntExit):
       c.gen(n[^1])
 
   # the continue statement is always necessary, even if the body has no
@@ -1848,15 +1803,14 @@ proc genTry(c: var TCtx, n: PNode, dest: Destination) =
   if hasFinally:
     # the finally clause also applies to the except clauses, so it's
     # pushed first
-    c.blocks.add Block(kind: bkTryFinally)
+    c.blocks.add Block(kind: bkTryFinally,
+                       doesntExit: not doesReturn(n[^1][0]))
 
   if hasExcept:
     c.blocks.add Block(kind: bkTryExcept)
 
   # the body of the try:
-  c.scope:
-    c.genBranch(n[0], dest)
-    leaveBlock(c)
+  c.genScopedBranch(n[0], dest, withLeave=true)
 
   if hasExcept:
     genExcept(c, n, n.len - ord(hasFinally), dest)
@@ -1864,8 +1818,6 @@ proc genTry(c: var TCtx, n: PNode, dest: Destination) =
   if hasFinally:
     genFinally(c, n[^1])
 
-  # presume unreachable, closing the block will correct the presumption
-  c.unreachable = true
   c.closeBlock()
 
 proc genAsmOrEmitStmt(c: var TCtx, kind: range[mnkAsm..mnkEmit], n: PNode) =
@@ -2105,20 +2057,7 @@ proc genx(c: var TCtx, e: PMirExpr, i: int; fromMove = false) =
       for i in 0..<orig.len-1:
         gen(c, orig[i])
 
-    if c.unreachable:
-      # don't translate the expression if it's unreachable. The callsite still
-      # expects some expression, and thus a default-intialized temporary is
-      # used. Do note that the code is unreachable, and the assignment is thus
-      # never evaluated -- it's just there to uphold the callsite's syntactic
-      # expectations
-      # XXX: ideally, non-terminating statement list expressions should
-      #      have the trailing expression cut off and be turned into
-      #      ``nkStmtList`` nodes at an earlier stage
-      c.wrapAndUse typ:
-        c.buildMagicCall mDefault, typ:
-          discard
-    else:
-      recurse()
+    recurse()
   of pirComplex:
     # attempting to generate the code for a complex expression without a
     # destination specified -> assign the value resulting from it to a
@@ -2178,9 +2117,6 @@ proc genx(c: var TCtx, e: PMirExpr, i: int; fromMove = false) =
 
 proc gen(c: var TCtx, n: PNode) =
   ## Generates and emits the MIR code for the statement `n`
-  if c.unreachable:
-    return
-
   c.builder.useSource(c.sp, n)
 
   # because of ``.discardable`` calls, we can't require `n` to be of void
@@ -2215,8 +2151,6 @@ proc gen(c: var TCtx, n: PNode) =
   of nkBreakStmt:
     c.buildStmt mnkGoto:
       blockExit(c.blocks, c.builder, findBlock(c.blocks, n[0].sym))
-
-    c.unreachable = true # code following a break is unreachable
   of nkVarSection, nkLetSection:
     genVarSection(c, n)
   of nkAsgn:
@@ -2258,12 +2192,7 @@ proc gen(c: var TCtx, n: PNode) =
           c.builder.pop(f)
   of nkDiscardStmt:
     if n[0].kind != nkEmpty:
-      let n = unwrap(c, n[0])
-      if c.unreachable:
-        # don't translate the expression
-        return
-
-      let e = exprToPmir(c, n, false, false)
+      let e = exprToPmir(c, n[0], false, false)
       case classify(e)
       of Rvalue:
         discard toValue(c, e, e.high, mnkDefCursor)
@@ -2312,8 +2241,6 @@ proc genWithDest(c: var TCtx, n: PNode; dest: Destination) =
   ## assigning the resulting value to the given destination `dest`. `dest` can
   ## be 'none', in which case `n` is required to be a statement
   if dest.isSome:
-    assert not endsInNoReturn(n)
-
     case n.kind
     of ComplexExprs:
       genComplexExpr(c, n, dest)
@@ -2407,6 +2334,8 @@ proc generateCode*(graph: ModuleGraph, env: var MirEnv, owner: PSym,
                     owner.kind in routineKinds and
                     owner.typ[0] != nil and
                     hasDestructor(owner.typ[0]))
+    doesReturn = doesReturn(body)
+      ## whether the body "falls through"
 
   c.withBlock bkBlock: # the target for return statements
     if needsTerminate:
@@ -2417,7 +2346,7 @@ proc generateCode*(graph: ModuleGraph, env: var MirEnv, owner: PSym,
       # exits via an exception
       c.blocks.add Block(kind: bkTryFinally, errorOnly: true)
 
-    c.scope:
+    c.scope(doesReturn):
       if owner.kind in routineKinds:
         # the procedure backing a macro has its own internal signature; use that
         # beyond this point
@@ -2448,8 +2377,9 @@ proc generateCode*(graph: ModuleGraph, env: var MirEnv, owner: PSym,
     var isFirst = true
 
     if needsCleanup and (let b = c.blocks.pop(); b.id.isSome):
-      leaveBlock(c) # jump over the handler
-      isFirst = false
+      if doesReturn:
+        leaveBlock(c) # jump over the handler
+        isFirst = false
 
       # emit the finally section for cleaning up the result variable:
       c.subTree mnkFinally:
@@ -2463,7 +2393,7 @@ proc generateCode*(graph: ModuleGraph, env: var MirEnv, owner: PSym,
         c.add labelNode(b.id.unsafeGet)
 
     if needsTerminate and (let b = c.blocks.pop(); b.id.isSome):
-      if isFirst:
+      if doesReturn and isFirst:
         leaveBlock(c)
 
       # emit the handler for panicking on escaping exceptions:
@@ -2494,7 +2424,7 @@ proc exprToMir*(graph: ModuleGraph, env: var MirEnv,
     rtyp = c.typeToMir(e.typ)
     res = c.addLocal(Local(typ: rtyp)) # the result variable
   c.withBlock bkBlock:
-    c.scope:
+    c.scope(true):
       c.buildStmt mnkDef:
         c.use toValue(mnkLocal, res, rtyp)
         if e.typ.kind == tyTypeDesc:
diff --git a/compiler/modules/modulegraphs.nim b/compiler/modules/modulegraphs.nim
index 5178b765774..feb901afa0f 100644
--- a/compiler/modules/modulegraphs.nim
+++ b/compiler/modules/modulegraphs.nim
@@ -139,6 +139,9 @@ type
     passes*: seq[TPass]
     idgen*: IdGenerator
     operators*: Operators
+    noreturnType*: PType
+      ## special type used for marking statements as not returning. Currently
+      ## only used in the mid-end
     when defined(nimsuggest):
       onMarkUsed*: SuggestCallback
         ## callback decouples regular compiler code `markUsed` from suggest
@@ -522,6 +525,7 @@ proc newModuleGraph*(cache: IdentCache; config: ConfigRef): ModuleGraph =
   result.symBodyHashes = initTable[int, SigHash]()
   result.operators = initOperators(result)
   result.emittedTypeInfo = initTable[string, FileIndex]()
+  result.noreturnType = newType(tyVoid, nextTypeId(result.idgen), nil)
 
 proc resetAllModules*(g: ModuleGraph) =
   initStrTable(g.packageSyms)
diff --git a/compiler/sem/transf.nim b/compiler/sem/transf.nim
index 7ece383092f..3ad578457d7 100644
--- a/compiler/sem/transf.nim
+++ b/compiler/sem/transf.nim
@@ -42,7 +42,8 @@ import
     closureiters,
     semfold,
     lambdalifting,
-    lowerings
+    lowerings,
+    unreachable_elim
   ],
   compiler/backend/[
     cgmeth
@@ -1433,6 +1434,7 @@ proc transformBody*(g: ModuleGraph, idgen: IdGenerator, prc: PSym, body: PNode):
   (result, c.env) = liftLambdas(g, prc, body, c.idgen)
   result = processTransf(c, result, prc)
   liftDefer(c, result)
+  result = eliminateUnreachable(g, result)
 
   if prc.isIterator:
     result = g.transformClosureIterator(c.idgen, prc, result)
@@ -1479,6 +1481,7 @@ proc transformStmt*(g: ModuleGraph; idgen: IdGenerator; module: PSym, n: PNode):
     var c = PTransf(graph: g, module: module, idgen: idgen)
     result = processTransf(c, n, module)
     liftDefer(c, result)
+    result = eliminateUnreachable(g, result)
     #result = liftLambdasForTopLevel(module, result)
     incl(result.flags, nfTransf)
 
@@ -1489,6 +1492,7 @@ proc transformExpr*(g: ModuleGraph; idgen: IdGenerator; module: PSym, n: PNode):
     var c = PTransf(graph: g, module: module, idgen: idgen)
     result = processTransf(c, n, module)
     liftDefer(c, result)
+    result = eliminateUnreachable(g, result)
     # expressions are not to be injected with destructor calls as that
     # the list of top level statements needs to be collected before.
     incl(result.flags, nfTransf)
diff --git a/compiler/sem/unreachable_elim.nim b/compiler/sem/unreachable_elim.nim
new file mode 100644
index 00000000000..ed7fd2f8344
--- /dev/null
+++ b/compiler/sem/unreachable_elim.nim
@@ -0,0 +1,341 @@
+## Implements elimination of unreachable statements and expressions within an
+## AST already processed by early ``transf``. The transformation makes sure
+## that a non-returning statement is not immediately followed by other code.
+##
+## For example, for:
+##
+## .. code-block:: nim
+##
+##   return 1
+##   echo "a"
+##
+## The ``echo`` statement needs to be removed. This makes further processing
+## easier, since detecting whether a block of code returns is now possible by
+## inspecting just the trailing AST node.
+##
+## For later inspection, all non-returning statements (such as break, return,
+## etc.) have ``noreturnType`` assigned as the type.
+
+import
+  compiler/ast/[
+    ast_types,
+    ast_query,
+    ast,
+    trees,
+    wordrecg
+  ],
+  compiler/modules/[
+    modulegraphs
+  ],
+  compiler/utils/[
+    idioms
+  ]
+
+type
+  PassContext = object
+    blocks: seq[tuple[label: PSym, used: bool]]
+    voidType: PType
+
+iterator mitems(x: PNode): var PNode =
+  for i in 0..<x.len:
+    yield x[i]
+
+iterator mpairs(x: PNode): (int, var PNode) =
+  for i in 0..<x.len:
+    yield (i, x[i])
+
+func doesntReturn(c: PassContext, n: PNode): bool =
+  n.typ == c.voidType
+
+proc process(c: var PassContext, n: PNode): PNode =
+  ## Transforms a single tree layer. The AST is mutated in-place, and the
+  ## transformed node is returned.
+  ##
+  ## For signaling that the statement/expression doesn't return, it has the
+  ## 'void' type assigned to it; non-returning expressions are turned into
+  ## statements.
+  template recurse(n: PNode): PNode =
+    process(c, n)
+
+  template doesntReturn(n: PNode): bool =
+    doesntReturn(c, n)
+
+  case n.kind
+  of nkWithoutSons, nkSymChoices, nkNimNodeLit:
+    result = n # nothing to do
+  of nkCast, nkHiddenStdConv, nkHiddenSubConv, nkConv:
+    # single operand expressions with the operand in the second slot
+    let x = recurse(n[1])
+    if doesntReturn(x):
+      result = x
+    else:
+      result = n
+      result[1] = x
+
+  of nkHiddenAddr, nkAddr, nkHiddenDeref, nkDerefExpr, nkStringToCString,
+     nkCStringToString, nkObjDownConv, nkObjUpConv, nkCheckedFieldExpr,
+     nkReturnStmt, nkDiscardStmt, nkYieldStmt, nkRaiseStmt:
+    # statements and expressions where only the first operand is relevant
+    let x = recurse(n[0])
+    if doesntReturn(x):
+      result = x
+    else:
+      result = n
+      result[0] = x
+
+      if n.kind in {nkReturnStmt, nkRaiseStmt}:
+        # mark as noreturn
+        result.typ = c.voidType
+  of nkAsgn, nkFastAsgn, nkBracketExpr, nkDotExpr, nkRange:
+    # statements/expressions with two operands
+    let lhs = recurse(n[0])
+    if doesntReturn(lhs):
+      result = lhs
+    else:
+      let rhs = recurse(n[1])
+      if doesntReturn(rhs):
+        result = nkStmtList.newTreeIT(n.info, c.voidType,
+          nkDiscardStmt.newTreeI(lhs.info, lhs),
+          rhs)
+      else:
+        result = n
+        result[0] = lhs
+        result[1] = rhs
+  of nkStmtList:
+    result = n
+    for i, it in result.mpairs:
+      it = recurse(it)
+      if doesntReturn(it):
+        result.sons.setLen(i + 1)
+        result.typ = c.voidType
+        return
+
+  of nkStmtListExpr:
+    result = n
+    for i in 0..<n.len-1:
+      result[i] = recurse(n[i])
+      if doesntReturn(result[i]):
+        result.transitionSonsKind(nkStmtList)
+        # cut off the remaining statements
+        result.sons.setLen(i + 1)
+        result.typ = c.voidType
+        return
+
+    result[^1] = recurse(n[^1])
+    if doesntReturn(result[^1]):
+      # ends in a statement
+      result.transitionSonsKind(nkStmtList)
+      result.typ = c.voidType
+  of nkCallKinds, nkBracket, nkCurly, nkClosure, nkTupleConstr, nkChckRange,
+     nkChckRange64, nkChckRangeF, nkAsmStmt:
+    # some call-like operation with left-to-right evaluation. If an operand
+    # doesn't return, the remaining operands plus the operation itself are
+    # removed
+    for i, it in n.mpairs:
+      # destructively omit the expr-colon-expr; it's not needed beyond this
+      # point anyway
+      it = recurse(it.skipColon)
+      if doesntReturn(it):
+        result = n
+        result.transitionSonsKind(nkStmtList)
+        result.typ = c.voidType
+        # cut off the remaining expressions/statements; they're dead code
+        result.sons.setLen(i + 1)
+        # turn the expressions so far into statements by wrapping them in a
+        # 'discard' statement
+        for i in 0..<i:
+          # the argument might be a 'void' (unit, really) expression, no
+          # discard must be used then
+          if result[i].typ != nil:
+            result[i] = newTreeI(nkDiscardStmt, n.info, result[i])
+
+        return
+
+    result = n
+    if result.kind in nkCallKinds and result[0].kind == nkSym and
+       result[0].sym.kind in routineKinds and
+       sfNoReturn in result[0].sym.flags:
+      # calls to noreturn procedures don't return
+      result.typ = c.voidType
+  of nkObjConstr:
+    # similar to the call-like handling; ``n[i][1]`` is a field's value operand
+    for i in 1..<n.len:
+      n[i][1] = recurse(n[i][1])
+      if doesntReturn(n[i][1]):
+        # discard the operands so far and keep the non-returning terminator:
+        result = newNodeIT(nkStmtList, n.info, c.voidType, i)
+        for j in 1..<i:
+          result[j - 1] = newTreeI(nkDiscardStmt, n[j][1].info, n[j][1])
+        result[i - 1] = n[i][1] # must stay; it is what makes the list noreturn
+        return
+    result = n
+  of nkLetSection, nkVarSection:
+    for i, it in n.pairs:
+      assert it.kind in {nkIdentDefs, nkVarTuple}
+      let rhs = recurse(it[^1])
+      if doesntReturn(rhs):
+        if i == 0:
+          return rhs # discard the rest
+        else:
+          # cut off the identdefs past and including the current one
+          n.sons.setLen(i)
+          # wrap the section in a statement list and append the non-returning
+          # expression
+          result = newTreeIT(nkStmtList, n.info, c.voidType, n, rhs)
+          return
+
+    result = n
+  of nkBlockExpr, nkBlockStmt:
+    c.blocks.add (n[0].sym, false) # push a new block
+    let body = recurse(n[1])
+    let info = c.blocks.pop() # pop the block again
+
+    result = n
+    if doesntReturn(body):
+      # it's a statement
+      result.transitionSonsKind(nkBlockStmt)
+      if not info.used:
+        # the block is never broken out of and the body doesn't return -> the
+        # block doesn't return
+        result.typ = c.voidType
+
+    result[1] = body
+  of nkIfExpr, nkIfStmt:
+    result = n
+    var exits = 0 ## number of branches that return
+    for i, it in result.pairs:
+      case it.kind
+      of nkElifBranch, nkElifExpr:
+        let cond = recurse(it[0])
+        if doesntReturn(cond):
+          # the condition expression doesn't return; everything that follows
+          # is dead code
+          if i == 0:
+            return cond
+          else:
+            # turn into an else branch and cut off the remaining branches
+            result[i] = newTreeI(nkElse, cond.info, cond)
+            result.sons.setLen(i + 1)
+            break
+
+        it[1] = recurse(it[1])
+        exits += ord(not doesntReturn(it[1]))
+      of nkElse, nkElseExpr:
+        it[0] = recurse(it[0])
+        exits += ord(not doesntReturn(it[0]))
+      else:
+        unreachable(it.kind)
+
+    if exits == 0 and result[^1].kind in {nkElse, nkElseExpr}:
+      # exhaustive 'if' statement/expression and no branch returns -> it's a
+      # noreturn statement
+      result.transitionSonsKind(nkIfStmt)
+      result.typ = c.voidType
+  of nkCaseStmt:
+    let x = recurse(n[0])
+    if doesntReturn(x):
+      return x # the body is dead code
+
+    result = n
+    result[0] = x
+
+    # process all branches and count the number of exits:
+    var exits = 0
+    for i in 1..<n.len:
+      result[i][^1] = recurse(n[i][^1])
+      exits += ord(not doesntReturn(result[i][^1]))
+
+    if exits == 0:
+      # none of the branches return -> the case doesn't return
+      result.typ = c.voidType
+  of nkTryStmt, nkHiddenTryStmt:
+    result = n
+    var exits = 0
+    for it in result.mitems:
+      case it.kind
+      of nkExceptBranch:
+        it[^1] = recurse(it[^1])
+        exits += ord(not doesntReturn(it[^1]))
+      of nkFinally:
+        it[0] = recurse(it[0])
+      else:
+        # must be the main body
+        it = recurse(it)
+        exits += ord(not doesntReturn(it))
+
+    if exits == 0 or
+       (result[^1].kind == nkFinally and doesntReturn(result[^1][0])):
+      # the try/except or intercepting finally doesn't exit
+      result.typ = c.voidType
+  of nkWhileStmt:
+    result = n
+    result[^1] = recurse(n[1])
+    result.typ = c.voidType # ``while true`` statements never return
+  of nkBreakStmt:
+    # mark the break target as being broken out of:
+    for it in c.blocks.mitems:
+      if it.label.id == n[0].sym.id:
+        it.used = true
+        break
+
+    result = n
+    result.typ = c.voidType # mark as noreturn
+  of nkWhenStmt:
+    result = n
+    # process both branches of the ``when nimvm`` statement/expression
+    result[0][1] = recurse(n[0][1])
+    result[1][0] = recurse(n[1][0])
+    if doesntReturn(result[0][1]) and doesntReturn(result[1][0]):
+      # if both branches don't return, neither does the 'when'
+      result.typ = c.voidType
+    # XXX: if only one branch doesn't return, collapsing the 'when' to the
+    #      one that doesn't results in the unreachable code persisting
+  of nkPragmaBlock:
+    result = n
+    result[1] = recurse(n[1])
+    if doesntReturn(result[1]):
+      result.typ = c.voidType
+  of nkPragma:
+    # the emit pragma can contain run-time code... An emit statement is
+    # treated like a call: if one operand is a non-returning expression, the
+    # emitted code is never reached, and the would-be emitted code can be elided
+    # XXX: the logic here could be simpler if emit pragma statements had a more
+    #      regular shape at this point (e.g., a single pragma per list)
+    for pIndex, it in n.pairs:
+      case whichPragma(it)
+      of wEmit:
+        # process all operands:
+        let args = it[1]
+        for i, x in args.mpairs:
+          x = recurse(x)
+          if doesntReturn(x):
+            # remove the emit pragma and remaining pragmas from the pragma
+            # list:
+            n.sons.setLen(pIndex)
+
+            let stmts = newNodeIT(nkStmtList, args.info, c.voidType, i + 1)
+            # wrap the previous operands in discard statements:
+            for j in 0..<i:
+              stmts[j] = newTreeI(nkDiscardStmt, args[j].info, args[j])
+            # assign the terminal expression and combine with the pragma:
+            stmts[i] = x
+            return newTreeIT(nkStmtList, n.info, c.voidType, n, stmts)
+
+      else:
+        discard
+
+    result = n
+  of callableDefs, nkConstSection, nkTypeSection, nkBindStmt, nkMixinStmt,
+     nkIncludeStmt, nkImportStmt, nkImportExceptStmt, nkFromStmt, nkExportStmt,
+     nkExportExceptStmt, nkTypeOfExpr:
+    # ignore declarative statements
+    result = n
+  else:
+    unreachable(n.kind)
+
+proc eliminateUnreachable*(graph: ModuleGraph, n: PNode): PNode =
+  ## Entry point into the pass. Removes all unreachable statements/expressions,
+  ## making sure that a non-returning statement is always the last statement
+  ## in a block of code.
+  var c = PassContext(voidType: graph.noreturnType)
+  result = process(c, n)
diff --git a/tests/lang_exprs/tnon_returning_expressions.nim b/tests/lang_exprs/tnon_returning_expressions.nim
new file mode 100644
index 00000000000..2ad4cc92d30
--- /dev/null
+++ b/tests/lang_exprs/tnon_returning_expressions.nim
@@ -0,0 +1,188 @@
+discard """
+  description: '''
+    Ensure that the compiler can correctly handle all forms of:
+    * expression that don't return
+    * statements that don't return
+  '''
+  targets: c js vm
+"""
+
+proc noret() {.noreturn.} =
+  raise CatchableError.newException("")
+
+# ------------------------------
+# establish that the basics work
+
+proc testBreak() =
+  block:
+    var x = (;break; 1)
+    doAssert false
+
+testBreak()
+
+proc testReturn() =
+  var x = (;return; 1)
+  doAssert false
+
+testReturn()
+
+proc testRaise() =
+  var x = (;raise CatchableError.newException(""); 1)
+  doAssert false
+
+try: testRaise() except: discard
+
+proc testNoreturnCall() =
+  var x = (noret(); 1)
+  doAssert false
+
+try: testNoreturnCall() except: discard
+
+# ----------
+# statements
+
+template testStmt(body: untyped) =
+  # provides the fixture for testing statements
+  proc p(): int {.gensym.} =
+    body
+    doAssert false
+  discard p()
+
+proc call(a, b: int) = discard
+
+# callee:
+testStmt: (;return; call)(1, 2)
+# arguments:
+testStmt: call((;return; 1), 2)
+testStmt: call((;return; var val = 0; 1), val)
+
+# ------------------------------------
+# complex statements that don't return
+
+# discard operand doesn't return:
+testStmt:
+  discard (;return; 1)
+
+# raise operand doesn't return:
+testStmt:
+  raise (;return; CatchableError.newException(""))
+
+# first definition doesn't return:
+testStmt:
+  let
+    x = (;return; var a = 2; 1)
+    y = a
+
+# second (non-trailing) definition doesn't return:
+testStmt:
+  let
+    x = 1
+    y = (;return; var a = 3; 2)
+    z = a
+
+# lhs in assignment doesn't return:
+testStmt:
+  var x = 0
+  (;return; var y = 1; x) = y
+
+# rhs in assignment doesn't return:
+testStmt:
+  var x = 0
+  x = (;return; 1)
+
+# condition expression in if doesn't return:
+testStmt:
+  let x = 1
+  if (;return; x == 1):
+    doAssert false
+
+# condition in trailing elif-branch doesn't return:
+testStmt:
+  let x = 2
+  if x == 1:
+    doAssert false
+  elif (;return; x == 2):
+    doAssert false
+
+# case statement selector expression doesn't return
+testStmt:
+  let x = 1
+  case (;return; x)
+  of 1:
+    doAssert false
+  else:
+    doAssert false
+
+when defined(c):
+  block:
+    var value = 0
+    testStmt:
+      {.emit: "`value` = 1;", emit: [value, "=", (;return; 2)].}
+
+    # make sure the first emitted statement was evaluated:
+    doAssert value == 1
+
+
+# -----------
+# expressions
+
+template testExpr(body: untyped) =
+  # provides the fixture for testing expressions
+  proc p() {.gensym.} =
+    let x = body
+    doAssert false
+  p()
+
+var global = 0
+
+proc effect(): int =
+  # effectful procedure
+  inc global
+  result = 1
+
+template testExprWithEffect(expect: int, body: untyped) =
+  # provides the fixture for testing expressions where some side-effect needs
+  # to be computed (or not)
+  global = 0
+  testExpr: body
+  doAssert global == expect
+
+type Obj = object
+  a, b, c: int
+
+# construction expressions:
+testExprWithEffect 0:
+  [(;return; var val = 0; 1), val, effect()]
+testExprWithEffect 0:
+  ((;return; var val = 0; 1), val, effect())
+testExprWithEffect 0:
+  Obj(a: (;return; var val = 0; 1), b: val, c: effect())
+
+# cast:
+testExprWithEffect 0:
+  cast[int]((;return; effect()))
+
+# conversion:
+testExprWithEffect 0:
+  int((;return; effect()))
+
+# object field access:
+testExpr:
+  let o = Obj(a: 1)
+  (;return; o).a
+
+# tuple field access:
+testExpr:
+  let t = (1, 2)
+  (;return; t)[0]
+
+# array operand expression doesn't return:
+testExprWithEffect 0:
+  var s = @[0, 1]
+  (;return; s)[effect()]
+
+# index operand expression doesn't return:
+testExprWithEffect 1:
+  var s = @[1, 2]
+  # the array operand must still be evaluated for side-effects
+  (;discard effect(); s)[(;return; 1)]

From 6b84b42c2811de87b6204acb41d93f312e24ad9b Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Tue, 4 Jun 2024 06:48:49 +0000
Subject: [PATCH 111/169] build(deps): Bump dawidd6/action-download-artifact
 from 3.1.4 to 4 (#1332)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bumps

[dawidd6/action-download-artifact](https://github.com/dawidd6/action-download-artifact)
from 3.1.4 to 4.
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a

href="https://github.com/dawidd6/action-download-artifact/releases">dawidd6/action-download-artifact's
releases</a>.</em></p>
<blockquote>
<h2>v4</h2>
<h2>What's Changed</h2>
<ul>
<li><strong>VERSIONING CHANGE</strong>: now there will only be major
releases of this action, e.g. v5, v6 and so on</li>
<li>build(deps): bump undici from 5.28.3 to 5.28.4 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/dawidd6/action-download-artifact/pull/284">dawidd6/action-download-artifact#284</a></li>
<li>build(deps): bump <code>@​actions/artifact</code> from 2.1.4 to
2.1.5 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/dawidd6/action-download-artifact/pull/285">dawidd6/action-download-artifact#285</a></li>
<li>build(deps): bump <code>@​actions/artifact</code> from 2.1.5 to
2.1.7 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/dawidd6/action-download-artifact/pull/287">dawidd6/action-download-artifact#287</a></li>
<li>build(deps): bump adm-zip from 0.5.12 to 0.5.13 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/dawidd6/action-download-artifact/pull/289">dawidd6/action-download-artifact#289</a></li>
<li>Set allow_forks to false by default by <a
href="https://github.com/timweri"><code>@​timweri</code></a> in <a

href="https://redirect.github.com/dawidd6/action-download-artifact/pull/290">dawidd6/action-download-artifact#290</a></li>
</ul>
<h2>New Contributors</h2>
<ul>
<li><a href="https://github.com/timweri"><code>@​timweri</code></a> made
their first contribution in <a

href="https://redirect.github.com/dawidd6/action-download-artifact/pull/290">dawidd6/action-download-artifact#290</a></li>
</ul>
<p><strong>Full Changelog</strong>: <a

href="https://github.com/dawidd6/action-download-artifact/compare/v3...v4">https://github.com/dawidd6/action-download-artifact/compare/v3...v4</a></p>
</blockquote>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a

href="https://github.com/dawidd6/action-download-artifact/commit/854e2de9396304899dbe03bf9995fd73533190d1"><code>854e2de</code></a>
Set allow_forks to false by default (<a

href="https://redirect.github.com/dawidd6/action-download-artifact/issues/290">#290</a>)</li>
<li><a

href="https://github.com/dawidd6/action-download-artifact/commit/436c9d3774019b3e2789d7332e9c4efdba3d9d79"><code>436c9d3</code></a>
build(deps): bump adm-zip from 0.5.12 to 0.5.13 (<a

href="https://redirect.github.com/dawidd6/action-download-artifact/issues/289">#289</a>)</li>
<li><a

href="https://github.com/dawidd6/action-download-artifact/commit/14040524bb7e51dee9683e2e755e0d562621a1d5"><code>1404052</code></a>
build(deps): bump <code>@​actions/artifact</code> from 2.1.5 to 2.1.7
(<a

href="https://redirect.github.com/dawidd6/action-download-artifact/issues/287">#287</a>)</li>
<li><a

href="https://github.com/dawidd6/action-download-artifact/commit/8a9be734dc508dcf8d67c27ba3f727b0d682ccb0"><code>8a9be73</code></a>
build(deps): bump <code>@​actions/artifact</code> from 2.1.4 to 2.1.5
(<a

href="https://redirect.github.com/dawidd6/action-download-artifact/issues/285">#285</a>)</li>
<li><a

href="https://github.com/dawidd6/action-download-artifact/commit/df593bbd0462b45b479f042d043c3aa47fe1c483"><code>df593bb</code></a>
build(deps): bump undici from 5.28.3 to 5.28.4 (<a

href="https://redirect.github.com/dawidd6/action-download-artifact/issues/284">#284</a>)</li>
<li>See full diff in <a

href="https://github.com/dawidd6/action-download-artifact/compare/v3.1.4...v4">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility

score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=dawidd6/action-download-artifact&package-manager=github_actions&previous-version=3.1.4&new-version=4)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase` .

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 .github/workflows/publisher.yml | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/.github/workflows/publisher.yml b/.github/workflows/publisher.yml
index 625cb2aa20a..2cefb2699d7 100644
--- a/.github/workflows/publisher.yml
+++ b/.github/workflows/publisher.yml
@@ -30,7 +30,7 @@ jobs:
 
       # Download the latest instance of artifacts from a build done previously
       - name: Download generated docs
-        uses: dawidd6/action-download-artifact@v3.1.4
+        uses: dawidd6/action-download-artifact@v4
         with:
           workflow: ci.yml
           workflow_conclusion: success
@@ -40,7 +40,7 @@ jobs:
           path: doc/html
 
       - name: Download generated source archive
-        uses: dawidd6/action-download-artifact@v3.1.4
+        uses: dawidd6/action-download-artifact@v4
         with:
           workflow: ci.yml
           workflow_conclusion: success
@@ -50,7 +50,7 @@ jobs:
           path: release-staging
 
       - name: Download generated release binaries
-        uses: dawidd6/action-download-artifact@v3.1.4
+        uses: dawidd6/action-download-artifact@v4
         with:
           workflow: ci.yml
           workflow_conclusion: success
@@ -61,7 +61,7 @@ jobs:
           path: release-staging
 
       - name: Download release manifest tool
-        uses: dawidd6/action-download-artifact@v3.1.4
+        uses: dawidd6/action-download-artifact@v4
         with:
           workflow: ci.yml
           workflow_conclusion: success

From 55a988e5509502d155b237ebb13928d1ec26ccaa Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Fri, 7 Jun 2024 18:32:51 +0200
Subject: [PATCH 112/169] fix(sem): generic distinct types getting the same
 hooks (#1335)

## Summary

Fix instantiating a generic distinct type with generic parameters not
used in the body not resulting in a unique type internally, resulting
in all instances thereof sharing the very same generic hook
instantiations.

## Details

There were two issues in `semtypinst`:
1. no new type instance was created for `tyDistinct` types when there
   are no generic parameters used in the body
2. no new symbol was created for the `tyDistinct` when instantiating
   it

As a consequence of point 1, `sameType` and `hashType` treated the
instantiated `tyDistinct` types as being the same. `hashType` is used
by hook lifting for fetching the canonical type, so all `tyDistinct`
types resulting from a generic type with phantom type information got
the same set of hooks.

For point 2, the consequence was that the symbol for instantiated
generic distinct types always pointed to the original `tyGenericBody`,
not the instantiated type.

Same as with `tyObject` types (which are also nominal types), a new
`tyDistinct` instance is always created during instantiation, and a new
symbol is created for it.

### Tests

* the `tphantom_distinct_hooks` test is added, which is largely a copy
  of `tphantom_object_hooks`
* the `tphantom_distinct_types` typerel test is added for preventing
  future regressions. It already succeeded previously
---
 compiler/sem/liftdestructors.nim              |  5 ++-
 compiler/sem/semtypinst.nim                   | 12 +++++++
 .../destructor/tphantom_distinct_hooks.nim    | 36 +++++++++++++++++++
 tests/typerel/tphantom_distinct_types.nim     | 26 ++++++++++++++
 4 files changed, 76 insertions(+), 3 deletions(-)
 create mode 100644 tests/lang_objects/destructor/tphantom_distinct_hooks.nim
 create mode 100644 tests/typerel/tphantom_distinct_types.nim

diff --git a/compiler/sem/liftdestructors.nim b/compiler/sem/liftdestructors.nim
index bb5e6ce798a..202f532eb6c 100644
--- a/compiler/sem/liftdestructors.nim
+++ b/compiler/sem/liftdestructors.nim
@@ -976,12 +976,11 @@ proc createTypeBoundOps(g: ModuleGraph; c: PContext; orig: PType; info: TLineInf
   if isEmptyContainer(skipped) or skipped.kind == tyStatic: return
 
   var canon: PType
-  if skipped.kind == tyObject:
+  if skipped.kind in {tyObject, tyDistinct}:
     # for nominal types, the type itself is already the canonical one (each one
     # is unique)
     # XXX: ^^ at present, this is only true for object types. Phantom
-    #      ``tyDistinct`` and ``tyEnum`` types still don't have unique
-    #      instances
+    #      ``tyEnum`` types still don't have unique instances
     canon = skipped
   else:
     # structural types use canonicalization
diff --git a/compiler/sem/semtypinst.nim b/compiler/sem/semtypinst.nim
index f27329caf1c..406bc57ec12 100644
--- a/compiler/sem/semtypinst.nim
+++ b/compiler/sem/semtypinst.nim
@@ -537,6 +537,18 @@ proc instantiate(cl: var TReplTypeVars, t: PType): PType =
 
     if cl.c.computeRequiresInit(cl.c, result):
       result.flags.incl tfRequiresInit
+  of tyDistinct:
+    # same as with object types, create a new type instance even if the body
+    # doesn't change during instantiation
+    result = instCopyType(cl, t)
+    result[0] = replaceTypeVarsT(cl, t[0])
+
+    # the type also needs a proper symbol
+    result.sym = copySym(t.sym, nextSymId cl.c.idgen)
+    result.sym.flags.incl sfFromGeneric
+    result.sym.owner = t.sym
+    result.sym.ast = t.sym.ast
+    result.sym.typ = result
   else:
     # XXX: these types also need new symbols...
     result = replaceTypeVarsT(cl, t)
diff --git a/tests/lang_objects/destructor/tphantom_distinct_hooks.nim b/tests/lang_objects/destructor/tphantom_distinct_hooks.nim
new file mode 100644
index 00000000000..8a6fe994ba8
--- /dev/null
+++ b/tests/lang_objects/destructor/tphantom_distinct_hooks.nim
@@ -0,0 +1,36 @@
+discard """
+  description: '''
+    Ensure that phantom distinct types can use generic hooks, and that every
+    instance gets its own instantiations thereof
+  '''
+  targets: "c js vm"
+  matrix: "--cursorInference:off"
+"""
+
+type
+  Phantom[T] = distinct int
+
+var trace: seq[string]
+
+proc `=copy`[T](x: var Phantom[T], y: Phantom[T]) =
+  trace.add("copy " & $T)
+
+proc `=sink`[T](x: var Phantom[T], y: Phantom[T]) =
+  trace.add("sink " & $T)
+
+proc `=destroy`[T](x: var Phantom[T]) =
+  trace.add("destroy " & $T)
+
+proc test[T](a: sink Phantom[T] = default(Phantom[T])) =
+  var x: Phantom[T]
+  x = a # copies
+  x = a # sinks
+  # `x` is destroyed
+
+test[int]()
+test[float]()
+
+# make sure that both types got their own hook instantiations
+doAssert trace == ["copy int", "sink int", "destroy int",
+                   "copy float", "sink float", "destroy float"],
+         $trace
diff --git a/tests/typerel/tphantom_distinct_types.nim b/tests/typerel/tphantom_distinct_types.nim
new file mode 100644
index 00000000000..9eda7848764
--- /dev/null
+++ b/tests/typerel/tphantom_distinct_types.nim
@@ -0,0 +1,26 @@
+discard """
+  description: '''
+    Ensure that instantiating a generic distinct type where the generic
+    parameter is not used in the body yields distinct types for different
+    parameters
+  '''
+  action: compile
+"""
+
+type
+  TypeA[T] = distinct T
+  TypeB[T] = distinct int
+
+static:
+  doAssert TypeA[int] is    TypeA[int]
+  # make sure two separate generic types result in distinct instances:
+  doAssert TypeA[int] isnot TypeB[int]
+  doAssert TypeB[int] isnot TypeA[int]
+
+  # try with a different parameter type:
+  doAssert TypeA[float] is    TypeA[float]
+  doAssert TypeA[float] isnot TypeB[float]
+  doAssert TypeB[float] isnot TypeA[float]
+
+  # ensure that different parameters result in different types:
+  doAssert TypeA[int] isnot TypeA[float]

From 270b34c94456f401dba9ffd11556867b47bbe2c4 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Fri, 7 Jun 2024 22:20:57 +0200
Subject: [PATCH 113/169] macros: fix compiler crash with `parseExpr` (#1339)

## Summary

Fix a bug with `parseExpr` error handling that caused a compiler crash
when:
* an empty string was passed as the argument
* parsing the string returned more than one statement block

## Details

A `SemReport` was used instead of the correct `VMReport`. Since
`rvmOpcParseExpectedExpression` is not a valid report kind for
`SemReport`, the assertion in `wrap` failed and the compiler crashed.

The `ttryparseexpr` test is cleaned up and extended with two test cases
for the cases that trigger the "expected expression" case, ensuring
that the previously faulty branch now has test coverage.
---
 compiler/vm/vm.nim                           |  4 ++--
 tests/lang_callable/macros/ttryparseexpr.nim | 24 ++++++++++++--------
 2 files changed, 16 insertions(+), 12 deletions(-)

diff --git a/compiler/vm/vm.nim b/compiler/vm/vm.nim
index cd22818da90..d9ae7f724b9 100644
--- a/compiler/vm/vm.nim
+++ b/compiler/vm/vm.nim
@@ -67,7 +67,7 @@ import
   ]
 
 # xxx: reports are a code smell meaning data types are misplaced
-from compiler/ast/reports_sem import SemReport
+from compiler/ast/reports_vm import VMReport
 from compiler/ast/report_enums import ReportKind
 
 # xxx: `Report` is faaaar too wide a type for what the VM needs, even with all
@@ -2560,7 +2560,7 @@ proc rawExecute(c: var TCtx, t: var VmThread, pc: var int): YieldReason =
             assert ast.kind == nkStmtList
             Res.ok:  ast[0]
           else:
-            Res.err: SemReport(kind: rvmOpcParseExpectedExpression).wrap()
+            Res.err: VMReport(kind: rvmOpcParseExpectedExpression).wrap()
 
       if parsed.isOk:
         # success! Write the parsed AST to the result register and return an
diff --git a/tests/lang_callable/macros/ttryparseexpr.nim b/tests/lang_callable/macros/ttryparseexpr.nim
index 3c7654c81bc..923c34cdd07 100644
--- a/tests/lang_callable/macros/ttryparseexpr.nim
+++ b/tests/lang_callable/macros/ttryparseexpr.nim
@@ -1,10 +1,9 @@
 discard """
-  target: "!vm"
-  outputsub: '''Error: expression expected, but found '[EOF]' 45'''
+  description: "Ensure that `parseExpr` raises a catchable exception on error"
+  action: compile
+  targets: native
 """
 
-# disabled for VM until we support `getCurrentExceptionMsg` (knownIssue)
-
 # feature request #1473
 import std/macros
 
@@ -14,10 +13,15 @@ macro test(text: string): untyped =
   except ValueError:
     result = newLit getCurrentExceptionMsg()
 
-const
-  valid = 45
-  a = test("foo&&")
-  b = test("valid")
-  c = test("\"") # bug #2504
+const valid = 45
+
+static:
+  doAssert test("foo&&") == "Error: expression expected, but found '[EOF]'"
+  doAssert test("valid") == 45
+  doAssert test("\"")    == "Error: closing \" expected" # bug #2504
 
-echo a, " ", b
+  const error = "Error: expected expression, but got multiple statements"
+  # test with empty string
+  doAssert test("") == error
+  # test with multiple declarative statements
+  doAssert test("type A = int\ntype A = int") == error

From ab50b745bbd383d1868b0369b13df6c304850596 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sat, 8 Jun 2024 21:22:57 +0200
Subject: [PATCH 114/169] fix: wrong code generation for synthesized object
 hooks (#1338)

## Summary

Fix a bug with synthesis of lifetime-tracking hooks for object types
using inheritance, which showed up as a C compiler error when using
recent versions of clang or gcc.

Fixes https://github.com/nim-works/nimskull/issues/1337.

## Details

When synthesizing the hooks for object types using inheritance, the
destination accessor expression wasn't wrapped in an object conversion
prior to emitting the parent object handling.

Without the conversion, the synthesized hook passed along its own
parameter to the call of the super type's hook as-is. This is wrong
in general (the argument's type doesn't match the parameter's), but
didn't cause concrete issues until gcc and clang started to disallow
implicit conversions between incompatible pointer types.
---
 compiler/sem/liftdestructors.nim              |  7 +++++-
 .../destructor/tsuper_type_destructor_bug.nim | 23 +++++++++++++++++++
 2 files changed, 29 insertions(+), 1 deletion(-)
 create mode 100644 tests/lang_objects/destructor/tsuper_type_destructor_bug.nim

diff --git a/compiler/sem/liftdestructors.nim b/compiler/sem/liftdestructors.nim
index 202f532eb6c..5d7e48031ea 100644
--- a/compiler/sem/liftdestructors.nim
+++ b/compiler/sem/liftdestructors.nim
@@ -196,7 +196,12 @@ proc fillBodyObj(c: var TLiftCtx; n, body, x, y: PNode; enforceDefaultOp: bool)
 
 proc fillBodyObjTImpl(c: var TLiftCtx; t: PType, body, x, y: PNode) =
   if t.len > 0 and t[0] != nil:
-    fillBody(c, skipTypes(t[0], abstractPtrs), body, x, y)
+    # also apply the operation to the super type. An up-conversion is required
+    # for proper typing
+    let
+      base = skipTypes(t[0], abstractPtrs)
+      obj = newTreeIT(nkObjUpConv, x.info, base, x)
+    fillBody(c, base, body, obj, y)
   fillBodyObj(c, t.n, body, x, y, enforceDefaultOp = false)
 
 proc fillBodyObjT(c: var TLiftCtx; t: PType, body, x, y: PNode) =
diff --git a/tests/lang_objects/destructor/tsuper_type_destructor_bug.nim b/tests/lang_objects/destructor/tsuper_type_destructor_bug.nim
new file mode 100644
index 00000000000..dd2851bc0d1
--- /dev/null
+++ b/tests/lang_objects/destructor/tsuper_type_destructor_bug.nim
@@ -0,0 +1,23 @@
+discard """
+  description: '''
+    Regression test for an internal typing issue with synthesized hooks for
+    objects using inheritance
+  '''
+  targets: c js vm
+"""
+
+type
+  Parent = object of RootObj
+    x: int
+  Sub = object of Parent
+
+proc `=destroy`(x: var Parent) =
+  # ensure that the parameter is at least accessible at run-time
+  doAssert x.x == 1
+
+# the destroy hook for `Sub` is synthesized by the compiler
+
+proc test() =
+  var x = Sub(x: 1)
+
+test()

From 9fe5a1d2144bd6e6d4c6f71fbae04d68708c8b79 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sat, 8 Jun 2024 21:24:35 +0200
Subject: [PATCH 115/169] fix: crash when defining call/dot operators (#1341)

## Summary

Fix the compiler crashing when defining dot or call operator overloads
and the respective experimental feature is not enabled.

## Details

The formatting of the "call/dot operator not enabled" error messages
expects a symbol, but none was provided, resulting in an NPE.

For both "call/dot operator not enabled" diagnostics, when turning
them into reports, the symbol is now taken from the diagnostic's
`wrongNode` and passed into the report.
---
 compiler/front/cli_reporter.nim         | 10 ++++++++--
 tests/errmsgs/tenable_call_operator.nim |  8 ++++++++
 tests/errmsgs/tenable_dot_operator.nim  |  8 ++++++++
 3 files changed, 24 insertions(+), 2 deletions(-)
 create mode 100644 tests/errmsgs/tenable_call_operator.nim
 create mode 100644 tests/errmsgs/tenable_dot_operator.nim

diff --git a/compiler/front/cli_reporter.nim b/compiler/front/cli_reporter.nim
index 43d110df1a4..08508dfa28d 100644
--- a/compiler/front/cli_reporter.nim
+++ b/compiler/front/cli_reporter.nim
@@ -3238,8 +3238,6 @@ func astDiagToLegacyReport(conf: ConfigRef, diag: PAstDiag): Report {.inline.} =
       adSemSelectorMustBeOfCertainTypes,
       adSemInvalidPragmaBlock,
       adSemConceptPredicateFailed,
-      adSemDotOperatorsNotEnabled,
-      adSemCallOperatorsNotEnabled,
       adSemUnexpectedPattern,
       adSemIsOperatorTakes2Args,
       adSemNoTupleTypeForConstructor,
@@ -3274,6 +3272,14 @@ func astDiagToLegacyReport(conf: ConfigRef, diag: PAstDiag): Report {.inline.} =
         reportInst: diag.instLoc.toReportLineInfo,
         kind: kind,
         ast: diag.wrongNode)
+  of adSemDotOperatorsNotEnabled,
+     adSemCallOperatorsNotEnabled:
+    semRep = SemReport(
+        location: some diag.location,
+        reportInst: diag.instLoc.toReportLineInfo,
+        kind: kind,
+        ast: diag.wrongNode,
+        sym: diag.wrongNode.sym)
   of adSemInvalidTupleSubscript:
     semRep = SemReport(
         location: some diag.location,
diff --git a/tests/errmsgs/tenable_call_operator.nim b/tests/errmsgs/tenable_call_operator.nim
new file mode 100644
index 00000000000..45658bf0f5f
--- /dev/null
+++ b/tests/errmsgs/tenable_call_operator.nim
@@ -0,0 +1,8 @@
+discard """
+  errormsg: '''
+    the overloaded () operator has to be enabled with {.experimental: "callOperator".}
+  '''
+  line: 8
+"""
+
+proc `()`(a: int) = discard
diff --git a/tests/errmsgs/tenable_dot_operator.nim b/tests/errmsgs/tenable_dot_operator.nim
new file mode 100644
index 00000000000..7050e5c44cc
--- /dev/null
+++ b/tests/errmsgs/tenable_dot_operator.nim
@@ -0,0 +1,8 @@
+discard """
+  errormsg: '''
+    the overloaded . operator has to be enabled with {.experimental: "dotOperators".}
+  '''
+  line: 8
+"""
+
+proc `.`(a: int) = discard

From b08c8f5ddc1ea777ab4dd8d408f5fd3e1fa7776d Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sat, 8 Jun 2024 21:35:25 +0200
Subject: [PATCH 116/169] sem: keep shape of array constructors in typed AST
 (#1340)

## Summary

Explicit indices in array constructors now stay in the AST after
typing. Since macros are able to observe this, this change is a
**breaking change**.

## Details

Keeping the explicit indices is also necessary for being able to
retype the AST after it was typed once (without the index, array
constructors for arrays not starting at zero would have a
different type afterwards).

Instead of dropping the explicit index together with the parent
`nkExprColonExpr` node, both are kept by `semArrayConstr`, and then
later discarded by `semfold` (during constant evaluation) and `transf`,
where they are no longer needed.
---
 compiler/sem/semexprs.nim                     | 45 +++++++++----------
 compiler/sem/semfold.nim                      |  4 +-
 compiler/sem/transf.nim                       |  5 +++
 tests/lang_exprs/ttyped_array_constr_expr.nim | 21 +++++++++
 4 files changed, 48 insertions(+), 27 deletions(-)
 create mode 100644 tests/lang_exprs/ttyped_array_constr_expr.nim

diff --git a/compiler/sem/semexprs.nim b/compiler/sem/semexprs.nim
index 7a5ab7a6dc7..455fdeb0b6f 100644
--- a/compiler/sem/semexprs.nim
+++ b/compiler/sem/semexprs.nim
@@ -772,32 +772,19 @@ proc semArrayConstr(c: PContext, n: PNode, flags: TExprFlags): PNode =
     result.sons.setLen(n.len)
     for i, it in n.pairs:
       # first, analyse the index expression (if one exist)
-      let (idx, val) =
+      var (idx, val) =
         if i == 0: (first, firstIndex)
         else:      semArrayElementIndex(c, it, indexType)
 
-      # figure out the node that holds the element expression, and validate
-      # the index if one is provided
-      var e =
-        case idx.kind
-        of nkError:
-          let r = shallowCopy(it)
-          r[0] = idx
-          r[1] = it[1]
-          c.config.wrapError(r)
-        of nkEmpty:
-          it
-        else:
-          if val == lastIndex + 1:
-            it[1]
-          else:
-            # the specified index value doesn't match with the expected one
-            c.config.newError(it,
-                          PAstDiag(kind: adSemInvalidOrderInArrayConstructor))
+      if idx.kind notin {nkError, nkEmpty} and val != lastIndex + 1:
+        # the specified index value doesn't match with the expected one
+        idx = c.config.newError(idx,
+          PAstDiag(kind: adSemInvalidOrderInArrayConstructor))
 
-      if e.kind != nkError:
-        e = semExprWithType(c, e, {})
-        e = exprNotGenericRoutine(c, e)
+      # always analyze the expression, even when the index expression is
+      # erroneous
+      var e = semExprWithType(c, it.skipColon, {})
+      e = exprNotGenericRoutine(c, e)
 
       if typ.isNil:
         # must be the first item; initialize the common type:
@@ -816,7 +803,11 @@ proc semArrayConstr(c: PContext, n: PNode, flags: TExprFlags): PNode =
         # yet
         typ = commonType(c, typ, e.typ)
 
-      result[i] = e
+      if it.kind == nkExprColonExpr:
+        result[i] = newTreeI(nkExprColonExpr, it.info, [idx, e])
+      else:
+        result[i] = e
+
       inc lastIndex
 
     # watch out for ``sink T``!
@@ -831,8 +822,12 @@ proc semArrayConstr(c: PContext, n: PNode, flags: TExprFlags): PNode =
     var hasError = false
     # fit all elements to be of the derived common type
     for it in result.sons.mitems:
-      it = fitNode(c, typ, it, it.info)
-      hasError = hasError or it.kind == nkError
+      if it.kind == nkExprColonExpr:
+        it[1] = fitNode(c, typ, it[1], it[1].info)
+        hasError = hasError or nkError in {it[0].kind, it[1].kind}
+      else:
+        it = fitNode(c, typ, it, it.info)
+        hasError = hasError or it.kind == nkError
 
     if hasError:
       result = c.config.wrapError(result)
diff --git a/compiler/sem/semfold.nim b/compiler/sem/semfold.nim
index 7a1125f3da2..e211a3a4db4 100644
--- a/compiler/sem/semfold.nim
+++ b/compiler/sem/semfold.nim
@@ -759,7 +759,7 @@ proc getConstExpr(m: PSym, n: PNode; idgen: IdGenerator; g: ModuleGraph): PNode
   of nkBracket, nkCurly:
     result = copyNode(n)
     for i, son in n.pairs:
-      let a = getConstExpr(m, son, idgen, g)
+      let a = getConstExpr(m, son.skipColon, idgen, g)
       if a == nil: return nil
       result.add a
     incl(result.flags, nfAllConst)
@@ -881,7 +881,7 @@ proc foldConstExprAux(m: PSym, n: PNode, idgen: IdGenerator, g: ModuleGraph): Fo
     # the last node is an expression
     result.add foldConstExprAux(m, n[^1], idgen, g)
   of nkExprColonExpr:
-    # comes here from tuple/object constructions
+    # comes here from array/tuple/object constructions
     result.add n[0]
     result.add foldConstExprAux(m, n[1], idgen, g)
     return
diff --git a/compiler/sem/transf.nim b/compiler/sem/transf.nim
index 3ad578457d7..ac52b2d65bd 100644
--- a/compiler/sem/transf.nim
+++ b/compiler/sem/transf.nim
@@ -1364,6 +1364,11 @@ proc transform(c: PTransf, n: PNode): PNode =
   of nkPragmaExpr:
     # not needed in transformed AST -> drop it
     result = transform(c, n.lastSon)
+  of nkBracket:
+    # replace elements where the index is specified with just the expression
+    result = shallowCopy(n)
+    for i, it in n.pairs:
+      result[i] = transform(c, it.skipColon)
   else:
     result = transformSons(c, n)
   when false:
diff --git a/tests/lang_exprs/ttyped_array_constr_expr.nim b/tests/lang_exprs/ttyped_array_constr_expr.nim
new file mode 100644
index 00000000000..36753bdcbaf
--- /dev/null
+++ b/tests/lang_exprs/ttyped_array_constr_expr.nim
@@ -0,0 +1,21 @@
+discard """
+  description: '''
+    Ensure that the shape of literal array construction expressions is
+    preserved in typed AST
+  '''
+  action: compile
+"""
+
+import std/macros
+
+macro m(x: typed) =
+  doAssert treeRepr(x) == """Bracket
+  ExprColonExpr
+    IntLit 1
+    StrLit "a"
+  StrLit "b"
+  ExprColonExpr
+    IntLit 3
+    StrLit "c""""
+
+m([1: "a", "b", 3: "c"])

From dfa826b0213004f74673675d2b9b395b54385d19 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sat, 8 Jun 2024 21:44:15 +0200
Subject: [PATCH 117/169] vm: don't use ref-counted cells for globals (#1342)

## Summary

Store a handle to a normal memory cell in the `globals` table, instead
of a handle to a ref-counted cell.

## Details

VM globals are normal locations that exist as long as the VM
environment does; they don't need to be reference-counted, which they
also never were.

Storing a handle to the memory cell in the global table directly
removes an unnecessary indirection through `HeapSlotHandle`, and thus
speeds up loading a global a tiny bit.
---
 compiler/vm/compilerbridge.nim | 12 ++++--------
 compiler/vm/vm.nim             |  3 +--
 compiler/vm/vmdef.nim          |  2 +-
 compiler/vm/vmjit.nim          |  2 +-
 compiler/vm/vmrunner.nim       |  2 +-
 5 files changed, 8 insertions(+), 13 deletions(-)

diff --git a/compiler/vm/compilerbridge.nim b/compiler/vm/compilerbridge.nim
index a6e50f661e5..5bc74240bbe 100644
--- a/compiler/vm/compilerbridge.nim
+++ b/compiler/vm/compilerbridge.nim
@@ -684,21 +684,17 @@ proc getGlobalValue*(c: EvalContext, s: PSym): PNode =
   ## Does not perform type checking, so ensure that `s.typ` matches the
   ## global's type
   internalAssert(c.vm.config, s.kind in {skLet, skVar} and sfGlobal in s.flags)
-  let
-    slotIdx = c.vm.globals[c.jit.getGlobal(s)]
-    slot = c.vm.heap.slots[slotIdx]
-
-  result = c.vm.deserialize(slot.handle, s.typ, s.info)
+  let slot = c.vm.globals[c.jit.getGlobal(s)]
+  result = c.vm.deserialize(slot, s.typ, s.info)
 
 proc setGlobalValue*(c: var EvalContext; s: PSym, val: PNode) =
   ## Does not do type checking so ensure the `val` matches the `s.typ`
   internalAssert(c.vm.config, s.kind in {skLet, skVar} and sfGlobal in s.flags)
   let
-    slotIdx = c.vm.globals[c.jit.getGlobal(s)]
-    slot = c.vm.heap.slots[slotIdx]
+    slot = c.vm.globals[c.jit.getGlobal(s)]
     data = constDataToMir(c.vm, c.jit, val)
 
-  initFromExpr(slot.handle, data, c.jit.env, c.vm)
+  initFromExpr(slot, data, c.jit.env, c.vm)
 
 ## what follows is an implementation of the ``passes`` interface that evaluates
 ## the code directly inside the VM. It is used for NimScript execution and by
diff --git a/compiler/vm/vm.nim b/compiler/vm/vm.nim
index d9ae7f724b9..83bc8ee93a9 100644
--- a/compiler/vm/vm.nim
+++ b/compiler/vm/vm.nim
@@ -2235,9 +2235,8 @@ proc rawExecute(c: var TCtx, t: var VmThread, pc: var int): YieldReason =
 
     of opcLdGlobal:
       let rb = instr.regBx - wordExcess
-      let slot = c.globals[rb]
       ensureKind(rkHandle)
-      regs[ra].setHandle(c.heap.slots[slot].handle)
+      regs[ra].setHandle(c.globals[rb])
 
     of opcLdCmplxConst:
       decodeBx(rkHandle)
diff --git a/compiler/vm/vmdef.nim b/compiler/vm/vmdef.nim
index 7eb9b9935c9..a58de2cd708 100644
--- a/compiler/vm/vmdef.nim
+++ b/compiler/vm/vmdef.nim
@@ -696,7 +696,7 @@ type
       ## instruction raising
     ehCode*: seq[EhInstr]
       ## stores the instructions for the exception handling (EH) mechanism
-    globals*: seq[HeapSlotHandle] ## Stores each global's corresponding heap slot
+    globals*: seq[LocHandle] ## global slots
     constants*: seq[VmConstant] ## constant data
     complexConsts*: seq[LocHandle] ## complex constants (i.e. everything that
                                    ## is not a int/float/string literal)
diff --git a/compiler/vm/vmjit.nim b/compiler/vm/vmjit.nim
index 506c9156c6d..315c8001659 100644
--- a/compiler/vm/vmjit.nim
+++ b/compiler/vm/vmjit.nim
@@ -126,7 +126,7 @@ proc updateEnvironment(c: var TCtx, env: var MirEnv, cp: EnvCheckpoint) =
   # globals (which includes threadvars)
   for id, sym in since(env.globals, cp.globals):
     let typ = c.getOrCreate(sym.typ)
-    c.globals.add c.heap.heapNew(c.allocator, typ)
+    c.globals.add c.allocator.allocSingleLocation(typ)
 
   # constants
   for id, data in since(env.data, cp.data):
diff --git a/compiler/vm/vmrunner.nim b/compiler/vm/vmrunner.nim
index 2d097ec5f4c..2485516113e 100644
--- a/compiler/vm/vmrunner.nim
+++ b/compiler/vm/vmrunner.nim
@@ -163,7 +163,7 @@ proc loadIntoContext(c: var TCtx, p: PackedEnv) =
   c.allocator.byteType = c.typeInfoCache.charType
 
   mapList(c.globals, p.globals, x):
-    c.heap.heapNew(c.allocator, c.types[x])
+    c.allocator.allocSingleLocation(c.types[x])
 
   mapList(c.complexConsts, p.cconsts, x):
     let

From 96cefc4fd6d78ff5fd26555db3bf30d8257f8d5e Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sun, 9 Jun 2024 07:32:22 +0200
Subject: [PATCH 118/169] compiler: add the `--showir` switch (#1343)

## Summary

* replace the debug defines for enabling IR printing with the proper
  `--showir` switch
* the switch has two forms: `--showir:<ir>` (enable globally) and
  `--showir:<ir>:<name>` (enable for procedures with given name)
* the supported IR names are: `transf`, `mir_in`, `mir_out`, `cgir`,
  and `vm`
* the old debug defines are removed (they now do nothing)

Using a proper compiler switch brings some usability improvements
(validation, style-insensitive names), and will make extending the
functionality in the future a bit easier.

## Details

* the enabled names are stored in `ConfigRef` using a `StringTableRef`,
  to allow for style-insensitive name lookup
* a `StringTableRef` only supports string-to-string mappings so
  only the showing of one IR per name is supported at the moment
* the `mir_out` option is new: it shows the MIR as it looks right
  before `cgirgen`
* `mir_in` (corresponding to the previous `nimShowMir` define), now
  shows pretty-printed MIR, instead of the tree representation
* the `debug.rst` documentation mentioning the obsolete defines is
  updated

### Misc

* a bug with the MIR pretty-printer, where rendering locals with no
  name crashed the compiler, is fixed
---
 compiler/backend/backends.nim       |  5 +--
 compiler/front/options.nim          | 22 +++++++++++++
 compiler/front/optionsprocessor.nim | 23 ++++++++++++++
 compiler/mir/mirbridge.nim          | 33 ++++++++++----------
 compiler/mir/utils.nim              |  2 +-
 compiler/vm/compilerbridge.nim      | 13 +++-----
 compiler/vm/vmjit.nim               |  3 +-
 doc/debug.rst                       | 48 ++++++++++++++---------------
 8 files changed, 95 insertions(+), 54 deletions(-)

diff --git a/compiler/backend/backends.nim b/compiler/backend/backends.nim
index 02e9b9dfbb9..f5b4386b68e 100644
--- a/compiler/backend/backends.nim
+++ b/compiler/backend/backends.nim
@@ -390,7 +390,7 @@ proc translate*(id: ProcedureId, body: PNode, graph: ModuleGraph,
 
   echoInput(graph.config, prc, body)
   result = generateCode(graph, env, prc, config.tconfig, body)
-  echoMir(graph.config, prc, result)
+  echoMir(graph.config, prc, result, env)
 
   # now apply the passes:
   process(result, prc, graph, idgen, env)
@@ -399,6 +399,7 @@ proc generateIR*(graph: ModuleGraph, idgen: IdGenerator, env: var MirEnv,
                  owner: PSym, body: sink MirBody): Body =
   ## Translates the MIR code provided by `code` into ``CgNode`` IR and,
   ## if enabled, echoes the result.
+  echoOutput(graph.config, owner, body, env)
   result = cgirgen.generateIR(graph, idgen, env, owner, body)
   echoOutput(graph.config, owner, result)
 
@@ -580,7 +581,7 @@ proc produceLoader(graph: ModuleGraph, m: Module, data: var DiscoveryData,
 
   echoInput(graph.config, sym, body)
   result = generateCode(graph, env, owner, conf.tconfig, body)
-  echoMir(graph.config, sym, result)
+  echoMir(graph.config, sym, result, env)
 
 # ----- discovery and queueing logic -----
 
diff --git a/compiler/front/options.nim b/compiler/front/options.nim
index 9b7629d0c44..c90c6046a3d 100644
--- a/compiler/front/options.nim
+++ b/compiler/front/options.nim
@@ -187,6 +187,15 @@ type
              ## argument
     pimFile  ## the main module is a file
 
+  IrName* = enum
+    ## Names of the IRs that can be rendered to the standard output for
+    ## debugging purposes.
+    irTransf = "transf"
+    irMirIn  = "mir_in"
+    irMirOut = "mir_out"
+    irCgir   = "cgir"
+    irVm     = "vm"
+
   ReportHook* = proc(conf: ConfigRef, report: Report): TErrorHandling {.closure.}
 
   HackController* = object
@@ -309,6 +318,13 @@ type
       debugUtilsStack*: seq[string] ## which proc name to stop trace output
       ## len is also used for output indent level
 
+    toDebugProc*: StringTableRef
+      ## maps identifiers to the name of the IR to print to the standard
+      ## output
+    toDebugIr*: set[IrName]
+      ## the IRs which should always be printed to the standard
+      ## output
+
     when defined(nimDebugUnreportedErrors):
       unreportedErrors*: OrderedTable[NodeId, PNode]
 
@@ -903,6 +919,7 @@ proc initConfigRefCommon(conf: ConfigRef) =
   conf.notes = NotesVerbosity.main[conf.verbosity]
   conf.hack = defaultHackController
   conf.mainPackageNotes = NotesVerbosity.main[conf.verbosity]
+  conf.toDebugProc = newStringTable(modeStyleInsensitive)
   when defined(nimDebugUtils):
     # ensures that `nimDebugUtils` is defined for the compiled code so it can
     # access the `system.nimCompilerDebugRegion` template
@@ -1589,3 +1606,8 @@ func inDebug*(conf: ConfigRef): bool {.
   noSideEffect.} =
   ## Check whether 'nim compiler debug' is defined right now.
   return conf.isDefined("nimCompilerDebug")
+
+template isDebugEnabled*(c: ConfigRef, ir: IrName, name: string): bool =
+  ## Whether printing the `ir` IR is enabled specifically for the given `name`.
+  # a template is used so that `$ir` can be folded when `ir` is constant
+  c.toDebugProc.getOrDefault(name) == $ir
diff --git a/compiler/front/optionsprocessor.nim b/compiler/front/optionsprocessor.nim
index fb164293e08..4f869c40843 100644
--- a/compiler/front/optionsprocessor.nim
+++ b/compiler/front/optionsprocessor.nim
@@ -170,6 +170,7 @@ type
     cmdSwitchDeepcopy
     cmdSwitchProjStdin
     cmdSwitchCmdexitgcstats
+    cmdSwitchShowIr
     cmdSwitchConfigVar
 
   # Full list of all the command line options.
@@ -298,6 +299,7 @@ type
     fullSwitchTxtSourcemap           = "sourcemap"
     fullSwitchTxtDeepcopy            = "deepcopy"
     fullSwitchTxtCmdexitgcstats      = "cmdexitgcstats"
+    fullSwitchShowIr                 = "showir"
     smolSwitchTxtProjStdin           = ""               # `nim c -r -`, the `-` gets stripped
     fullSwitchTxtConfigVar           = "*.*"            # cfg var dummy entry
     fullSwitchTxtInvalid             = "!ERROR!"
@@ -426,6 +428,7 @@ const
       cmdSwitchDeepcopy           : {fullSwitchTxtDeepcopy},
       cmdSwitchProjStdin          : {smolSwitchTxtProjStdin},
       cmdSwitchCmdexitgcstats     : {fullSwitchTxtCmdexitgcstats},
+      cmdSwitchShowIr             : {fullSwitchShowIr},
       cmdSwitchConfigVar          : {fullSwitchTxtConfigVar},
     ]
 
@@ -616,6 +619,7 @@ func allowedCompileOptionsArgs*(switch: CmdSwitchKind): seq[string] =
   of cmdSwitchExperimental: experimentalFeatures.toSeq.mapIt($it)
   of cmdSwitchExceptions  : @["native", "goto"]
   of cmdSwitchStylecheck  : @["off", "hint", "error"]
+  of cmdSwitchShowIr      : IrName.toSeq.mapIt($it)
   else: unreachable("this is a compiler bug")
 
 func allowedCompileOptionArgs*(switch: string): seq[string] =
@@ -1627,6 +1631,25 @@ proc processSwitch*(switch, arg: string, pass: TCmdLinePass,
     setSwitchAndSrc cmdSwitchCmdexitgcstats
     # Print GC statistics for the compiler run
     conf.incl optCmdExitGcStats
+  of "showir":
+    setSwitchAndSrc cmdSwitchShowIr
+    expectArg(switch, arg)
+    # can either be ``--showir:a:b`` or just ``--showir:a``
+    let (irName, name) =
+      if (let p = find(arg, ':'); p != -1):
+        (arg.substr(0, p-1), arg.substr(p+1))
+      else:
+        (arg, "")
+
+    let ir =
+      try:    parseEnum[IrName](irName)
+      except: invalidArgValue(irName, switch)
+
+    if name.len == 0:
+      conf.toDebugIr.incl ir # enabled globally
+    else:
+      # IR debugging is enabled only for the specific procedure
+      conf.toDebugProc[name] = $ir # use the canonical name
   else:
     if strutils.find(switch, '.') >= 0:
       setSwitchAndSrc cmdSwitchConfigVar
diff --git a/compiler/mir/mirbridge.nim b/compiler/mir/mirbridge.nim
index c83a5ef4f33..f08c0fb608c 100644
--- a/compiler/mir/mirbridge.nim
+++ b/compiler/mir/mirbridge.nim
@@ -30,12 +30,6 @@ import
 
 export GenOption
 
-proc getStrDefine(config: ConfigRef, name: string): string =
-  if config.isDefined(name):
-    result = config.getDefined(name)
-  else:
-    result = ""
-
 template writeBody(config: ConfigRef, header: string, body: untyped) =
   # NOTE: if the debug traces should be kept, they should be properly
   #       integrated into the tracing pipeline
@@ -50,29 +44,36 @@ let reprConfig = block:
   rc.flags.incl trfShowSymKind
   rc
 
-# NOTE: the ``echoX`` are used as a temporary solution for inspecting inputs
-# and outputs in the context of compiler debugging until a more
-# structured/integrated solution is implemented
+template isEnabled(config: ConfigRef, ir: IrName, name: string): bool =
+  # debugging the IR must be enabled globally or locally
+  ir in config.toDebugIr or config.isDebugEnabled(ir, name)
 
 proc echoInput*(config: ConfigRef, owner: PSym, body: PNode) =
   ## If requested via the define, renders the input AST `body` and writes the
   ## result out through ``config.writeLine``.
-  if config.getStrDefine("nimShowMirInput") == owner.name.s:
+  if config.isEnabled(irTransf, owner.name.s):
     writeBody(config, "-- input AST: " & owner.name.s):
       config.writeln(treeRepr(config, body, reprConfig))
 
-proc echoMir*(config: ConfigRef, owner: PSym, body: MirBody) =
+proc echoMir*(config: ConfigRef, owner: PSym, body: MirBody, env: MirEnv) =
   ## If requested via the define, renders the `body` and writes the result out
   ## through ``config.writeln``.
-  if config.getStrDefine("nimShowMir") == owner.name.s:
+  if config.isEnabled(irMirIn, owner.name.s):
     writeBody(config, "-- MIR: " & owner.name.s):
-      config.writeln(treeRepr(body.code))
+      config.writeln(render(body.code, addr env, addr body))
+
+proc echoOutput*(config: ConfigRef, owner: PSym, body: MirBody, env: MirEnv) =
+  ## If enabled, renders the output IR `body` and outputs the result to
+  ## ``config.writeLine``.
+  if config.isEnabled(irMirOut, owner.name.s):
+    writeBody(config, "-- MIR: " & owner.name.s):
+      config.writeln(render(body.code, addr env, addr body))
 
 proc echoOutput*(config: ConfigRef, owner: PSym, body: Body) =
   ## If requested via the define, renders the output IR `body` and writes the
   ## result out through ``config.writeLine``.
-  if config.getStrDefine("nimShowMirOutput") == owner.name.s:
-    writeBody(config, "-- output AST: " & owner.name.s):
+  if config.isEnabled(irCgir, owner.name.s):
+    writeBody(config, "-- CGIR: " & owner.name.s):
       config.writeln(treeRepr(body.code))
 
 proc canonicalize*(graph: ModuleGraph, idgen: IdGenerator, env: var MirEnv,
@@ -82,7 +83,7 @@ proc canonicalize*(graph: ModuleGraph, idgen: IdGenerator, env: var MirEnv,
   echoInput(graph.config, owner, body)
   # step 1: generate a ``MirTree`` from the input AST
   let body = generateCode(graph, env, owner, config, body)
-  echoMir(graph.config, owner, body)
+  echoMir(graph.config, owner, body, env)
 
   # step 2: generate the ``CgNode`` tree
   result = cgirgen.generateIR(graph, idgen, env, owner, body)
diff --git a/compiler/mir/utils.nim b/compiler/mir/utils.nim
index 214ec768d17..9b2d695c729 100644
--- a/compiler/mir/utils.nim
+++ b/compiler/mir/utils.nim
@@ -169,7 +169,7 @@ proc typeToStr(result: var string, t: TypeId, env: ptr MirEnv) =
 
 func addLocalName(result: var string, id: LocalId, open: string,
                   c: RenderCtx) =
-  if c.body.isNil:
+  if c.body.isNil or c.body[][id].name.isNil:
     # render just the ID
     idToStr(result, id, open)
   else:
diff --git a/compiler/vm/compilerbridge.nim b/compiler/vm/compilerbridge.nim
index 5bc74240bbe..31a4e26e798 100644
--- a/compiler/vm/compilerbridge.nim
+++ b/compiler/vm/compilerbridge.nim
@@ -119,15 +119,10 @@ func `$`(e: ExecErrorReport): string {.error.}
 proc logBytecode(c: TCtx, owner: PSym, start: int) =
   ## If enabled, renders the bytecode ranging from `start` to the current end
   ## into text that is then written to the standard output.
-  const Symbol = "expandVmListing"
-  if owner != nil and c.config.isDefined(Symbol):
-    let name = c.config.getDefined(Symbol)
-    # if no value is specified for the conditional sym (i.e.,
-    # ``--define:expandVmListing``), `name` is 'true', which we interpret
-    # as "log everything"
-    if name == "true" or name == owner.name.s:
-      let listing = codeListing(c, start)
-      c.config.msgWrite: renderCodeListing(c.config, owner, listing)
+  if irVm in c.config.toDebugIr or
+     (owner != nil and c.config.isDebugEnabled(irVm, owner.name.s)):
+    let listing = codeListing(c, start)
+    c.config.msgWrite: renderCodeListing(c.config, owner, listing)
 
 proc putIntoReg(dest: var TFullReg; jit: var JitState, c: var TCtx, n: PNode,
                 formal: PType) =
diff --git a/compiler/vm/vmjit.nim b/compiler/vm/vmjit.nim
index 315c8001659..7aa164e9f0b 100644
--- a/compiler/vm/vmjit.nim
+++ b/compiler/vm/vmjit.nim
@@ -260,11 +260,12 @@ proc genProc(jit: var JitState, c: var TCtx, s: PSym): VmGenResult =
 
   echoInput(c.config, s, body)
   var mirBody = generateCode(c.graph, jit.gen.env, s, selectOptions(c), body)
-  echoMir(c.config, s, mirBody)
+  echoMir(c.config, s, mirBody, jit.gen.env)
   applyPasses(c, jit.gen.env, s, mirBody)
   for _ in discover(jit.gen.env, cp):
     discard "nothing to register"
 
+  echoOutput(c.config, s, mirBody, jit.gen.env)
   let outBody = generateIR(c.graph, c.idgen, jit.gen.env, s, mirBody)
   echoOutput(c.config, s, outBody)
 
diff --git a/doc/debug.rst b/doc/debug.rst
index dbfde7cbf58..a5ebbe2a324 100644
--- a/doc/debug.rst
+++ b/doc/debug.rst
@@ -423,35 +423,33 @@ MIR Input and Output
 ====================
 
 For debugging issues related to the MIR but also code-generator issues in
-general, one can print the input and output to the MIR canonicalization step
-plus the corresponding `PNode`-AST output.
-
-To print the `PNode`-AST that reaches `mirgen`, `--define:nimShowMirInput=name`
-is used. This will print out the `PNode`-AST of all procedures and modules of
-which the name is equal to the specified `name` in the console. Because of how
-dead-code-elimination works, only the AST of alive procedures (i.e. used ones)
-is printed. If a procedure is used at both compile- and run-time, it will be
-printed twice.
-
-To print the generated MIR code for a procedure, `--define:nimShowMir=name`
-can be used. The same limitation as for `nimShowMirInput` apply.
-
-`--define:nimShowMirOutput=name` prints the `CgNode`-IR that is output by
-`cgirgen`. This is IR that the code generators operate on.
-
-While all of the defines listed above can be used simultaneously, only a single
-occurrence of each is considered. Each further occurrence will override the
-respective name.
+general, one can print the various IRs used during the mid-/back-end phase.
+
+This is done by using one of the following options with the
+`--showir`:option: switch:
+* `transf`:option: : shows the post `transf` AST that gets translated to the
+  MIR
+* `mir_in`:option: : shows the MIR produced by `mirgen`, without any passes
+  applied
+* `mir_out`:option: : shows the MIR after all passes were applied, right before
+  translation to the CGIR
+* `cgir`:option: : shows the CGIR as produced by `cgirgen`
+
+If a procedure is used at both compile- and run-time, it will show up in the
+output twice, though potentially with different bodies, as different passes are
+applied. Only procedures actually used in alive code are processed during the
+MIR and back-end phase; if a procedure is not alive, the IR for it cannot be
+shown with `--showir`:option: .
 
 VM Codegen and Execution
 ========================
 
 For echoing the VM bytecode generated for compile-time procedures and macros,
-`--define:expandVmListing=vmTarget`:option: can be passed to the compiler (no
-special build of the compiler is required). The bytecode for all routines of
-which the name is `vmTarget` is then echoed to the standard output. Leaving
-`vmTarget` empty enables echoing for *all* VM bytecode that is generated as
-part of compile-time execution.
+`--showir:vm:vmTarget`:option: can be passed to the compiler (no special build
+of the compiler is required). The bytecode for all routines of which the name
+is `vmTarget` is then echoed to the standard output. Leaving `vmTarget` empty
+enables echoing for *all* VM bytecode that is generated as part of compile-time
+execution.
 
 For example (generated listing might not match exactly)
 
@@ -471,7 +469,7 @@ For example (generated listing might not match exactly)
 
 .. code-block:: cmd
 
-  nim c --filenames:canonical --define:expandVmListing=vmTarget file.nim
+  nim c --filenames:canonical --showir:vm:vmTarget file.nim
 
 
 .. code-block:: literal

From 33c8184b745fce6a3c192ed72e45b05ce4d8d5ca Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Tue, 11 Jun 2024 01:50:41 +0200
Subject: [PATCH 119/169] mir: remove the tree delimiter nodes (#1334)

## Summary

Instead of marking the end of a subtree with a dedicated node, the
number of child nodes in a subtree is now stored in the subtree's root
node. The idea is to:
* reduce the memory footprint of MIR trees
* make the storage format more streamlined
* simplify some traversal

## Details

The idea of using dedicated end nodes originated at a time where:
* fast back-/up-wards MIR traversal was required
* statements could be nested

Neither is the case anymore, and replacing the delimiter `mnkEnd` nodes
with storing the length has some benefits:
* significantly fewer nodes per `MirTree` (reduced memory usage, faster
  scanning, faster copying, etc.)
* `O(1)` length lookup
* lower cost of changing a subtree root node, or replacing it with its
  single child node
* simpler recursive traversal, as the end nodes don't have to be
  ignored/considered anymore

The downsides of removing the delimiter nodes are that:
* slightly higher tree construction cost: the number of child nodes
  needs to be kept track of
* walking "upwards" (i.e., towards the root) in the tree has a higher
  cost

Ultimately, the upsides outweigh the downsides, especially since
walking the tree upwards is seldom done.

### Adjustments

For memory efficiency, some subtree root nodes (like `mnkPathPos`)
stored extra information in the root node. Since all subtree root nodes
now need to store the length, this is no longer possible, and the
information has to be moved into separate nodes:
* for call trees, whether the call has side-effects is stored as an
  immediate value (using the new `mnkImmediate` node) in the tree's
  first slot
* for field/positional access, the field/position is stored in the
  tree's second slot

For easier processing of `mnkObjConstr`/`mnkRefConstr` trees, the
`mnkBinding` node kind is introduced, which groups the `mnkField` and
associated expression together in a subtree.

The rest of the changes are about:
* updating the `MirBuilder` routines to track the child node count and
  patch the root nodes
* updating the construction of MIR trees in various places
* updating the various tree traversal logic that expected the old
  layout

---------

Co-authored-by: Saem Ghani <saemghani+github@gmail.com>
---
 compiler/backend/backends.nim      |   2 +-
 compiler/backend/cgirgen.nim       |  68 +++-----
 compiler/backend/compat.nim        |   8 +-
 compiler/mir/datatables.nim        |   4 +-
 compiler/mir/injecthooks.nim       |   5 +-
 compiler/mir/mirconstr.nim         |  78 +++++++--
 compiler/mir/mirgen.nim            |  86 +++++-----
 compiler/mir/mirpasses.nim         |  18 ++-
 compiler/mir/mirtrees.nim          | 251 +++++++++++++----------------
 compiler/mir/rtchecks.nim          |   8 +-
 compiler/mir/treechangesets.nim    |   9 +-
 compiler/mir/utils.nim             | 141 ++++++----------
 compiler/sem/aliasanalysis.nim     |   6 +-
 compiler/sem/injectdestructors.nim |  14 +-
 compiler/sem/mirexec.nim           |  51 +++---
 compiler/vm/packed_env.nim         |   1 +
 compiler/vm/vmserialize.nim        |   4 +-
 doc/mir.rst                        |  45 +++---
 tests/compiler/tdatatables.nim     |  50 +++---
 tests/compiler/tmir_trees.nim      |   2 +-
 tests/compiler/ttreechangesets.nim |   8 +-
 21 files changed, 406 insertions(+), 453 deletions(-)

diff --git a/compiler/backend/backends.nim b/compiler/backend/backends.nim
index f5b4386b68e..157300f4aa1 100644
--- a/compiler/backend/backends.nim
+++ b/compiler/backend/backends.nim
@@ -283,7 +283,7 @@ func isEmpty*(tree: MirTree): bool =
   ## Returns whether `tree` contains either no nodes or only nodes that have
   ## no meaning by themselves.
   for n in tree.items:
-    if n.kind notin {mnkScope, mnkEndScope, mnkEnd}:
+    if n.kind notin {mnkScope, mnkEndScope}:
       return false
 
   result = true
diff --git a/compiler/backend/cgirgen.nim b/compiler/backend/cgirgen.nim
index ecf2aec78c0..5d36237e7a6 100644
--- a/compiler/backend/cgirgen.nim
+++ b/compiler/backend/cgirgen.nim
@@ -95,10 +95,6 @@ func enter(t: MirBody, cr: var TreeCursor): lent MirNode {.inline.} =
   assert t.code[cr.pos].kind in SubTreeNodes, "not a sub-tree"
   result = get(t, cr)
 
-func leave(t: MirBody, cr: var TreeCursor) =
-  assert t.code[cr.pos].kind == mnkEnd, "not at the end of sub-tree"
-  inc cr.pos
-
 template info(cr: TreeCursor): TLineInfo =
   cr.origin.info
 
@@ -293,21 +289,24 @@ proc lvalueToIr(tree: MirBody, cl: var TranslateCl, n: MirNode,
   of mnkPathNamed:
     let obj = recurse()
     result = newExpr(cnkFieldAccess, info, typ,
-                     [obj, newFieldNode(lookupInType(obj.typ, n.field.int))])
+                     [obj, newFieldNode(lookupInType(obj.typ,
+                                                     tree.get(cr).field))])
   of mnkPathVariant:
     if preferField:
       let
         obj = recurse()
-        field = lookupInType(obj.typ, n.field.int)
+        field = lookupInType(obj.typ, tree.get(cr).field)
       result = newExpr(cnkFieldAccess, info, field.typ,
                       [obj, newFieldNode(field)])
     else:
       # variant access itself has no ``CgNode`` counterpart at the moment
       result = recurse()
+      tree.skip(cr) # ignore the field
   of mnkPathPos:
     result = newExpr(cnkTupleAccess, info, typ,
                      [recurse(),
-                      CgNode(kind: cnkIntLit, intVal: n.position.BiggestInt)])
+                      CgNode(kind: cnkIntLit,
+                             intVal: tree.get(cr).imm.BiggestInt)])
   of mnkPathArray:
     # special case in order to support string literal access
     # XXX: this needs to be removed once there is a dedicated run-time-
@@ -330,8 +329,6 @@ proc lvalueToIr(tree: MirBody, cl: var TranslateCl, n: MirNode,
   of AllNodeKinds - LvalueExprKinds - {mnkProcVal}:
     unreachable(n.kind)
 
-  leave(tree, cr)
-
 proc lvalueToIr(tree: MirBody, cl: var TranslateCl,
                 cr: var TreeCursor; preferField=true): CgNode {.inline.} =
   lvalueToIr(tree, cl, tree.get(cr), cr, preferField)
@@ -370,9 +367,8 @@ proc targetToIr(tree: MirBody, cr: var TreeCursor): CgNode =
     result = actionToIr(tree, n, cr.info)
   of mnkTargetList:
     result = newTree(cnkTargetList, cr.info)
-    while tree[cr].kind != mnkEnd:
+    for _ in 0..<n.len:
       result.add actionToIr(tree, tree.get(cr), cr.info)
-    leave(tree, cr)
   else:
     unreachable(n.kind)
 
@@ -383,13 +379,12 @@ proc argToIr(tree: MirBody, cl: var TranslateCl,
   ## operator (which indicates that the parameter is a ``var`` parameter).
   var n {.cursor.} = tree.get(cr)
   assert n.kind in ArgumentNodes, "argument node expected: " & $n.kind
-  # the inner node may be a tag node
   n = tree.get(cr)
   case n.kind
-  of mnkTag:
-    # it is one, the expression must be an lvalue
-    result = (true, lvalueToIr(tree, cl, cr))
-    leave(tree, cr)
+  of mnkImmediate:
+    # the argument must be a 'name' one, ignore the tag and expect
+    # an lvalue expression
+    result = (n.imm.EffectKind != ekNone, lvalueToIr(tree, cl, cr))
   of LiteralDataNodes, mnkType, mnkProcVal, mnkNone:
     # not a tag but an atom
     result = (false, atomToIr(n, cl, cr.info))
@@ -398,8 +393,6 @@ proc argToIr(tree: MirBody, cl: var TranslateCl,
   else:
     unreachable("not a valid argument expression")
 
-  leave(tree, cr)
-
 proc calleeToIr(tree: MirBody, cl: var TranslateCl, cr: var TreeCursor): CgNode =
   case tree[cr].kind
   of mnkMagic:
@@ -417,6 +410,7 @@ proc callToIr(tree: MirBody, cl: var TranslateCl, n: MirNode,
   let info = cr.info
   result = newExpr((if n.kind == mnkCall: cnkCall else: cnkCheckedCall),
                    info, cl.map(n.typ))
+  tree.skip(cr) # skip the immediate value
   result.add calleeToIr(tree, cl, cr)
 
   # the code generators currently require some magics to not have any
@@ -425,7 +419,7 @@ proc callToIr(tree: MirBody, cl: var TranslateCl, n: MirNode,
                result[0].magic in FakeVarParams
 
   # translate the arguments:
-  while tree[cr].kind in ArgumentNodes:
+  for _ in 2..<(n.len.int - ord(n.kind == mnkCheckedCall)):
     var (mutable, arg) = argToIr(tree, cl, cr)
     if noAddr:
       if arg.typ.kind == tyVar:
@@ -440,8 +434,6 @@ proc callToIr(tree: MirBody, cl: var TranslateCl, n: MirNode,
   if n.kind == mnkCheckedCall:
     result.add targetToIr(tree, cr)
 
-  leave(tree, cr)
-
 proc exprToIr(tree: MirBody, cl: var TranslateCl, cr: var TreeCursor): CgNode
 
 proc sourceExprToIr(tree: MirBody, cl: var TranslateCl,
@@ -454,12 +446,10 @@ proc sourceExprToIr(tree: MirBody, cl: var TranslateCl,
     # requires a full assignment
     discard enter(tree, cr)
     result = (valueToIr(tree, cl, cr), false)
-    leave(tree, cr)
   of mnkMove:
     # an ``x = move y`` assignment can be turned into a fast assignment
     discard enter(tree, cr)
     result = (valueToIr(tree, cl, cr), true)
-    leave(tree, cr)
   of LvalueExprKinds:
     # a fast assignment is correct for all raw lvalues
     result = (lvalueToIr(tree, cl, cr), true)
@@ -507,7 +497,6 @@ proc defToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
       lvalueToIr(tree, cl, cr, preferField=false)
     else:
       sourceExprToIr(tree, cl, cr)[0]
-  leave(tree, cr)
   if n.kind in {mnkBind, mnkBindMut} and arg.typ.kind notin {tyVar, tyLent}:
     # wrap the operand in an address-of operation
     arg = newOp(cnkHiddenAddr, info, def.typ, arg)
@@ -569,15 +558,12 @@ proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
   let info = cr.info ## the source information of `n`
 
   template to(kind: CgNodeKind, args: varargs[untyped]) =
-    let r = newStmt(kind, info, args)
-    leave(tree, cr)
-    stmts.add r
+    stmts.add newStmt(kind, info, args)
 
   template toList(k: CgNodeKind, body: untyped) =
     let res {.inject.} = newStmt(k, info)
-    while tree[cr].kind != mnkEnd:
+    for _ in 0..<n.len:
       body
-    leave(tree, cr)
     stmts.add res
 
   case n.kind
@@ -606,7 +592,6 @@ proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
       # then the jump target of the next handler:
       excpt.add targetToIr(tree, cr)
 
-    leave(tree, cr)
     stmts.add excpt
     # XXX: temporary workaround, refer to ``inUnscoped`` doc comment
     inc cl.inUnscoped
@@ -617,7 +602,6 @@ proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
     # skip the candidate list, it's not relevant to code generation:
     for _ in 1..<n.len:
       tree.skip(cr)
-    leave(tree, cr)
   of mnkVoid:
     var res = exprToIr(tree, cl, cr)
     if res.typ.isEmptyType():
@@ -625,7 +609,6 @@ proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
       discard
     else:
       res = newStmt(cnkVoidStmt, info, [res])
-    leave(tree, cr)
     stmts.add res
   of mnkIf:
     to cnkIfStmt, valueToIr(tree, cl, cr), labelToIr(tree, cr)
@@ -646,7 +629,6 @@ proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
 
     res.add targetToIr(tree, cr)
     stmts.add res
-    leave(tree, cr)
   of mnkCase:
     stmts.add caseToIr(tree, env, cl, n, cr)
   of mnkAsm:
@@ -656,7 +638,6 @@ proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
     toList cnkEmitStmt:
       res.add valueToIr(tree, cl, cr)
   of mnkScope:
-    leave(tree, cr)
     scopeToIr(tree, env, cl, cr, stmts)
   of mnkDestroy:
     unreachable("a 'destroy' that wasn't lowered")
@@ -674,7 +655,6 @@ proc setElementToIr(tree: MirBody, cl: var TranslateCl,
     discard enter(tree, cr)
     result = newTree(cnkRange, unknownLineInfo,
                      [valueToIr(tree, cl, cr), valueToIr(tree, cl, cr)])
-    leave(tree, cr)
   else:
     unreachable()
 
@@ -695,9 +675,6 @@ proc caseToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl, n: MirNode,
     branch.add labelToIr(tree, cr)
 
     result.add branch
-    leave(tree, cr)
-
-  leave(tree, cr)
 
 proc exprToIr(tree: MirBody, cl: var TranslateCl,
               cr: var TreeCursor): CgNode =
@@ -707,15 +684,12 @@ proc exprToIr(tree: MirBody, cl: var TranslateCl,
   let info = cr.info
 
   template op(kind: CgNodeKind, e: CgNode): CgNode =
-    let r = newOp(kind, info, cl.map(n.typ), e)
-    leave(tree, cr)
-    r
+    newOp(kind, info, cl.map(n.typ), e)
 
   template treeOp(k: CgNodeKind, body: untyped): CgNode =
     let res {.inject.} = newExpr(k, info, cl.map(n.typ))
-    while tree[cr].kind != mnkEnd:
+    for _ in 0..<n.len:
       body
-    leave(tree, cr)
     res
 
   case n.kind
@@ -756,19 +730,19 @@ proc exprToIr(tree: MirBody, cl: var TranslateCl,
     let typ = cl.map(n.typ)
     assert typ.skipTypes(abstractVarRange).kind in {tyObject, tyRef}
     treeOp cnkObjConstr:
+      discard enter(tree, cr) # enter the binding tree
       let f = newFieldNode(lookupInType(typ, get(tree, cr).field))
       res.add newTree(cnkBinding, cr.info, [f, argToIr(tree, cl, cr)[1]])
   of mnkCall, mnkCheckedCall:
     callToIr(tree, cl, n, cr)
   of UnaryOps:
     const Map = [mnkNeg: cnkNeg]
-    treeOp Map[n.kind]:
-      res.add valueToIr(tree, cl, cr)
+    newExpr(Map[n.kind], info, cl.map(n.typ), valueToIr(tree, cl, cr))
   of BinaryOps:
     const Map = [mnkAdd: cnkAdd, mnkSub: cnkSub,
                  mnkMul: cnkMul, mnkDiv: cnkDiv, mnkModI: cnkModI]
-    treeOp Map[n.kind]:
-      res.kids = @[valueToIr(tree, cl, cr), valueToIr(tree, cl, cr)]
+    newExpr(Map[n.kind], info, cl.map(n.typ)):
+      @[valueToIr(tree, cl, cr), valueToIr(tree, cl, cr)]
   of mnkCopy, mnkMove, mnkSink:
     # translation of assignments needs to handle all modifiers
     unreachable("loose assignment modifier")
diff --git a/compiler/backend/compat.nim b/compiler/backend/compat.nim
index fa78e7e9c0a..98f82fc9fcd 100644
--- a/compiler/backend/compat.nim
+++ b/compiler/backend/compat.nim
@@ -150,13 +150,13 @@ proc translate*(t: MirTree, env: MirEnv): CgNode =
       for j in 0..<res.len:
         res.kids[j] = body
 
-      inc i # consume the end node
       res
 
     inc i # advance to the first child node
     case n.kind
     of mnkObjConstr, mnkRefConstr:
       tree cnkObjConstr:
+        inc i # skip the binding node
         let field = lookupInType(typ, t[i].field.int)
         inc i # advance to the arg node
         CgNode(kind: cnkBinding, info: unknownLineInfo,
@@ -178,9 +178,7 @@ proc translate*(t: MirTree, env: MirEnv): CgNode =
       tree cnkRange:
         recurse()
     of mnkArg:
-      let x = recurse()
-      inc i # skip the end node
-      x
+      recurse()
     of mnkNilLit:
       CgNode(kind: cnkNilLit, info: unknownLineInfo, typ: typ)
     of mnkIntLit:
@@ -200,7 +198,7 @@ proc translate*(t: MirTree, env: MirEnv): CgNode =
              astLit: env[n.ast])
     of mnkProcVal:
       CgNode(kind: cnkProc, info: unknownLineInfo, prc: n.prc, typ: typ)
-    of AllNodeKinds - ConstrTreeNodes + {mnkEnd, mnkField}:
+    of AllNodeKinds - ConstrTreeNodes + {mnkField, mnkBinding}:
       # 'end' nodes are skipped manually
       unreachable(n.kind)
 
diff --git a/compiler/mir/datatables.nim b/compiler/mir/datatables.nim
index af337cd7cd9..32a97beac17 100644
--- a/compiler/mir/datatables.nim
+++ b/compiler/mir/datatables.nim
@@ -42,7 +42,7 @@ func hashTree(tree: ConstrTree): Hash =
       result = result !& hash(n.len)
     of mnkField:
       result = result !& hash(n.field)
-    of mnkArg, mnkEnd, mnkNilLit:
+    of mnkArg, mnkNilLit, mnkBinding:
       discard
     of AllNodeKinds - ConstrTreeNodes:
       unreachable(n.kind)
@@ -74,7 +74,7 @@ proc cmp(a, b: ConstrTree): bool =
       a.len == b.len
     of mnkField:
       a.field == b.field
-    of mnkArg, mnkEnd, mnkNilLit:
+    of mnkArg, mnkNilLit, mnkBinding:
       true # same node kind -> equal nodes
     of AllNodeKinds - ConstrTreeNodes:
       unreachable(a.kind)
diff --git a/compiler/mir/injecthooks.nim b/compiler/mir/injecthooks.nim
index ad192656f02..8c1baca377a 100644
--- a/compiler/mir/injecthooks.nim
+++ b/compiler/mir/injecthooks.nim
@@ -253,9 +253,8 @@ proc injectHooks*(body: MirBody, graph: ModuleGraph, env: var MirEnv,
         #   =sink(name x, arg a.b)
         changes.replaceMulti(tree, stmt, bu):
           bu.buildVoidCall(env, op):
-            bu.subTree mnkName:
-              bu.subTree MirNode(kind: mnkTag, effect: ekMutate):
-                bu.emitFrom(tree, dest)
+            bu.emitByName ekMutate:
+              bu.emitFrom(tree, dest)
             bu.subTree mnkArg:
               bu.emitFrom(tree, src)
       else:
diff --git a/compiler/mir/mirconstr.nim b/compiler/mir/mirconstr.nim
index ea6b23213d0..3b22dcc2105 100644
--- a/compiler/mir/mirconstr.nim
+++ b/compiler/mir/mirconstr.nim
@@ -28,6 +28,8 @@ type
   Fragment* = object
     ## Identifies a fragment (usually a sub-tree) within the staging buffer.
     s: NodeSlice
+    num: int
+      ## number of child nodes in the fragment
     typ*: TypeId
 
   MirBuffer = object
@@ -37,6 +39,14 @@ type
       # XXX: should not be exported
     cursor: int
       ## points to the first node that hasn't had its ``info`` set up yet
+    num: int
+      ## number of child nodes in the current in-progress subtree
+
+  Context* = object
+    ## Low-overhead object capturing part of the builder state when
+    ## starting manual subtree construction.
+    pos: NodeIndex
+    num: int
 
   MirBuilder* = object
     ## Holds the state needed for building MIR trees and allocating
@@ -70,10 +80,6 @@ func typ*(val: Value): TypeId =
 func procNode*(id: ProcedureId): MirNode {.inline.} =
   MirNode(kind: mnkProc, prc: id)
 
-func endNode*(k: MirNodeKind): MirNode {.inline.} =
-  assert k in SubTreeNodes
-  MirNode(kind: mnkEnd, start: k)
-
 func typeLit*(t: TypeId): Value =
   Value(node: MirNode(kind: mnkType, typ: t))
 
@@ -189,12 +195,16 @@ template push*(bu: var MirBuilder, body: untyped): Fragment =
     start =
       if doSwap: bu.back.len
       else:      bu.front.len
+  var num = 0
 
   swap(bu, doSwap)
+  swap(num, bu.front.num) # change the child node counter to 0
   body
+  swap(num, bu.front.num) # restore the previous child counter
   swap(bu, doSwap)
 
   Fragment(s: NodeSlice(a: NodeIndex(start), b: NodeIndex(bu.staging.len)),
+           num: num,
            typ: if start < bu.staging.len:
                   bu.staging[start].typ
                 else:
@@ -216,9 +226,11 @@ func pop*(bu: var MirBuilder, f: Fragment) =
   if bu.swapped:
     assert f.s.b.int == bu.front.len
     popAux(bu.back, bu.front, f.s.a.int, bu.currentSourceId)
+    bu.back.num += f.num # register the nodes with current root
   else:
     assert f.s.b.int == bu.back.len
     popAux(bu.front, bu.back, f.s.a.int, bu.currentSourceId)
+    bu.front.num += f.num # register the nodes with current root
 
 template withFront*(bu: var MirBuilder, body: untyped) =
   ## Runs `body` with the final buffer as the front buffer.
@@ -279,6 +291,7 @@ func addLocal*(bu: var MirBuilder, data: sink Local): LocalId {.inline.} =
 
 func add*(bu: var MirBuilder, n: sink MirNode) {.inline.} =
   ## Emits `n` to the node buffers.
+  inc bu.front.num
   bu.front.add n
 
 func add*(bu: var MirBuilder, id: SourceId, n: sink MirNode) =
@@ -287,7 +300,7 @@ func add*(bu: var MirBuilder, id: SourceId, n: sink MirNode) =
   # the cursor is moved, so a flush has to be performed first
   bu.front.apply(bu.currentSourceId)
   n.info = id
-  bu.front.add n
+  bu.add(n)
   inc bu.front.cursor
 
 func emitFrom*(bu: var MirBuilder, tree: MirTree, n: NodePosition) =
@@ -295,13 +308,25 @@ func emitFrom*(bu: var MirBuilder, tree: MirTree, n: NodePosition) =
   bu.front.apply(bu.currentSourceId)
   bu.front.nodes.add toOpenArray(tree, int n, int tree.sibling(n)-1)
   bu.front.cursor = bu.front.len
+  inc bu.front.num # register the new node
+
+proc start*(bu: var MirBuilder, n: sink MirNode): Context {.inline.} =
+  ## Starts a subtree with `n` as the root node. Must be paired with a call
+  ## to `finish <#finish,MirBuilder,Context>`_.
+  bu.add(n)
+  result = Context(num: bu.front.num, pos: NodeIndex(bu.front.len - 1))
+  bu.front.num = 0
+
+proc finish*(bu: var MirBuilder, saved: Context) {.inline.} =
+  ## Finish the manual subtree and restores the `saved` context previously
+  ## returned by ``start``.
+  bu.front.nodes[saved.pos].len = bu.front.num.uint32
+  bu.front.num = saved.num
 
 template subTree*(bu: var MirBuilder, n: MirNode, body: untyped) =
-  let start = bu.front.len
-  bu.add n
+  let saved = bu.start n
   body
-  # note: don't use `n.kind` here as that would evaluate `n` twice
-  bu.add endNode(bu.front.nodes[start].kind)
+  bu.finish(saved) # restore the old root
 
 template subTree*(bu: var MirBuilder, k: MirNodeKind, body: untyped) =
   bu.subTree MirNode(kind: k):
@@ -369,9 +394,18 @@ template wrapMutAlias*(bu: var MirBuilder, t: TypeId, body: untyped): Value =
     body
   val
 
+template rawBuildCall*(bu: var MirBuilder, k: MirNodeKind, t: TypeId,
+                       sideEffects: bool, body: untyped) =
+  ## Builds a call tree, with `k` as the call kind, `t` as the call's return
+  ## type, and `sideEffects` indicating whether the call potentially modifies
+  ## global data.
+  bu.subTree MirNode(kind: k, typ: t):
+    bu.add MirNode(kind: mnkImmediate, imm: uint32 ord(sideEffects))
+    body
+
 template buildMagicCall*(bu: var MirBuilder, m: TMagic, t: TypeId,
                          body: untyped) =
-  bu.subTree MirNode(kind: mnkCall, typ: t):
+  bu.rawBuildCall mnkCall, t, false: # no side-effects
     bu.add MirNode(kind: mnkMagic, magic: m)
     body
 
@@ -379,7 +413,7 @@ template buildCall*(bu: var MirBuilder, prc: ProcedureId, t: TypeId,
                     body: untyped) =
   ## Build and emits a call tree to the active buffer. `pt` is the type of the
   ## procedure.
-  bu.subTree MirNode(kind: mnkCall, typ: t):
+  bu.rawBuildCall mnkCall, t, false:  # no side-effects
     bu.add procNode(prc)
     body
 
@@ -389,8 +423,8 @@ func emitByVal*(bu: var MirBuilder, y: Value) =
 
 template emitByName*(bu: var MirBuilder, e: EffectKind, body: untyped) =
   bu.subTree mnkName:
-    bu.subTree MirNode(kind: mnkTag, effect: e):
-      body
+    bu.add MirNode(kind: mnkImmediate, imm: uint32 ord(e))
+    body
 
 func emitByName*(bu: var MirBuilder, val: Value, e: EffectKind) =
   bu.emitByName e:
@@ -418,6 +452,24 @@ func join*(bu: var MirBuilder, label: LabelId) =
   bu.subTree mnkJoin:
     bu.add MirNode(kind: mnkLabel, label: label)
 
+template pathNamed*(bu: var MirBuilder, t: TypeId, f: int32, body: untyped) =
+  ## Emits a ``mnkPathNamed`` expression.
+  bu.subTree MirNode(kind: mnkPathNamed, typ: t):
+    body
+    bu.add MirNode(kind: mnkField, field: f)
+
+template pathVariant*(bu: var MirBuilder, t: TypeId, f: int32, body: untyped) =
+  ## Emits a ``mnkPathVariant`` expression.
+  bu.subTree MirNode(kind: mnkPathVariant, typ: t):
+    body
+    bu.add MirNode(kind: mnkField, field: f)
+
+template pathPos*(bu: var MirBuilder, t: TypeId, p: uint32, body: untyped) =
+  ## Emits a ``mnkPathPos`` expression.
+  bu.subTree MirNode(kind: mnkPathPos, typ: t):
+    body
+    bu.add MirNode(kind: mnkImmediate, imm: p)
+
 template buildBlock*(bu: var MirBuilder, id: LabelId, body: untyped) =
   ## Emits `body` followed by a join statement for the given `id`.
   body
diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index c124df345d4..1ec2b007290 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -282,9 +282,7 @@ template emitByVal(c: var TCtx, val: Value) =
 
 template emitByName(c: var TCtx, eff: EffectKind, body: untyped) =
   ## Emits a pass-by-name argument sub-tree with `val`.
-  c.subTree mnkName:
-    c.subTree MirNode(kind: mnkTag, effect: eff):
-      body
+  c.builder.emitByName(eff, body)
 
 template addLocal(c: var TCtx, local: Local): LocalId =
   c.builder.addLocal(local)
@@ -426,7 +424,7 @@ template buildMagicCall(c: var TCtx, m: TMagic, t: TypeId, body: untyped) =
 
 template buildCheckedMagicCall(c: var TCtx, m: TMagic, t: TypeId,
                                body: untyped) =
-  c.subTree MirNode(kind: mnkCheckedCall, typ: t):
+  c.builder.rawBuildCall mnkCheckedCall, t, false:
     c.add MirNode(kind: mnkMagic, magic: m)
     body
     raiseExit(c)
@@ -444,7 +442,7 @@ template buildDefectMagicCall(c: var TCtx, m: TMagic, t: TypeId,
     else:
       mnkCheckedCall
 
-  c.subTree MirNode(kind: kind, typ: t):
+  c.builder.rawBuildCall kind, t, false: # no side-effects
     c.add MirNode(kind: mnkMagic, magic: m)
     body
     if kind == mnkCheckedCall:
@@ -605,8 +603,7 @@ proc genFieldCheck(c: var TCtx, access: Value, call: PNode, inverted: bool,
       c.emitByVal c.genRd(call[1])
       # discriminator value operand:
       c.subTree mnkArg:
-        c.subTree MirNode(kind: mnkPathNamed, typ: c.typeToMir(discr.typ),
-                          field: discr.position.int32):
+        c.builder.pathNamed c.typeToMir(discr.typ), discr.position.int32:
           c.use access
       # inverted flag:
       c.emitByVal intLiteral(c.env, ord(inverted), BoolType)
@@ -767,7 +764,7 @@ proc genArgs(c: var TCtx, n: PNode) =
       # the procedure returns a view, but the first parameter is not something
       # that resembles a handle. We need to make sure that the first argument
       # (which the view could be created from), is passed by reference
-      c.subTree mnkName:
+      c.builder.emitByName ekNone:
         var e = exprToPmir(c, n[i], false, false)
         wantStable(e)
         genx(c, e, e.high)
@@ -784,12 +781,8 @@ proc genCall(c: var TCtx, n: PNode) =
     else:
       mnkCall
 
-  var effects: set[GeneralEffect]
-  if tfNoSideEffect notin fntyp.flags:
-    effects.incl geMutateGlobal
-
-  c.subTree MirNode(kind: kind, typ: c.typeToMir(fntyp[0]),
-                    effects: effects):
+  let hasSideEffect = tfNoSideEffect notin fntyp.flags
+  c.builder.rawBuildCall kind, c.typeToMir(fntyp[0]), hasSideEffect:
     genCallee(c, n[0])
     genArgs(c, n)
     if kind == mnkCheckedCall:
@@ -964,7 +957,7 @@ proc genMagic(c: var TCtx, n: PNode; m: TMagic) =
   of mOffsetOf:
     # an offsetOf call that has to be evaluated by the backend
     c.buildMagicCall mOffsetOf, rtyp:
-      c.subTree mnkName:
+      c.builder.emitByName ekNone:
         # prevent all checks and make sure that the original lvalue
         # expression reaches the code generators
         # XXX: this is a brittle and problematic hack. The type plus field
@@ -1067,7 +1060,7 @@ proc genMagic(c: var TCtx, n: PNode; m: TMagic) =
     # and panics are disabled, the call must be a checked call
     if optOverflowCheck in n[0].sym.options and
        optPanics notin c.graph.config.globalOptions:
-      c.buildTree mnkCheckedCall, rtyp:
+      c.builder.rawBuildCall mnkCheckedCall, rtyp, false:
         c.genCallee(n[0])
         arg n[1]
         raiseExit(c)
@@ -1174,8 +1167,7 @@ proc genMagic(c: var TCtx, n: PNode; m: TMagic) =
       # rewrite ``getAst(macro(a, b, c))`` -> ``macro(a, b, c)``
       # treat a macro call as potentially raising and as modifying global
       # data. While not wrong, it is pessimistic
-      c.subTree MirNode(kind: mnkCheckedCall, typ: rtyp,
-                        effects: {geMutateGlobal}):
+      c.builder.rawBuildCall mnkCheckedCall, rtyp, true:
         # we can use the internal signature
         genMacroCallArgs(c, n, skMacro, callee.sym.internal)
         raiseExit(c)
@@ -1239,7 +1231,7 @@ proc genObjConstr(c: var TCtx, n: PNode, isConsume: bool) =
       if isRef: mnkRefConstr
       else:     mnkObjConstr
 
-  c.subTree MirNode(kind: kind, typ: c.typeToMir(n.typ), len: uint32(n.len-1)):
+  c.subTree MirNode(kind: kind, typ: c.typeToMir(n.typ)):
     for i in 1..<n.len:
       let it = n[i]
       let field = lookupFieldAgain(n.typ.skipTypes(abstractInst), it[0].sym)
@@ -1251,8 +1243,9 @@ proc genObjConstr(c: var TCtx, n: PNode, isConsume: bool) =
         (isRef or isConsume) and
         sfCursor notin field.flags
 
-      c.add MirNode(kind: mnkField, field: field.position.int32)
-      c.emitOperandTree it[1], useConsume
+      c.subTree mnkBinding:
+        c.add MirNode(kind: mnkField, field: field.position.int32)
+        c.emitOperandTree it[1], useConsume
 
 proc genRaise(c: var TCtx, n: PNode) =
   assert n.kind == nkRaiseStmt
@@ -1273,8 +1266,7 @@ proc genRaise(c: var TCtx, n: PNode) =
       typ = skipTypes(n[0].typ, abstractPtrs)
       cp = c.graph.getCompilerProc("prepareException")
     c.buildStmt mnkVoid:
-      c.buildTree mnkCall, VoidType:
-        c.add procNode(c.env.procedures.add(cp))
+      c.builder.buildCall c.env.procedures.add(cp), VoidType:
         c.subTree mnkArg:
           # lvalue conversion to the base ``Exception`` type:
           c.buildTree mnkPathConv, c.typeToMir(cp.typ[1]):
@@ -1497,8 +1489,7 @@ proc genVarTuple(c: var TCtx, n: PNode) =
         # moved out of. The temporary tuple is not destroyed, so no
         # destructive move is required
         c.buildTree mnkMove, typ:
-          c.subTree MirNode(kind: mnkPathPos, typ: typ,
-                            position: i.uint32):
+          c.builder.pathPos typ, i.uint32:
             c.use val
 
     # it's guaranteed that all elements are moved out of the tuple, no
@@ -1677,13 +1668,13 @@ proc genCase(c: var TCtx, n: PNode, dest: Destination) =
   assert isEmptyType(n.typ) == not dest.isSome
 
   let v = genUse(c, n[0])
-  c.add MirNode(kind: mnkCase, len: uint32(n.len))
+  let start = c.builder.start MirNode(kind: mnkCase)
   c.use v
 
   let firstLabel = c.builder.nextLabel
   # first step: emit the dispatcher
   for (_, branch) in branches(n):
-    c.add MirNode(kind: mnkBranch, len: uint32(branch.len))
+    let start = c.builder.start MirNode(kind: mnkBranch)
 
     case branch.kind
     of nkElse:
@@ -1701,9 +1692,9 @@ proc genCase(c: var TCtx, n: PNode, dest: Destination) =
       unreachable(branch.kind)
 
     c.add newLabelNode(c) # the jump target
-    c.add endNode(mnkBranch)
+    c.builder.finish(start)
 
-  c.add endNode(mnkCase)
+  c.builder.finish(start)
 
   # second step: emit the branch bodies
   c.withBlock bkBlock:
@@ -1717,8 +1708,7 @@ proc genExceptBranch(c: var TCtx, n: PNode, label: LabelId,
   c.builder.useSource(c.sp, n)
   let withFilter = n.len > 1
 
-  c.subTree MirNode(kind: mnkExcept,
-                    len: uint32(1 + (n.len - 1) + ord(withFilter))):
+  c.subTree mnkExcept:
     c.add labelNode(label) # name of the except
 
     # emit the exception types the branch covers:
@@ -1787,7 +1777,7 @@ proc genFinally(c: var TCtx, n: PNode) =
 
   # the continue statement is always necessary, even if the body has no
   # structured exit
-  c.subTree MirNode(kind: mnkContinue, len: uint32(1 + blk.exits.len)):
+  c.subTree mnkContinue:
     c.add labelNode(blk.id.unsafeGet)
     for it in blk.exits.items:
       c.add labelNode(it)
@@ -1912,19 +1902,17 @@ proc genx(c: var TCtx, e: PMirExpr, i: int; fromMove = false) =
     c.buildOp mnkDerefView, typ:
       c.use toValue(c, e, i - 1)
   of pirTupleAccess:
-    c.subTree MirNode(kind: mnkPathPos, typ: typ, position: n.pos):
+    c.builder.pathPos typ, n.pos:
       recurse()
   of pirFieldAccess:
-    c.subTree MirNode(kind: mnkPathNamed, typ: typ,
-                      field: n.field.position.int32):
+    c.builder.pathNamed typ, n.field.position.int32:
       recurse()
   of pirArrayAccess, pirSeqAccess:
     c.buildOp mnkPathArray, typ:
       recurse()
       c.use toValue(c, e, n.index)
   of pirVariantAccess:
-    c.subTree MirNode(kind: mnkPathVariant, typ: typ,
-                      field: n.field.position.int32):
+    c.builder.pathVariant typ, n.field.position.int32:
       recurse()
   of pirLvalueConv:
     c.buildOp mnkPathConv, typ:
@@ -1948,8 +1936,7 @@ proc genx(c: var TCtx, e: PMirExpr, i: int; fromMove = false) =
       variant = toValue(c, e, i - 1)
       discr = genCheckedVariantAccess(c, variant, n.orig[0][1].sym.name,
                                       n.orig[n.nodeIndex])
-    c.subTree MirNode(kind: mnkPathVariant, typ: typ,
-                      field: discr.position.int32):
+    c.builder.pathVariant typ, discr.position.int32:
       c.use variant
   of pirCheckedObjConv:
     let
@@ -2162,8 +2149,8 @@ proc gen(c: var TCtx, n: PNode) =
       c.buildStmt mnkSwitch:
         # the 'switch' operations expects a variant access as the first
         # operand
-        c.subTree MirNode(kind: mnkPathVariant, typ: c.typeToMir(dest[^2].typ),
-                          field: dest[^1].field.position.int32):
+        c.builder.pathVariant c.typeToMir(dest[^2].typ),
+                              dest[^1].field.position.int32:
           genx(c, dest, dest.len - 2)
 
         genAsgnSource(c, n[1], {dfOwns}) # the source operand
@@ -2397,7 +2384,7 @@ proc generateCode*(graph: ModuleGraph, env: var MirEnv, owner: PSym,
         leaveBlock(c)
 
       # emit the handler for panicking on escaping exceptions:
-      c.subTree MirNode(kind: mnkExcept, len: 1):
+      c.subTree mnkExcept:
         c.add labelNode(b.id.unsafeGet)
       c.subTree mnkVoid:
         let p = c.graph.getCompilerProc("nimUnhandledException")
@@ -2456,15 +2443,16 @@ proc constDataToMir*(env: var MirEnv, n: PNode): MirTree =
       # no normalization/canonicalization takes place here, meaning that
       # ``Obj(a: 0, b: 1)`` and ``Obj(b: 1, a: 0)`` will result in two data
       # table entries, even though the values they represent are equivalent
-      bu.subTree MirNode(kind: mnkObjConstr, typ: typ, len: uint32(n.len-1)):
+      bu.subTree MirNode(kind: mnkObjConstr, typ: typ):
         for i in 1..<n.len:
-          bu.add MirNode(kind: mnkField, field: n[i][0].sym.position.int32)
-          bu.subTree mnkArg:
-            constToMirAux(bu, env, n[i][1])
+          bu.subTree mnkBinding:
+            bu.add MirNode(kind: mnkField, field: n[i][0].sym.position.int32)
+            bu.subTree mnkArg:
+              constToMirAux(bu, env, n[i][1])
     of nkCurly:
       # similar to object construction, no normalization means that ``{1, 2}``
       # and ``{2, 1}`` results in two data table entries
-      bu.subTree MirNode(kind: mnkSetConstr, typ: typ, len: uint32(n.len)):
+      bu.subTree MirNode(kind: mnkSetConstr, typ: typ):
         for it in n.items:
           constToMirAux(bu, env, it)
     of nkBracket, nkTupleConstr, nkClosure:
@@ -2476,7 +2464,7 @@ proc constDataToMir*(env: var MirEnv, n: PNode): MirTree =
         of tyProc:                  mnkClosureConstr
         else:                       unreachable()
 
-      bu.subTree MirNode(kind: kind, typ: typ, len: uint32(n.len)):
+      bu.subTree MirNode(kind: kind, typ: typ):
         for it in n.items:
           bu.subTree mnkArg:
             constToMirAux(bu, env, it.skipColon)
@@ -2491,7 +2479,7 @@ proc constDataToMir*(env: var MirEnv, n: PNode): MirTree =
       else:
         unreachable()
     of nkRange:
-      bu.subTree MirNode(kind: mnkRange, len: 2):
+      bu.subTree MirNode(kind: mnkRange):
         constToMirAux(bu, env, n[0])
         constToMirAux(bu, env, n[1])
     of nkNilLit:
diff --git a/compiler/mir/mirpasses.nim b/compiler/mir/mirpasses.nim
index ab68eae6970..c9b3d498899 100644
--- a/compiler/mir/mirpasses.nim
+++ b/compiler/mir/mirpasses.nim
@@ -143,7 +143,7 @@ proc preventRvo(tree: MirTree, types: TypeEnv, changes: var Changeset) =
       dest = tree.operand(i, 0)
       path = computePath(tree, NodePosition dest)
     var needsTemp = false
-    for kind, it in arguments(tree, NodePosition source):
+    for kind, _, it in arguments(tree, NodePosition source):
       let (check, arg) =
         case kind
         of mnkArg:
@@ -161,7 +161,7 @@ proc preventRvo(tree: MirTree, types: TypeEnv, changes: var Changeset) =
           else:
             (false, OpValue 0)
         of mnkName:
-          (true, tree.skip(it, mnkTag))
+          (true, it)
         of mnkConsume:
           (false, OpValue 0)
 
@@ -356,8 +356,8 @@ proc eliminateTemporaries(tree: MirTree, types: TypeEnv,
         # as eliding the temporary would be obersvable when the backend decides
         # to use pass-by-reference for the immutable parameter
         elide = true # unless proven otherwise
-        for k, arg in arguments(tree, expr):
-          if tree[arg].kind == mnkTag and overlaps(p, typ, tree.operand(arg)):
+        for k, eff, arg in arguments(tree, expr):
+          if eff != ekNone and overlaps(p, typ, arg):
             elide = false
             break
 
@@ -580,7 +580,7 @@ proc injectStrPreparation(tree: MirTree, graph: ModuleGraph, env: var MirEnv,
   # storage
   for i, node in tree.pairs:
     case node.kind
-    of mnkAsgn, mnkInit, mnkMutView, mnkTag:
+    of mnkAsgn, mnkInit, mnkMutView:
       let op = tree.child(i, 0) # the operand
       if isStringAccess(op):
         # either
@@ -589,6 +589,14 @@ proc injectStrPreparation(tree: MirTree, graph: ModuleGraph, env: var MirEnv,
         insertPrepareCall(changes, tree, tree.child(op, 0),
                           env.procedures.add(prc))
 
+    of mnkName:
+      let op = tree.child(i, 1)
+      if tree.effect(i) != ekNone and isStringAccess(op):
+        # an item of the string is passed to a parameter supporting
+        # mutation
+        insertPrepareCall(changes, tree, tree.child(op, 0),
+                          env.procedures.add(prc))
+
     of mnkToMutSlice:
       if env[tree[i, 0].typ].skipTypes(abstractInst).kind == tyString:
         # conservatively prepare the string for mutation when creating a
diff --git a/compiler/mir/mirtrees.nim b/compiler/mir/mirtrees.nim
index dc85592c4ce..00f9b5b70e5 100644
--- a/compiler/mir/mirtrees.nim
+++ b/compiler/mir/mirtrees.nim
@@ -82,6 +82,9 @@ type
     # store the type of the destination within each def, assignment, etc. and
     # then remove the type field from ``MirNode``
 
+    mnkImmediate ## special node only allowed in certain contexts. Used to
+                 ## store extra, context-dependent information in the tree
+
     mnkMagic  ## only allowed in a callee position. Refers to a magic
               ## procedure
 
@@ -176,10 +179,6 @@ type
               ## currently active exception. Otherwise, consumes the operand
               ## and sets it as the active exception
 
-    mnkTag    ## must only appear as the immediate subnode to a ``mnkName``
-              ## tree. Describes what kind of mutation is applied to the
-              ## lvalue within the called procedure
-
     mnkSetConstr  ## constructor for set values
     mnkRange      ## range constructor. May only appear in set constructions
                   ## and as a branch label
@@ -189,6 +188,8 @@ type
     mnkClosureConstr## constructor for closure values
     mnkObjConstr  ## constructor for object values
     mnkRefConstr  ## allocates a new managed heap cell and initializes it
+    mnkBinding    ## only valid as an object or ref construction child node.
+                  ## Associates an argument with a field
 
     mnkCopy   ## denotes the assignment as copying the source value
     mnkMove   ## denotes the assignment as moving the value. This does
@@ -242,14 +243,8 @@ type
     mnkAsm    ## embeds backend-dependent code directly into the output
     mnkEmit   ## embeds backend-dependent code directly into the output
 
-    mnkEnd    ## marks the end of a sub-tree. Has no behaviour associated with
-              ## it -- it's only required to know where a sub-tree ends
-    # future direction: replace the End node with storing the number of sub-
-    # nodes of a sub-tree on the node itself. This will require significant
-    # structural changes, as not all node kinds are able to use the length
-    # field at the moment
-
   EffectKind* = enum
+    ekNone      ## no effect
     ekMutate    ## the value in the location is mutated
     ekReassign  ## a new value is assigned to the location
     ekKill      ## the value is removed from the location (without observing
@@ -258,9 +253,6 @@ type
                 ## value become outdated. The state of it is now completely
                 ## unknown
 
-  GeneralEffect* = enum
-    geMutateGlobal ## the operation mutates global state
-
   MirNode* = object
     typ*: TypeId ## valid for all expression, including all calls
     info*: SourceId
@@ -275,7 +267,7 @@ type
       cnst*: ConstId
     of mnkParam, mnkLocal, mnkTemp, mnkAlias:
       local*: LocalId
-    of mnkField, mnkPathNamed, mnkPathVariant:
+    of mnkField:
       field*: int32
         ## field position
     of mnkIntLit, mnkUIntLit, mnkFloatLit:
@@ -284,20 +276,15 @@ type
       strVal*: StringId
     of mnkAstLit:
       ast*: AstId
-    of mnkPathPos:
-      position*: uint32 ## the 0-based position of the field
-    of mnkCall, mnkCheckedCall:
-      effects*: set[GeneralEffect]
     of mnkLabel, mnkLeave:
       label*: LabelId
+    of mnkImmediate:
+      imm*: uint32 ## meaning depends on the context
     of mnkMagic:
       magic*: TMagic
-    of mnkEnd:
-      start*: MirNodeKind ## the kind of the corresponding start node
-    of mnkTag:
-      effect*: EffectKind ## the effect that happens when the operator the
-                          ## tagged value is passed to is executed
-    else:
+    of mnkNone, mnkNilLit, mnkType, mnkResume:
+      discard
+    of {low(MirNodeKind)..high(MirNodeKind)} - {mnkNone .. mnkLeave}:
       len*: uint32
 
   MirTree* = seq[MirNode]
@@ -325,13 +312,12 @@ const
   AtomNodes* = {mnkNone..mnkLeave}
     ## Nodes that don't support sub nodes.
 
-  SubTreeNodes* = AllNodeKinds - AtomNodes - {mnkEnd}
-    ## Nodes that start a sub-tree. They're always matched with an ``mnkEnd``
-    ## node.
+  SubTreeNodes* = AllNodeKinds - AtomNodes
+    ## Nodes that start a sub-tree. They always store a length.
 
   SingleOperandNodes* = {mnkPathNamed, mnkPathPos, mnkPathVariant, mnkPathConv,
                          mnkAddr, mnkDeref, mnkView, mnkDerefView, mnkStdConv,
-                         mnkConv, mnkCast, mnkRaise, mnkTag, mnkArg,
+                         mnkConv, mnkCast, mnkRaise, mnkArg,
                          mnkName, mnkConsume, mnkVoid, mnkCopy, mnkMove,
                          mnkSink, mnkDestroy, mnkMutView, mnkToMutSlice}
     ## Nodes that start sub-trees but that always have a single sub node.
@@ -351,7 +337,8 @@ const
   ConstrTreeNodes* = {mnkSetConstr, mnkRange, mnkArrayConstr, mnkSeqConstr,
                       mnkTupleConstr, mnkClosureConstr, mnkObjConstr,
                       mnkRefConstr, mnkProcVal, mnkArg, mnkField,
-                      mnkEnd} + LiteralDataNodes
+                      mnkBinding} +
+                     LiteralDataNodes
     ## Nodes that can appear in the MIR subset used for constant expressions.
 
   StmtNodes* = {mnkScope, mnkGoto, mnkIf, mnkCase, mnkLoop, mnkJoin,
@@ -432,68 +419,48 @@ func `in`*(p: NodePosition, tree: MirTree): bool {.inline.} =
 template `[]`*(tree: MirTree, i: NodePosition | OpValue): untyped =
   tree[ord(i)]
 
+template isAtom(kind: MirNodeKind): bool =
+  # much faster than an `in SubTreeNodes` test
+  ord(kind) <= ord(mnkLeave)
+
 func parent*(tree: MirTree, n: NodePosition): NodePosition =
   result = n
-
-  var depth = 1
-  while depth > 0:
+  # walk backwards and compute the total number of nodes covered so far.
+  # Once the covered region includes the node we started at, we've found the
+  # parent
+  var covered = 0'u32
+  while true:
     dec result
 
-    let kind = tree[result].kind
-    depth += ord(kind == mnkEnd) - ord(kind in SubTreeNodes)
+    let node = tree[result]
+    if not isAtom(node.kind):
+      covered += node.len
 
-func parentEnd*(tree: MirTree, n: NodePosition): NodePosition =
-  # Computes the position of the ``mnkEnd`` node belonging to the sub-tree
-  # enclosing `n`
-  result = n
-
-  # start at depth '2' if `n` starts a sub-tree itself. The terminator of said
-  # sub-tree would be treated as the parent's end otherwise
-  var depth = 1 + ord(tree[n].kind in SubTreeNodes)
-  while depth > 0:
-    inc result
-
-    let kind = tree[result].kind
-    depth += ord(kind in SubTreeNodes) - ord(kind == mnkEnd)
+    if uint32(result) + covered >= uint32(n):
+      break
 
 func sibling*(tree: MirTree, n: NodePosition): NodePosition =
-  ## Computes the index of the next sibling node of `x`
-  # TODO: should return a option. Not all nodes have siblings
-  # TODO: since this doesn't consider 'end' nodes, the procedure should
-  #       probably be renamed to ``rawSibling``?
-  result = n + 1
-
-  var depth = ord(tree[n].kind in SubTreeNodes)
-  while depth > 0:
-    let kind = tree[result].kind
-    # to be more efficient, we don't use branching. We're incrementing
-    # `depth` whenever we encounter the start of a sub-tree and decrement
-    # it when an 'end' node is encountered
-    depth += ord(kind in SubTreeNodes) - ord(kind == mnkEnd)
-
+  ## Computes the index of the next node/sub-tree following the node at `n`.
+  # XXX: `sibling` is a misnomer; `next` would be more fitting
+  result = n
+  var last = n
+  while result <= last:
+    let node = tree[result]
+    if not isAtom(node.kind):
+      inc last, node.len.int
     inc result
 
-  if result.int == tree.len or tree[result].kind == mnkEnd:
-    # no sibling exists
-    discard
-
 func previous*(tree: MirTree, n: NodePosition): NodePosition =
   ## Computes the index of `n`'s the preceding sibling node. If there
-  ## is none, returns the index of the parent node.
-  var i = n - 1
-
-  var depth = ord(tree[i].kind == mnkEnd)
-  while depth > 0:
-    dec i
-    let kind = tree[i].kind
-
-    # to be more efficient, we don't use branching. We're incrementing
-    # `depth` whenever we encounter the end of a sub-tree and decrement
-    # it when a start of one is encountered
-    depth += ord(kind == mnkEnd) - ord(kind in SubTreeNodes)
-
-  assert ord(i) >= 0
-  result = i
+  ## is none, returns the index of the parent node. **This is a slow
+  ## operation, it should be used sparingly.**
+  # XXX: could be optimized to not require first seeking to the parent
+  result = tree.parent(n)
+  var next = result + 1 # first child node
+  # advance the position until the sibling is `n`
+  while next < n:
+    result = next
+    next = tree.sibling(result)
 
 func computeSpan*(tree: MirTree, n: NodePosition): Slice[NodePosition] =
   ## If `n` refers to a leaf node, returns a span with the `n` as the single
@@ -502,24 +469,6 @@ func computeSpan*(tree: MirTree, n: NodePosition): Slice[NodePosition] =
   ## at `n`. The 'end' node is included.
   result = n .. (sibling(tree, n) - 1)
 
-func start*(tree: MirTree, n: NodePosition): NodePosition =
-  ## Find the corresponding start node for an ``mnkEnd`` node
-  assert tree[n].kind == mnkEnd
-  result = n
-
-  var depth = 1
-  while depth > 0:
-    dec result
-
-    let kind = tree[result].kind
-    depth += ord(kind == mnkEnd) - ord(kind in SubTreeNodes)
-
-func findEnd*(tree: MirTree, n: NodePosition): NodePosition =
-  ## Finds the corresponding ``end`` node for the node `n` that starts a
-  ## sub-tree
-  assert tree[n].kind in SubTreeNodes
-  result = sibling(tree, n) - 1
-
 func child*(tree: MirTree, n: NodePosition, index: Natural): NodePosition =
   ## Returns the position of the child node at index `index`. `index` *must*
   ## refer to a valid sub-node -- no validation is performed
@@ -541,13 +490,12 @@ func `[]`*(tree: MirTree, n: OpValue, index: Natural): lent MirNode =
   ## Returns the `index`-th child node of sub-tree `n`.
   tree[child(tree, NodePosition n, index)]
 
-func getStart*(tree: MirTree, n: NodePosition): NodePosition =
-  ## If `n` refers to an ``end`` node, returns the corresponding start node --
-  ## `n` otherwise
-  if tree[n].kind == mnkEnd:
-    start(tree, n)
-  else:
-    n
+func last*(tree: MirTree, n: NodePosition): NodePosition =
+  ## Returns the last child node in the subtree at `n`.
+  let skip = tree[n].len - 1
+  result = tree.child(n, 0)
+  for _ in 0..<skip:
+    result = tree.sibling(result)
 
 func findParent*(tree: MirTree, start: NodePosition,
                  kind: MirNodeKind): NodePosition =
@@ -561,43 +509,34 @@ func findParent*(tree: MirTree, start: NodePosition,
 
 func len*(tree: MirTree, n: NodePosition): int =
   ## Computes the number of child nodes for the given sub-tree node.
-  var n = n + 1
-  while tree[n].kind != mnkEnd:
-    inc result
-    n = tree.sibling(n)
+  tree[n].len.int
 
 func numArgs*(tree: MirTree, n: NodePosition): int =
   ## Counts and returns the number of *call arguments* in the call tree at
   ## `n`.
   assert tree[n].kind in CallKinds
-  var n = tree.sibling(n + 1) # skip the callee
-  while tree[n].kind in ArgumentNodes:
-    inc result
-    n = tree.sibling(n)
+  result = tree[n].len.int - 2 - ord(tree[n].kind == mnkCheckedCall)
 
 func operand*(tree: MirTree, op: OpValue|NodePosition): OpValue =
-  ## Returns the index (``OpValue``) of the operand for the single-input node
-  ## at `op`.
-  assert tree[op].kind in SingleOperandNodes, $tree[op].kind
+  ## Returns the index (``OpValue``) of the operand for the single-operand
+  ## operation at `op`.
   let pos =
     when op is NodePosition: op
     else:                    NodePosition(op)
-  result = OpValue(pos + 1)
+  case tree[op].kind
+  of SingleOperandNodes - {mnkName}:
+    OpValue(pos + 1)
+  of mnkName:
+    OpValue(pos + 2)
+  else:
+    unreachable()
 
 func argument*(tree: MirTree, n: NodePosition, i: Natural): OpValue =
   ## Returns the `i`-th argument in the call-like tree at `n`, skipping
   ## tag nodes. It is expected that the call has at least `i` + 1
   ## arguments.
   assert tree[n].kind in CallKinds
-  var n = tree.sibling(n + 1)
-  for _ in 0..<i:
-    n = tree.sibling(n)
-  n = NodePosition tree.operand(n)
-  # skip the tag node if one exists
-  if tree[n].kind == mnkTag:
-    tree.operand(n)
-  else:
-    OpValue n
+  result = tree.operand(tree.child(n, 2 + i))
 
 func skip*(tree: MirTree, n: OpValue, kind: MirNodeKind): OpValue =
   ## If `n` is of `kind`, return its operand node, `n` otherwise.
@@ -613,19 +552,26 @@ iterator pairs*(tree: MirTree): (NodePosition, lent MirNode) =
 
 iterator subNodes*(tree: MirTree, n: NodePosition): NodePosition =
   ## Iterates over and yields all direct child nodes of `n`
-  var r = n + 1
-  while tree[r].kind != mnkEnd:
-    yield r
-    r = sibling(tree, r)
+  let L = tree[n].len
+  var n = tree.child(n, 0)
+  for _ in 0..<L:
+    yield n
+    n = tree.sibling(n)
 
-iterator arguments*(tree: MirTree, n: NodePosition): (ArgKinds, OpValue) =
+iterator arguments*(tree: MirTree, n: NodePosition): (ArgKinds, EffectKind, OpValue) =
   ## Returns the argument kinds together with the operand node (or tag tree).
   assert tree[n].kind in CallKinds
-  var i = tree.sibling(n + 1) # skip the callee
-  # XXX: iterating until no more argument nodes are found is a temporary
-  #      workaround until call nodes store their number of sub-nodes
-  while tree[i].kind in ArgumentNodes:
-    yield (ArgKinds(tree[i].kind), tree.operand(i))
+  # the jump target of checked calls is not an argument
+  let len = tree[n].len.int - ord(tree[n].kind == mnkCheckedCall)
+  var i = tree.child(n, 2) # skip the callee and effect node
+  for _ in 2..<len:
+    let node = tree[i]
+    let eff =
+      case node.kind
+      of mnkName: tree[i + 1].imm.EffectKind
+      else:       ekNone
+    # for efficiency, only use a single yield
+    yield (ArgKinds(node.kind), eff, tree.operand(i))
     i = tree.sibling(i)
 
 func findDef*(tree: MirTree, n: NodePosition): NodePosition =
@@ -646,7 +592,10 @@ func findDef*(tree: MirTree, n: NodePosition): NodePosition =
          tree[name].local == expected:
         return
 
-    result = tree.previous(result)
+    # seek to the previous statement:
+    dec result
+    while tree[result].kind notin StmtNodes:
+      dec result
 
   unreachable("no corresponding def found")
 
@@ -657,4 +606,28 @@ iterator lpairs*[T](x: seq[T]): (int, lent T) =
   let L = x.len
   while i < L:
     yield (i, x[i])
-    inc i
\ No newline at end of file
+    inc i
+
+# -------------------------------
+# queries for specific node kinds
+
+func callee*(tree: MirTree, n: NodePosition): NodePosition {.inline.} =
+  ## Returns the callee node for the call subtree `n`.
+  assert tree[n].kind in CallKinds
+  n + 2
+
+proc mutatesGlobal*(tree: MirTree, n: NodePosition): bool {.inline.} =
+  ## Whether evaluating the call expression at `n` potentially mutates
+  ## global state.
+  assert tree[n].kind in CallKinds
+  tree[n, 0].imm.bool
+
+func effect*(tree: MirTree, n: NodePosition): EffectKind {.inline.} =
+  ## Returns the effect for the ``mnkName`` node at `n`.
+  assert tree[n].kind == mnkName
+  tree[n, 0].imm.EffectKind
+
+func field*(tree: MirTree, n: NodePosition): int32 {.inline.} =
+  ## Returns the field position specified for the field access at `n`.
+  assert tree[n].kind in {mnkPathNamed, mnkPathVariant}
+  tree[n, 1].field
diff --git a/compiler/mir/rtchecks.nim b/compiler/mir/rtchecks.nim
index fd718dfd4a1..b136f6bf851 100644
--- a/compiler/mir/rtchecks.nim
+++ b/compiler/mir/rtchecks.nim
@@ -64,13 +64,13 @@ template emitCall(bu; tree; call; prc: ProcedureId, arguments: untyped) =
   ## Emits a void call of `prc`, inherting the checked-ness from `call`.
   bu.subTree mnkVoid:
     # if the input call is a checked call, so is the new call
-    bu.subTree tree[call].kind, VoidType:
+    bu.rawBuildCall tree[call].kind, VoidType, false:
       bu.add procNode(prc) # callee
       arguments # custom arguments
 
       if tree[call].kind == mnkCheckedCall:
         # copy the jump target
-        bu.emitFrom(tree, tree.previous(findEnd(tree, call)))
+        bu.emitFrom(tree, tree.last(call))
 
 proc addCompilerProc(env; graph; name: string): ProcedureId =
   env.procedures.add(graph.getCompilerProc(name))
@@ -441,7 +441,7 @@ proc emitCheckedBinaryIntOp(tree; call; graph; env; bu): Value =
   ##     raiseOverflow()
   ##   result = _1
   let
-    magic = tree[call + 1].magic
+    magic = tree[tree.callee(call)].magic
     t = env[tree[call].typ].skipTypes(abstractRange)
     x = NodePosition tree.argument(call, 0)
     y = NodePosition tree.argument(call, 1)
@@ -540,7 +540,7 @@ proc emitCheckedFloatOp(tree; call; graph; env; bu): Value =
   let typ = tree[call].typ
   const Map = [mAddF64: mnkAdd, mSubF64: mnkSub, mMulF64: mnkMul, mDivF64: mnkDiv]
   result = bu.wrapTemp typ:
-    bu.subTree Map[tree[call + 1].magic], typ:
+    bu.subTree Map[tree[tree.callee(call)].magic], typ:
       bu.emitFrom(tree, NodePosition tree.argument(call, 0))
       bu.emitFrom(tree, NodePosition tree.argument(call, 1))
 
diff --git a/compiler/mir/treechangesets.nim b/compiler/mir/treechangesets.nim
index fcfae9b2ab2..16863942c60 100644
--- a/compiler/mir/treechangesets.nim
+++ b/compiler/mir/treechangesets.nim
@@ -94,16 +94,11 @@ func replace*(c: var Changeset, tree: MirTree, at: NodePosition,
 func changeTree*(c: var Changeset, tree: MirTree, at: NodePosition,
                  with: sink MirNode) =
   ## Replaces the sub-tree at `at` with `with` while keeping all child trees.
-  ## The origin information is taken from the replaced node.
-  let
-    e = tree.findEnd(at)
-    with2 = MirNode(kind: mnkEnd, start: with.kind, info: tree[e].info)
-
+  ## The origin and length information is taken from the replaced node.
   {.cast(noSideEffect).}: # XXX: compiler bug workaround
     with.info = tree[at].info
+    with.len = tree[at].len
   c.rows.add row(at, at+1, c.nodes.addSingle(with))
-  # the end node needs to be replaced too
-  c.rows.add row(e, e+1, c.nodes.addSingle(with2))
 
 func insert*(c: var Changeset, at: NodePosition, n: sink MirNode) =
   ## Records the insertion of `n` at `at`. The ``info`` field on the node
diff --git a/compiler/mir/utils.nim b/compiler/mir/utils.nim
index 9b2d695c729..4a4362feb80 100644
--- a/compiler/mir/utils.nim
+++ b/compiler/mir/utils.nim
@@ -38,7 +38,7 @@ func `$`(n: MirNode): string =
   of mnkParam, mnkLocal, mnkTemp, mnkAlias:
     result.add " local: "
     result.addInt n.local.uint32
-  of mnkField, mnkPathNamed, mnkPathVariant:
+  of mnkField:
     result.add " field:"
     result.addInt n.field
   of mnkIntLit, mnkUIntLit, mnkFloatLit:
@@ -50,27 +50,20 @@ func `$`(n: MirNode): string =
   of mnkAstLit:
     result.add " ast: "
     result.addInt n.ast.uint32
-  of mnkPathPos:
-    result.add " position: "
-    result.add $n.position
-  of mnkCall, mnkCheckedCall:
-    result.add " effects: "
-    result.add $n.effects
   of mnkMagic:
     result.add " magic: "
     result.add $n.magic
   of mnkLabel, mnkLeave:
     result.add " label: "
     result.addInt n.label.uint32
-  of mnkEnd:
-    result.add " start: "
-    result.add $n.start
-  of mnkTag:
-    result.add " effect: "
-    result.add $n.effect
-  else:
+  of mnkImmediate:
+    result.add " imm: "
+    result.addInt n.imm
+  of mnkNone, mnkNilLit, mnkType, mnkResume:
+    discard
+  of SubTreeNodes:
     result.add " len: "
-    result.add $n.len
+    result.addInt n.len
 
   if n.typ != VoidType:
     result.add " typ: "
@@ -96,26 +89,14 @@ proc treeRepr*(tree: MirTree, pos = NodePosition(0)): string =
 
     case n.kind
     of SubTreeNodes:
-      var sub = 0
-      while true:
+      for sub in 0..<n.len.int:
         if i >= nodes.len:
-          line repeat("  ", indent), "out of bounds: end expected for ",
-               n.kind
+          line repeat("  ", indent+1), "error: nodes are missing"
           break
-        elif nodes[i].kind == mnkEnd:
-          if nodes[i].start == n.kind:
-            inc i
-            break
-          else:
-            line repeat("  ", indent+1), "loose end: ", nodes[i].start,
-                 " expected: ", n.kind
-            inc i
         else:
           aux(result, nodes, indent+1, sub, i)
 
-        inc sub
-
-    of AtomNodes + {mnkEnd}:
+    of AtomNodes:
       discard "already rendered"
 
   var i = pos.int
@@ -284,7 +265,6 @@ proc valueToStr(nodes: MirTree, i: var int, result: var string, c: RenderCtx) =
   template tree(start: string, body: untyped) =
     result.add start
     body
-    inc i # the end node
 
   let n {.cursor.} = next(nodes, i)
   case n.kind
@@ -298,13 +278,13 @@ proc valueToStr(nodes: MirTree, i: var int, result: var string, c: RenderCtx) =
     tree "":
       valueToStr()
       result.add "."
-      result.addInt n.position
+      result.addInt next(nodes, i).imm
   of mnkPathNamed, mnkPathVariant:
     tree "":
       let typ = nodes[i].typ # type of the object operand
       valueToStr()
       result.add "."
-      fieldToStr(n.field, typ, result, c)
+      fieldToStr(next(nodes, i).field, typ, result, c)
   of mnkPathConv:
     tree "":
       valueToStr()
@@ -340,14 +320,11 @@ proc argToStr(tree: MirTree, i: var int, result: var string, c: RenderCtx) =
   of AllNodeKinds - ArgumentNodes:
     result.error(n)
 
-  if tree[i].kind == mnkTag:
+  # skip the effect immediate that leads 'name' trees
+  if n.kind == mnkName:
     discard next(tree, i)
-    valueToStr()
-    inc i # skip the tag's end node
-  else:
-    valueToStr()
 
-  inc i # skip the end node
+  valueToStr()
 
 template argToStr() =
   argToStr(treeParam(), i, result, c)
@@ -360,6 +337,13 @@ proc labelToStr(nodes: MirTree, i: var int, result: var string) =
   else:
     error(result, n)
 
+template commaSeparated(len: uint32, body: untyped) =
+  let x = len # capture the expression
+  for i in 0..<x:
+    if i > 0:
+      result.add ", "
+    body
+
 proc targetToStr(nodes: MirTree, i: var int, result: var string) =
   var n {.cursor.} = next(nodes, i)
   case n.kind
@@ -367,11 +351,8 @@ proc targetToStr(nodes: MirTree, i: var int, result: var string) =
     result.add n.label
   of mnkTargetList:
     result.add "["
-    let start = i
-    while (n = next(nodes, i); n.kind != mnkEnd):
-      if i > start + 1:
-        result.add ", "
-
+    commaSeparated n.len:
+      n = next(nodes, i)
       case n.kind
       of mnkLabel:  result.add n.label
       of mnkLeave:  result.add "Leave(L" & $n.label.int & ")"
@@ -390,18 +371,9 @@ proc exprToStr(nodes: MirTree, i: var int, result: var string, c: RenderCtx) =
     result.add start
     inc i # skip the start node
     body
-    inc i # skip the end node
 
-  template commaSeparated(body: untyped) =
-    var first = true
-    while nodes[i].kind != mnkEnd:
-      if first:
-        first = false
-      else:
-        result.add ", "
-      body
-
-  case nodes[i].kind
+  let n {.cursor.} = nodes[i]
+  case n.kind
   of LvalueExprKinds + Atoms:
     valueToStr()
   of mnkAddr:
@@ -412,7 +384,7 @@ proc exprToStr(nodes: MirTree, i: var int, result: var string, c: RenderCtx) =
       valueToStr()
   of mnkToSlice, mnkToMutSlice:
     tree "toOpenArray ":
-      commaSeparated:
+      commaSeparated n.len:
         valueToStr()
   of mnkConv:
     tree "conv ":
@@ -425,27 +397,27 @@ proc exprToStr(nodes: MirTree, i: var int, result: var string, c: RenderCtx) =
       valueToStr()
   of mnkArrayConstr:
     tree "[":
-      commaSeparated:
+      commaSeparated n.len:
         argToStr()
       result.add "]"
   of mnkSeqConstr:
     tree "@[":
-      commaSeparated:
+      commaSeparated n.len:
         argToStr()
       result.add "]"
   of mnkTupleConstr:
     tree "(":
-      commaSeparated:
+      commaSeparated n.len:
         argToStr()
       result.add ")"
   of mnkClosureConstr:
     tree "closure (":
-      commaSeparated:
+      commaSeparated n.len:
         argToStr()
       result.add ")"
   of mnkSetConstr:
     tree "{":
-      commaSeparated:
+      commaSeparated n.len:
         exprToStr(nodes, i, result, c)
       result.add "}"
   of mnkRange:
@@ -456,27 +428,27 @@ proc exprToStr(nodes: MirTree, i: var int, result: var string, c: RenderCtx) =
   of mnkObjConstr, mnkRefConstr:
     let typ = nodes[i].typ
     tree "(":
-      commaSeparated:
-        fieldToStr(next(nodes, i).field, typ, result, c)
-        result.add ": "
-        argToStr()
+      commaSeparated n.len:
+        tree "":
+          fieldToStr(next(nodes, i).field, typ, result, c)
+          result.add ": "
+          argToStr()
       result.add ")"
   of mnkCall:
     tree "":
+      inc i # skip the immediate value
       calleeToStr(nodes, i, result, c)
       result.add "("
-      commaSeparated:
+      commaSeparated n.len - 2:
         argToStr()
       result.add ")"
   of mnkCheckedCall:
     tree "":
+      inc i # skip the immediate value
       calleeToStr(nodes, i, result, c)
       result.add "("
       # arguments:
-      let first = i
-      while nodes[i].kind in ArgumentNodes:
-        if i > first:
-          result.add ", "
+      commaSeparated n.len - 3:
         argToStr()
 
       # jump target:
@@ -484,16 +456,14 @@ proc exprToStr(nodes: MirTree, i: var int, result: var string, c: RenderCtx) =
       targetToStr()
   of UnaryOps:
     const Map = [mnkNeg: "-"]
-    let kind = nodes[i].kind
-    tree Map[kind]:
+    tree Map[n.kind]:
       valueToStr()
   of BinaryOps:
-    let kind = nodes[i].kind
     tree "":
       valueToStr() # first operand
       const Map = [mnkAdd: " + ", mnkSub: " - ",
                    mnkMul: " * ", mnkDiv: " div ", mnkModI: " mod "]
-      result.add Map[kind]
+      result.add Map[n.kind]
       valueToStr() # second operand
   of mnkCopy:
     tree "copy ":
@@ -506,7 +476,7 @@ proc exprToStr(nodes: MirTree, i: var int, result: var string, c: RenderCtx) =
       valueToStr()
   else:
     # TODO: make this branch exhaustive
-    result.error(nodes[i])
+    result.error(n)
     inc i
 
 template exprToStr() =
@@ -622,19 +592,13 @@ proc stmtToStr(nodes: MirTree, i: var int, indent: var int, result: var string,
             result.add ": goto "
             labelToStr(nodes, i, result)
             result.add "\n"
-          inc i # skip the end node
         else:
           # make no attempt at error correction
           result.error(b)
 
   of mnkAsm, mnkEmit:
     tree (if n.kind == mnkAsm: "asm " else: "emit "):
-      var first = true
-      while nodes[i].kind != mnkEnd:
-        if first:
-          first = false
-        else:
-          result.add ", "
+      commaSeparated n.len:
         valueToStr()
       result.add "\n"
   of mnkVoid:
@@ -684,15 +648,6 @@ proc stmtToStr(nodes: MirTree, i: var int, indent: var int, result: var string,
   of AllNodeKinds - StmtNodes:
     result.error(n)
 
-  # skip the end node
-  i += ord(n.kind in SubTreeNodes)
-
-proc renderList(tree: MirTree, i: var int, indent: int, result: var string,
-                c: RenderCtx) =
-  var indent = indent # support mutation
-  while i < tree.len and tree[i].kind != mnkEnd:
-    stmtToStr(tree, i, indent, result, c)
-
 proc exprToStr*(tree: MirTree, n: NodePosition; env: ptr MirEnv = nil;
                 body: ptr MirBody = nil): string =
   ## Renders the expression at `n` into a human-readable text representation.
@@ -712,7 +667,9 @@ proc render*(tree: MirTree; env: ptr MirEnv = nil;
   ## Renders `tree` into a human-readable text representation. The output is
   ## meant for debugging and tracing and is not guaranteed to have a stable
   ## format.
+  let ctx = RenderCtx(env: env, body: body)
   var
     i = 0
     indent = 0
-  renderList(tree, i, indent, result, RenderCtx(env: env, body: body))
+  while i < tree.len:
+    stmtToStr(tree, i, indent, result, ctx)
diff --git a/compiler/sem/aliasanalysis.nim b/compiler/sem/aliasanalysis.nim
index dc55551c1f7..8906d6bc5b4 100644
--- a/compiler/sem/aliasanalysis.nim
+++ b/compiler/sem/aliasanalysis.nim
@@ -146,11 +146,11 @@ proc computePath*(tree: MirTree, at: NodePosition): Path =
   while true:
     case tree[pos].kind
     of mnkPathNamed, mnkPathVariant:
-      add pikNamed, pos
+      add pikNamed, tree.child(pos, 1)
     of mnkPathConv:
       discard "ignore"
     of mnkPathPos:
-      add pikPos, pos
+      add pikPos, tree.child(pos, 1)
     of mnkPathArray:
       add pikIndex, tree.child(pos, 1)
     of mnkAlias:
@@ -200,7 +200,7 @@ proc compare*(body: MirTree, a, b: Path): CmpLocsResult =
         break
 
     of pikPos:
-      if na.position != nb.position:
+      if na.imm != nb.imm:
         overlaps = no
         break
 
diff --git a/compiler/sem/injectdestructors.nim b/compiler/sem/injectdestructors.nim
index 44793eaa12d..2edee0e4c2c 100644
--- a/compiler/sem/injectdestructors.nim
+++ b/compiler/sem/injectdestructors.nim
@@ -510,7 +510,6 @@ proc consumeArg(tree: MirTree, ctx: AnalyseCtx, ar: AnalysisResults,
   ## `expr` is the call, construction, or ``raise`` argument expression that
   ## the consume is part of; `src` is the consumed lvalue; and `pos` is the
   ## data-flow instruction correspondig to the consume operation.
-  assert tree[expr].kind in ExprKinds
   if isNamed(tree, src) and
      needsReset(tree, ctx.cfg, ar, computePath(tree, NodePosition src),
                 pos + 1):
@@ -575,9 +574,9 @@ proc lowerBranchSwitch(bu: var MirBuilder, body: MirTree, graph: ModuleGraph,
   assert body[stmt].kind == mnkSwitch
 
   let
-    target = body.operand(stmt, 0)
+    target = body.child(stmt, 0)
     objType = body[target].typ
-    field = lookupInType(env[objType], body[target].field.int)
+    field = lookupInType(env[objType], body.field(target).int)
     typ = env.types.add(field.typ)
 
   assert body[target].kind == mnkPathVariant
@@ -588,7 +587,7 @@ proc lowerBranchSwitch(bu: var MirBuilder, body: MirTree, graph: ModuleGraph,
   let
     a = bu.wrapMutAlias(typ):
       # bind the discriminator lvalue, not the variant lvalue
-      bu.subTree MirNode(kind: mnkPathNamed, typ: typ, field: body[target].field):
+      bu.pathNamed typ, body.field(target):
         bu.emitFrom(body, NodePosition body.operand(target))
     b = bu.wrapTemp typ:
       bu.emitFrom(body, body.child(stmt, 1))
@@ -629,7 +628,7 @@ proc lowerBranchSwitch(bu: var MirBuilder, body: MirTree, graph: ModuleGraph,
       bu.buildMagicCall mNot, BoolType:
          bu.emitByVal val
 
-    var src = body.child(NodePosition target, 0)
+    var src = body.child(target, 0)
     # skip all ``mnkPathVariant`` nodes:
     while body[src].kind == mnkPathVariant:
       src = body.child(src, 0)
@@ -638,9 +637,8 @@ proc lowerBranchSwitch(bu: var MirBuilder, body: MirTree, graph: ModuleGraph,
       # ``=destroy`` call:
       bu.buildVoidCall(env, branchDestructor):
         # pass the object access expression to the destroy call
-        bu.subTree mnkName:
-          bu.subTree MirNode(kind: mnkTag, effect: ekMutate):
-            bu.emitFrom(body, src)
+        bu.emitByName ekMutate:
+          bu.emitFrom(body, src)
 
   else:
     # the object doesn't need destruction, which means that neither does one
diff --git a/compiler/sem/mirexec.nim b/compiler/sem/mirexec.nim
index d18560af7e1..ff9e68f1b0a 100644
--- a/compiler/sem/mirexec.nim
+++ b/compiler/sem/mirexec.nim
@@ -246,16 +246,23 @@ func emitLvalueOp(env: var ClosureEnv, opc: DataFlowOpcode, tree: MirTree,
   emitForValue(env, tree, at, source)
   env.dfaOp(opc, tree, at, source)
 
+func emitForArg(env: var ClosureEnv, tree: MirTree, at, source: NodePosition) =
+  case tree[source].kind
+  of mnkArg:
+    emitLvalueOp(env, opUse, tree, at, tree.operand(source))
+  of mnkConsume:
+    emitLvalueOp(env, opConsume, tree, at, tree.operand(source))
+  of mnkName:
+    emitForValue(env, tree, at, tree.operand(source))
+  else:
+    unreachable(tree[source].kind)
+
 func emitForArgs(env: var ClosureEnv, tree: MirTree, at, source: NodePosition) =
   for it in subNodes(tree, source):
     case tree[it].kind
-    of mnkArg:
-      emitLvalueOp(env, opUse, tree, at, tree.operand(it))
-    of mnkConsume:
-      emitLvalueOp(env, opConsume, tree, at, tree.operand(it))
-    of mnkName:
-      emitForValue(env, tree, at, tree.skip(tree.operand(it), mnkTag))
-    of mnkField, mnkMagic, mnkProc, mnkLabel, mnkTargetList:
+    of mnkArg, mnkConsume, mnkName:
+      emitForArg(env, tree, at, it)
+    of mnkMagic, mnkProc, mnkLabel, mnkTargetList, mnkImmediate:
       discard
     else:
       emitLvalueOp(env, opUse, tree, at, OpValue it)
@@ -268,8 +275,11 @@ func emitForExpr(env: var ClosureEnv, tree: MirTree, at, source: NodePosition) =
 
   case tree[source].kind
   of mnkCall, mnkCheckedCall, mnkArrayConstr, mnkSeqConstr, mnkTupleConstr,
-     mnkClosureConstr, mnkObjConstr, mnkRefConstr:
+     mnkClosureConstr:
     emitForArgs(env, tree, at, source)
+  of mnkObjConstr, mnkRefConstr:
+    for it in subNodes(tree, source):
+      emitForArg(env, tree, at, tree.child(it, 1))
   of mnkSetConstr:
     for it in subNodes(tree, source):
       case tree[it].kind
@@ -333,25 +343,24 @@ func emitForExpr(env: var ClosureEnv, tree: MirTree, at, source: NodePosition) =
   case tree[source].kind
   of mnkCall, mnkCheckedCall:
     # lvalue effects:
-    for k, it in arguments(tree, source):
-      if tree[it].kind == mnkTag:
-        let opr = tree.operand(it)
-        case tree[it].effect
-        of ekMutate:     op opMutate, opr
-        of ekReassign:   op opDef, opr
-        of ekKill:       op opKill, opr
-        of ekInvalidate: op opInvalidate, opr
-      elif k == mnkName:
-        # the lvalue may be read from within the procedure
-        op opUse, it
+    for k, effect, it in arguments(tree, source):
+      case effect
+      of ekMutate:     op opMutate, it
+      of ekReassign:   op opDef, it
+      of ekKill:       op opKill, it
+      of ekInvalidate: op opInvalidate, it
+      of ekNone:
+        if k == mnkName:
+          # the lvalue may be read from within the procedure
+          op opUse, it
 
     # the potential mutation happens within the procedure, so the data-flow
     # operation has to come before the fork
-    if geMutateGlobal in tree[source].effects:
+    if tree.mutatesGlobal(source):
       env.instrs.add Instr(op: opMutateGlobal, node: at)
     if tree[source].kind == mnkCheckedCall:
       # the jump target description is in the last slot
-      raiseExit(env, opFork, tree, at, tree.previous(findEnd(tree, source)))
+      raiseExit(env, opFork, tree, at, tree.last(source))
   else:
     discard
 
diff --git a/compiler/vm/packed_env.nim b/compiler/vm/packed_env.nim
index a61045e3ce4..598d44bb76c 100644
--- a/compiler/vm/packed_env.nim
+++ b/compiler/vm/packed_env.nim
@@ -312,6 +312,7 @@ proc storeFieldsData(enc: var DataEncoder, e: var PackedEnv,
   # iterate over all fields in the construction and pack and store them:
   var n = n + 1
   for _ in 0..<count:
+    inc n # skip the binding node
     let s = lookupInType(typ, t[n].field.int) ## the field symbol
     inc n # move the cursor to the field's data
 
diff --git a/compiler/vm/vmserialize.nim b/compiler/vm/vmserialize.nim
index 7eaab915c4e..88f59328e39 100644
--- a/compiler/vm/vmserialize.nim
+++ b/compiler/vm/vmserialize.nim
@@ -49,13 +49,11 @@ proc initFromExpr(dest: LocHandle, tree: MirTree, n: var int, env: MirEnv,
   template arg(body: untyped) =
     inc n # skip the ``mnkArg`` node
     body
-    inc n # skip the end node
 
   template iterTree(name, body: untyped) =
     let len = next().len
     for name in 0..<len:
       body
-    inc n # skip the end node
 
   case dest.typ.kind
   of akInt:
@@ -108,7 +106,6 @@ proc initFromExpr(dest: LocHandle, tree: MirTree, n: var int, env: MirEnv,
           a = adjusted(env.getInt(next()), first)
           b = adjusted(env.getInt(next()), first)
         bitSetInclRange(mbitSet(dest), a .. b)
-        inc n # skip the end node
       else:
         bitSetIncl(mbitSet(dest), adjusted(env.getInt(node), first))
   of akPNode:
@@ -128,6 +125,7 @@ proc initFromExpr(dest: LocHandle, tree: MirTree, n: var int, env: MirEnv,
     of mnkObjConstr, mnkRefConstr:
       let typ = env[tree[n].typ].skipTypes(abstractPtrs) ## the object's type
       iterTree(i):
+        inc n # skip the binding node
         let
           sym = lookupInType(typ, next().field)
           field = dest.getFieldHandle(sym.position.FieldPosition)
diff --git a/doc/mir.rst b/doc/mir.rst
index 4b5fa82e18d..b34a8661273 100644
--- a/doc/mir.rst
+++ b/doc/mir.rst
@@ -68,35 +68,38 @@ Semantics
   CALL_ARG = Arg VALUE                    # pass-by-value argument
            | Arg <none>                   # argument that's going to be omitted
                                           # later
-           | Name LVALUE                  # pass-by-name argument where the
-                                          # lvalue is only used for reading
-           | Name (Tag <Effect> LVALUE)   # pass-by-name argument where the
-                                          # lvalue is used for mutation
+           | Name <Effect> LVALUE         # pass-by-name argument. The effect
+                                          # specifies the effect the call has
+                                          # on the value/location
            | Consume VALUE                # pass-by-value argument, but
                                           # the value is consumed (i.e., moved)
 
   CONSTR_ARG = Arg VALUE
              | Consume OPERAND
 
-  CALL_EXPR = Call <Proc> CALL_ARG ...   # a static call of the provided
-                                         # procedure with the given arguments
-            | Call LVALUE CALL_ARG ...   # indirect call
-            | Call <Magic> CALL_ARG ...  # a call of a magic procedure (i.e.,
-                                         # a procedure that is either going to
-                                         # be lowered into something else, or
-                                         # one for which the behaviour cannot
-                                         # be represented in the MIR)
+  CALL_EXPR = Call <Imm> <Proc> CALL_ARG ...  # a static call of the provided
+                                              # procedure with the given
+                                              # arguments
+            | Call <Imm> LVALUE CALL_ARG ...  # indirect call
+            | Call <Imm> <Magic> CALL_ARG ... # a call of a magic procedure
+                                              # (i.e., a procedure that is
+                                              # either going to be lowered into
+                                              # something else, or one for
+                                              # which the behaviour cannot
+                                              # be represented in the MIR)
 
   # checked calls have the same shape as normal calls. The difference
   # is that the call has an exceptional exit (i.e., it might raise an
   # exception)
-  CHECKED_CALL_EXPR = CheckedCall <Proc> CALL_ARG ...  EX_TARGET
-                    | CheckedCall LVALUE CALL_ARG ...  EX_TARGET
-                    | CheckedCall <Magic> CALL_ARG ... EX_TARGET
+  CHECKED_CALL_EXPR = CheckedCall <Imm> <Proc> CALL_ARG ...  EX_TARGET
+                    | CheckedCall <Imm> LVALUE CALL_ARG ...  EX_TARGET
+                    | CheckedCall <Imm> <Magic> CALL_ARG ... EX_TARGET
 
   SET_CONSTR_ARG = VALUE
                  | Range VALUE VALUE     # range construction
 
+  BINDING = Binding <Field> CONSTR_ARG
+
   RVALUE = UNARY_OP
          | BINARY_OP
          | CALL_EXPR
@@ -106,8 +109,8 @@ Semantics
          | SeqConstr CONSTR_ARG...
          | TupleConstr CONSTR_ARG...
          | ClosureConstr CONSTR_ARG...
-         | ObjConstr (<Field> CONSTR_ARG) ... # construct an `object`
-         | RefConstr (<Field> CONSTR_ARG) ... # construct a `ref object`
+         | ObjConstr BINDING ...         # construct an `object`
+         | RefConstr BINDING ...         # construct a `ref object`
          | StdConv  VALUE                # number conversion or conversion
                                          # between cstring and string
          | Conv     VALUE                # same as `StdConv`. Only duplicate
@@ -334,8 +337,6 @@ The MIR uses a tree-based representation similar to the AST. For easier
 processing and faster access, the whole code for a procedure is stored in a
 single sequence of *nodes*, with the nodes forming a tree.
 
-Sub-trees are currently delimited via an explicit `End` node.
-
 Constant Expressions
 ====================
 
@@ -359,10 +360,12 @@ ones).
   SET_CONSTR_ARG = <Literal>
                  | Range <Literal> <Literal>
 
+  BINDING = Binding <Field> ARG
+
   COMPLEX = SetConstr SET_CONSTR_ARG...
           | ArrayConstr ARG...
           | SeqConstr ARG...
           | TupleConstr ARG...
           | ClosureConstr ARG...
-          | ObjConstr (<Field> ARG)...
-          | RefConstr (<Field> ARG)...
+          | ObjConstr BINDING...
+          | RefConstr BINDING...
diff --git a/tests/compiler/tdatatables.nim b/tests/compiler/tdatatables.nim
index cf72a869da1..be442d547b6 100644
--- a/tests/compiler/tdatatables.nim
+++ b/tests/compiler/tdatatables.nim
@@ -40,41 +40,41 @@ block tree_equality:
     @[node(mnkFloatLit, t2, number, NumberId 0)],
 
     # --- ordered aggregates
-    @[node(mnkTupleConstr, t1, len, 0), node(mnkEnd)],
-    @[node(mnkTupleConstr, t2, len, 0), node(mnkEnd)],
+    @[node(mnkTupleConstr, t1, len, 0)],
+    @[node(mnkTupleConstr, t2, len, 0)],
     @[node(mnkTupleConstr, t1, len, 1),
-        node(mnkArg), literal(NumberId 0),
-      node(mnkEnd)],
+        node(mnkArg), literal(NumberId 0)],
     @[node(mnkTupleConstr, t1, len, 2),
-        node(mnkArg), literal(NumberId 0), node(mnkEnd),
-        node(mnkArg), literal(NumberId 0), node(mnkEnd),
-      node(mnkEnd)],
+        node(mnkArg), literal(NumberId 0),
+        node(mnkArg), literal(NumberId 0)],
 
     # --- aggregates with fields
-    @[node(mnkObjConstr, t1, len, 0), node(mnkEnd)],
-    @[node(mnkObjConstr, t2, len, 0), node(mnkEnd)],
+    @[node(mnkObjConstr, t1, len, 0)],
+    @[node(mnkObjConstr, t2, len, 0)],
     @[node(mnkObjConstr, t1, len, 1),
-        node(mnkField, field, 0),
-        node(mnkArg), literal(NumberId 0), node(mnkEnd),
-      node(mnkEnd)],
+        node(mnkBinding),
+          node(mnkField, field, 0),
+          node(mnkArg), literal(NumberId 0)],
     # same field value, different field:
     @[node(mnkObjConstr, t1, len, 1),
-        node(mnkField, field, 1),
-        node(mnkArg), literal(NumberId 0), node(mnkEnd),
-      node(mnkEnd)],
+        node(mnkBinding),
+          node(mnkField, field, 1),
+          node(mnkArg), literal(NumberId 0)],
     @[node(mnkObjConstr, t1, len, 1),
-        node(mnkField, field, 0),
-        node(mnkArg), literal(NumberId 0), node(mnkEnd),
-        node(mnkField, field, 1),
-        node(mnkArg), literal(NumberId 0), node(mnkEnd),
-      node(mnkEnd)],
+        node(mnkBinding),
+          node(mnkField, field, 0),
+          node(mnkArg), literal(NumberId 0),
+        node(mnkBinding),
+          node(mnkField, field, 1),
+          node(mnkArg), literal(NumberId 0)],
     # swapped fields
     @[node(mnkObjConstr, t1, len, 1),
-        node(mnkField, field, 1),
-        node(mnkArg), literal(NumberId 0), node(mnkEnd),
-        node(mnkField, field, 0),
-        node(mnkArg), literal(NumberId 0), node(mnkEnd),
-      node(mnkEnd)]
+        node(mnkBinding),
+          node(mnkField, field, 1),
+          node(mnkArg), literal(NumberId 0),
+        node(mnkBinding),
+          node(mnkField, field, 0),
+          node(mnkArg), literal(NumberId 0)]
   ]
 
   # compare all trees with each other
diff --git a/tests/compiler/tmir_trees.nim b/tests/compiler/tmir_trees.nim
index 3b91e176ad5..a77ccd80941 100644
--- a/tests/compiler/tmir_trees.nim
+++ b/tests/compiler/tmir_trees.nim
@@ -6,5 +6,5 @@ discard """
 import compiler/mir/mirtrees
 
 block last_sibling:
-  let tree = @[MirNode(kind: mnkScope), MirNode(kind: mnkEnd)]
+  let tree = @[MirNode(kind: mnkScope)]
   doAssert sibling(tree, NodePosition 0) == NodePosition(tree.len)
diff --git a/tests/compiler/ttreechangesets.nim b/tests/compiler/ttreechangesets.nim
index 7889270e112..d07f66a31b0 100644
--- a/tests/compiler/ttreechangesets.nim
+++ b/tests/compiler/ttreechangesets.nim
@@ -142,16 +142,16 @@ block insert_shared_end:
 
   test(tree, [temp(0), temp(1), temp(2), temp(3)]):
     c.replace 1, temp(1)
-    c.insert  3, temp(2)
+    c.insert  2, temp(2)
 
   test(tree, [temp(0), temp(1), temp(2), temp(3)]):
-    c.insert  3, temp(2)
+    c.insert  2, temp(2)
     c.replace 1, temp(1)
 
   test(tree, [temp(0), temp(2), temp(3)]):
     c.remove 1
-    c.insert 3, temp(2)
+    c.insert 2, temp(2)
 
   test(tree, [temp(0), temp(2), temp(3)]):
-    c.insert 3, temp(2)
+    c.insert 2, temp(2)
     c.remove 1
\ No newline at end of file

From 158b7c306f75ce471b97b84ab3b8cee4020da8f4 Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Tue, 11 Jun 2024 00:27:50 +0000
Subject: [PATCH 120/169] build(deps): Bump dawidd6/action-download-artifact
 from 4 to 5 (#1344)

Bumps

[dawidd6/action-download-artifact](https://github.com/dawidd6/action-download-artifact)
from 4 to 5.
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a

href="https://github.com/dawidd6/action-download-artifact/releases">dawidd6/action-download-artifact's
releases</a>.</em></p>
<blockquote>
<h2>v5</h2>
<p><strong>Full Changelog</strong>: <a

href="https://github.com/dawidd6/action-download-artifact/compare/v4...v5">https://github.com/dawidd6/action-download-artifact/compare/v4...v5</a></p>
</blockquote>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a

href="https://github.com/dawidd6/action-download-artifact/commit/deb3bb83256a78589fef6a7b942e5f2573ad7c13"><code>deb3bb8</code></a>
node_modules: upgrade</li>
<li><a

href="https://github.com/dawidd6/action-download-artifact/commit/1d93f37db2a8005b41437c75a4793d52e664d858"><code>1d93f37</code></a>
README: v4</li>
<li>See full diff in <a

href="https://github.com/dawidd6/action-download-artifact/compare/v4...v5">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility

score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=dawidd6/action-download-artifact&package-manager=github_actions&previous-version=4&new-version=5)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase` .

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 .github/workflows/publisher.yml | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/.github/workflows/publisher.yml b/.github/workflows/publisher.yml
index 2cefb2699d7..a5ad4533b79 100644
--- a/.github/workflows/publisher.yml
+++ b/.github/workflows/publisher.yml
@@ -30,7 +30,7 @@ jobs:
 
       # Download the latest instance of artifacts from a build done previously
       - name: Download generated docs
-        uses: dawidd6/action-download-artifact@v4
+        uses: dawidd6/action-download-artifact@v5
         with:
           workflow: ci.yml
           workflow_conclusion: success
@@ -40,7 +40,7 @@ jobs:
           path: doc/html
 
       - name: Download generated source archive
-        uses: dawidd6/action-download-artifact@v4
+        uses: dawidd6/action-download-artifact@v5
         with:
           workflow: ci.yml
           workflow_conclusion: success
@@ -50,7 +50,7 @@ jobs:
           path: release-staging
 
       - name: Download generated release binaries
-        uses: dawidd6/action-download-artifact@v4
+        uses: dawidd6/action-download-artifact@v5
         with:
           workflow: ci.yml
           workflow_conclusion: success
@@ -61,7 +61,7 @@ jobs:
           path: release-staging
 
       - name: Download release manifest tool
-        uses: dawidd6/action-download-artifact@v4
+        uses: dawidd6/action-download-artifact@v5
         with:
           workflow: ci.yml
           workflow_conclusion: success

From 8d1dcd082039a596aa7fa5d6ace79488f2ec2f22 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Fri, 14 Jun 2024 22:58:19 +0200
Subject: [PATCH 121/169] macros: keep instantiation parameters with `getType`
 (#1346)

## Summary

`getType` now keeps instantiation parameters, which were previously
irrecoverably lost. This also allows retrieving the instantiation
parameters when only having access to an alias of the instantiated
type.

Fixes #1223.

## Details

Expanding `tyGenericInst` to `(BracketExpr <Callee> ...)` is the only
way of keeping the type information intact, since `tyGenericInst` types
do not have symbols attached to them (if they did, translating to an
`nnkSym` would be preferable, as it'd keep the AST flat).

Existing tests are adjusted.

### Aliases

A second goal of changing `getType` behaviour for `tyGenericInst` is to
allow retrieving the instantiation parameters in the presence of
type aliases. Given:
```nim
type
  Generic[A, B] = object
  Alias = Generic[int, string]
```

it was previously not possible to retrieve the instantiation
parameters for `Generic[int, string]` when given the expression
`Alias`, but now it is (with `getType`).

### Other

The internal `enumutils.enumFullRange` macro relied on the old
`getType` behaviour. To restore its functionality, it now uses
`getTypeImpl`.
---
 compiler/vm/vmdeps.nim                   | 16 ++++++----------
 lib/std/enumutils.nim                    |  3 ++-
 tests/lang_callable/macros/tgettype2.nim |  8 ++++----
 tests/lang_callable/macros/tgettype3.nim |  4 ++++
 4 files changed, 16 insertions(+), 15 deletions(-)

diff --git a/compiler/vm/vmdeps.nim b/compiler/vm/vmdeps.nim
index 95318902f0d..edda5e38443 100644
--- a/compiler/vm/vmdeps.nim
+++ b/compiler/vm/vmdeps.nim
@@ -159,17 +159,13 @@ proc mapTypeToAstX(cache: IdentCache; t: PType; info: TLineInfo;
     for i in 0..<t.len:
       result.add mapTypeToAst(t[i], info)
   of tyGenericInst:
-    if inst:
-      if allowRecursion:
-        result = mapTypeToAstR(t.lastSon, info)
-      else:
-        result = newNodeX(nkBracketExpr)
-        #result.add mapTypeToAst(t.lastSon, info)
-        result.add mapTypeToAst(t[0], info)
-        for i in 1..<t.len-1:
-          result.add mapTypeToAst(t[i], info)
+    if inst and allowRecursion:
+      result = mapTypeToAstR(t.lastSon, info)
     else:
-      result = mapTypeToAstX(cache, t.lastSon, info, idgen, inst, allowRecursion)
+      result = newNodeX(nkBracketExpr)
+      result.add mapTypeToAst(t[0], info)
+      for i in 1..<t.len-1:
+        result.add mapTypeToAst(t[i], info)
   of tyGenericBody:
     if inst:
       result = mapTypeToAstR(t.lastSon, info)
diff --git a/lib/std/enumutils.nim b/lib/std/enumutils.nim
index 62bf30b3657..56db2d5fee3 100644
--- a/lib/std/enumutils.nim
+++ b/lib/std/enumutils.nim
@@ -11,7 +11,8 @@ import std/macros
 from std/typetraits import OrdinalEnum, HoleyEnum
 
 macro enumFullRange(a: typed): untyped =
-  newNimNode(nnkCurly).add(a.getType[1][1..^1])
+  let typ = getTypeImpl(getType(a)[1]) # the ``nnkEnumTy`` AST
+  newNimNode(nnkCurly).add(typ[1..^1])
 
 # xxx `genEnumCaseStmt` needs tests and runnableExamples
 
diff --git a/tests/lang_callable/macros/tgettype2.nim b/tests/lang_callable/macros/tgettype2.nim
index c579cf6ff42..8cb608b5093 100644
--- a/tests/lang_callable/macros/tgettype2.nim
+++ b/tests/lang_callable/macros/tgettype2.nim
@@ -11,8 +11,8 @@ gt(bar):	distinct[int]
 gt(baz):	int, int
 gt(v):	seq[int]
 gt(vv):	seq[float]
-gt(t):	distinct[tuple[int, int]]
-gt(tt):	distinct[tuple[float, float]]
+gt(t):	MyType[int]
+gt(tt):	MyType[float]
 gt(s):	distinct[tuple[int, int]]
 #############
 #### gt2 ####
@@ -70,8 +70,8 @@ echo gt(baz) # int, int          I would prefer Baz, int
 
 echo gt(v)   # seq[int], ok
 echo gt(vv)  # seq[float], ok
-echo gt(t)   # MyType, distinct[tuple[int, int]]      I would prefer MyType[int],   distinct[tuple[int, int]]
-echo gt(tt)  # MyType, distinct[tuple[float, float]]  I would prefer MyType[float], distinct[tuple[int, int]]
+echo gt(t)   # MyType[int], ok
+echo gt(tt)  # MyType[float], ok
 echo gt(s)   # distinct[tuple[int, int]]              I would prefer MySimpleType, distinct[tuple[int,int]]
 
 echo "#############"
diff --git a/tests/lang_callable/macros/tgettype3.nim b/tests/lang_callable/macros/tgettype3.nim
index 786d09d8bed..5a4372f97ae 100644
--- a/tests/lang_callable/macros/tgettype3.nim
+++ b/tests/lang_callable/macros/tgettype3.nim
@@ -27,6 +27,10 @@ proc getTypeName(t: NimNode, skipVar = false): string =
             result = "vec4"
         elif $(t[0]) == "distinct":
             result = getTypeName(t[1], skipVar)
+        # --------- not part of the original test case
+        elif $(t[0]) == "vecBase":
+            result = "vec2"
+        # ---------
     of nnkSym:
         case $t
         of "vecBase": result = getTypeName(getType(t), skipVar)

From e3f9a33dfdab0a0366f6047f815be9fe261d04d3 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sat, 15 Jun 2024 23:38:49 +0200
Subject: [PATCH 122/169] typetraits: improve `genericParams` (#1347)

## Summary

The `genericParams` typetrait now also supports `ref`, `var`, `ptr`,
and `range`. In addition, it's fully based on type information, making
it work regardless of what expression is used as the argument. For
`array` types, the index type is now *always* a `range` type, so this
is a **breaking change**.

## Details

The main goal is removing the mixed analysis from `genericParams`,
where both type and normal AST were inspected. Besides only working for
some type expressions, this also relied on `sem` modifying the input
AST nodes' types in type AST, making the macro susceptible to breaking
when analysis of type AST changes in `sem`.

To make the implementation not rely on `sem` implementation details,
`genericParams` now only uses the macro type API, also removing the
need for an intermediate macro.

The syntax convenience of specifying an array's index type with a
single integer value does not exist at the type level, and a
`StaticParam[x]` is therefore not returned for `array` types anymore.
---
 lib/pure/typetraits.nim                     | 96 ++++++++-------------
 tests/lang_objects/metatype/ttypetraits.nim | 11 ++-
 2 files changed, 46 insertions(+), 61 deletions(-)

diff --git a/lib/pure/typetraits.nim b/lib/pure/typetraits.nim
index 9b3877decfd..d8b93b49d97 100644
--- a/lib/pure/typetraits.nim
+++ b/lib/pure/typetraits.nim
@@ -236,66 +236,12 @@ macro enumLen*(T: typedesc[enum]): int =
   expectKind(enumTy, nnkEnumTy)
   result = newLit(enumTy.len - 1)
 
-macro genericParamsImpl(T: typedesc): untyped =
-  # auxiliary macro needed, can't do it directly in `genericParams`
-  result = newNimNode(nnkTupleConstr)
-  var impl = getTypeImpl(T)
-  expectKind(impl, nnkBracketExpr)
-  impl = impl[1]
-  while true:
-    case impl.kind
-    of nnkSym:
-      impl = impl.getImpl
-    of nnkTypeDef:
-      impl = impl[2]
-    of nnkTypeOfExpr:
-      impl = getTypeInst(impl[0])
-    of nnkBracketExpr:
-      for i in 1..<impl.len:
-        let ai = impl[i]
-        var ret: NimNode = nil
-        case ai.typeKind
-        of ntyTypeDesc:
-          ret = ai
-        of ntyStatic: doAssert false
-        else:
-          # getType from a resolved symbol might return a typedesc symbol.
-          # If so, use it directly instead of wrapping it in StaticParam.
-          if (ai.kind == nnkSym and ai.symKind == nskType) or
-              (ai.kind == nnkBracketExpr and ai[0].kind == nnkSym and
-              ai[0].symKind == nskType) or ai.kind in {nnkRefTy, nnkVarTy, nnkPtrTy, nnkProcTy}:
-            ret = ai
-          elif ai.kind == nnkInfix and ai[0].kind == nnkIdent and
-                ai[0].strVal == "..":
-            # For built-in array types, the "2" is translated to "0..1" then
-            # automagically translated to "range[0..1]". However this is not
-            # reflected in the AST, thus requiring manual transformation here.
-            #
-            # We will also be losing some context here:
-            #   var a: array[10, int]
-            # will be translated to:
-            #   var a: array[0..9, int]
-            # after typecheck. This means that we can't get the exact
-            # definition as typed by the user, which will cause confusion for
-            # users expecting:
-            #   genericParams(typeof(a)) is (StaticParam(10), int)
-            # to be true while in fact the result will be:
-            #   genericParams(typeof(a)) is (range[0..9], int)
-            ret = newTree(nnkBracketExpr, @[bindSym"range", ai])
-          else:
-            since (1, 1):
-              ret = newTree(nnkBracketExpr, @[bindSym"StaticParam", ai])
-        result.add ret
-      break
-    else:
-      error "wrong kind: " & $impl.kind, impl
-
 since (1, 1):
-  template genericParams*(T: typedesc): untyped =
+  macro genericParams*(T: typedesc): untyped =
     ## Returns the tuple of generic parameters for the generic type `T`.
     ##
     ## **Note:** For the builtin array type, the index generic parameter will
-    ## **always** become a range type after it's bound to a variable.
+    ## **always** become a range type.
     runnableExamples:
       type Foo[T1, T2] = object
 
@@ -309,13 +255,43 @@ since (1, 1):
       var s: seq[Bar[3.0, string]]
       doAssert genericParams(typeof(s)) is (Bar[3.0, string],)
 
-      doAssert genericParams(array[10, int]) is (StaticParam[10], int)
+      doAssert genericParams(array[10, int]) is (range[0..9], int)
       var a: array[10, int]
       doAssert genericParams(typeof(a)) is (range[0..9], int)
 
-    type T2 = T
-    genericParamsImpl(T2)
-
+    let desc = getTypeInst(T)
+    expectKind(desc, nnkBracketExpr)
+    let typ = getType(desc[1]) # skip aliases
+
+    result = newNimNode(nnkTupleConstr)
+    case typ.typeKind
+    of ntyGenericInst:
+      # fetch all instantiation parameters
+      for i in 1..<typ.len:
+        let op = getTypeInst(typ[i])
+        # ``getTypeInst`` loses the staticness, so `typ` has to be queried
+        # instead
+        if typ[i].typeKind == ntyStatic:
+          result.add nnkBracketExpr.newTree(bindSym"StaticParam", op)
+        else:
+          result.add op
+    of ntyPtr, ntyRef, ntyVar, ntySequence, ntyOpenArray, ntyVarargs, ntySet,
+       ntyUncheckedArray:
+      result.add typ[1]
+    of ntyRange:
+      result.add nnkBracketExpr.newTree(bindSym"StaticParam", typ[1])
+      result.add nnkBracketExpr.newTree(bindSym"StaticParam", typ[2])
+    of ntyArray:
+      var len = getTypeInst(typ[1])
+      if len.kind == nnkInfix:
+        # create a proper range type constructor
+        len = nnkBracketExpr.newTree(bindSym"range", len)
+
+      result = nnkTupleConstr.newTree(
+        len,
+        typ[2])
+    else:
+      error("not an instantiated generic type", T)
 
 proc hasClosureImpl(n: NimNode): bool = discard "see compiler/vmops.nim"
 
diff --git a/tests/lang_objects/metatype/ttypetraits.nim b/tests/lang_objects/metatype/ttypetraits.nim
index 631615dd5a9..c4b24957b1a 100644
--- a/tests/lang_objects/metatype/ttypetraits.nim
+++ b/tests/lang_objects/metatype/ttypetraits.nim
@@ -245,9 +245,18 @@ block genericParams:
 
   block nestedContainers:
     doAssert genericParams(seq[Foo[string, float]]).get(0) is Foo[string, float]
-    doAssert genericParams(array[10, Foo[Bar[1, int], Bar[2, float]]]) is (StaticParam[10], Foo[Bar[1, int], Bar[2, float]])
+    doAssert genericParams(array[10, Foo[Bar[1, int], Bar[2, float]]]) is (range[0..9], Foo[Bar[1, int], Bar[2, float]])
     doAssert genericParams(array[1..9, int]) is (range[1..9], int)
 
+  doAssert genericParams(var int) is (int,)
+  doAssert genericParams(ptr int) is (int,)
+  doAssert genericParams(ref int) is (int,)
+  doAssert genericParams(set[int16]) is (int16,)
+  doAssert genericParams(openArray[int]) is (int,)
+  doAssert genericParams(varargs[int]) is (int,)
+  doAssert genericParams(UncheckedArray[int]) is (int,)
+  doAssert genericParams(range[1 .. 2]) is (StaticParam[1], StaticParam[2])
+
 ##############################################
 # bug 13095
 

From da65fbf89fc5cd822e78acdf1f70f303f686d3f9 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sun, 16 Jun 2024 20:17:01 +0200
Subject: [PATCH 123/169] sem: don't analyze dependent operands to `static`
 (#1345)

## Summary

Makes instantiations such as `Generic[someProc(T)]` work, where
`T` is some generic parameter (and the receiving type parameter is a
`static` one) -- the `someProc(T)` expression is typed once `T` is
substituted, making the behaviour consistent with `array` and `range`.

## Details

Fully analyzing (i.e., with `semExpr`) arbitrary expressions that might
reference unresolved type variables generally doesn't work. Operands to
generic invocations were eagerly analyzed (in `matchesAux`), usually
resulting in errors when the operand needs to be a `static` value.

Disallowing expressions dependent on unresolved type variables in this
context would be a regression, since some expressions are special-cased
to work (such as `sizeof(T)`).

To address the problem, before typing the operand, it's first checked
whether it depends on unresolved type variables. If it does, the
expression is treated as a generic expression, with a `tyFromExpr`
assigned as its type -- otherwise it's analyzed as usual.

If the operand has an unknown type (`tyFromExpr`), it's wrapped in a
conversion to a type derived from the generic parameter's constraint,
to make sure the operand is typed later. If no concrete type can be
derived from the constraint, a type mismatch is reported.

To not convolute `matchesAux` further, the argument matching where the
callee is a `tyGenericBody` is moved into the new `matchesType`. It
does largely the same as `matchesAux`, but with everything not
applicable to types removed (such as the varargs handling).

---------

Co-authored-by: Saem Ghani <saemghani+github@gmail.com>
---
 compiler/sem/sem.nim                          |   1 +
 compiler/sem/semdata.nim                      |   3 +
 compiler/sem/semtypes.nim                     |   7 +
 compiler/sem/sigmatch.nim                     | 126 +++++++++++++++++-
 .../tdependent_operands_to_static.nim         |  27 ++++
 .../tdependent_operands_to_static_2.nim       |  21 +++
 6 files changed, 184 insertions(+), 1 deletion(-)
 create mode 100644 tests/lang_callable/generics/tdependent_operands_to_static.nim
 create mode 100644 tests/lang_callable/generics/tdependent_operands_to_static_2.nim

diff --git a/compiler/sem/sem.nim b/compiler/sem/sem.nim
index 4a3d75c9cf8..dae720efd1f 100644
--- a/compiler/sem/sem.nim
+++ b/compiler/sem/sem.nim
@@ -914,6 +914,7 @@ proc myOpen(graph: ModuleGraph; module: PSym;
   c.semTypeNode = semTypeNode
   c.instTypeBoundOp = sigmatch.instTypeBoundOp
   c.hasUnresolvedArgs = hasUnresolvedArgs
+  c.semGenericExpr = semGenericExpr
   c.templInstCounter = new int
 
   pushProcCon(c, module)
diff --git a/compiler/sem/semdata.nim b/compiler/sem/semdata.nim
index 184edbe0536..5a08d14e770 100644
--- a/compiler/sem/semdata.nim
+++ b/compiler/sem/semdata.nim
@@ -637,6 +637,9 @@ type
                             op: TTypeAttachedOp; col: int): PSym {.nimcall.}
       ## read to break cyclic dependencies, init in sem during module open and
       ## read in liftdestructors and semtypinst
+    semGenericExpr*: proc (c: PContext, n: PNode): PNode {.nimcall.}
+      ## read to break cyclic dependencies, init in sem during module open and
+      ## read in sigmatch
     # -------------------------------------------------------------------------
     # end: not entirely clear why, function pionters for certain sem calls?
     # -------------------------------------------------------------------------
diff --git a/compiler/sem/semtypes.nim b/compiler/sem/semtypes.nim
index ac82a2dc5b5..22408dffdf2 100644
--- a/compiler/sem/semtypes.nim
+++ b/compiler/sem/semtypes.nim
@@ -1696,6 +1696,13 @@ proc semStmtListType(c: PContext, n: PNode, prev: PType): PType =
   else:
     result = nil
 
+proc semGenericExpr(c: PContext, n: PNode): PNode =
+  ## Runs the generic pre-pass on `n` and returns the result. Similar to
+  ## ``semGenericStmt``, but makes sure that all generic parameter symbols
+  ## were bound.
+  result = semGenericStmt(c, n)
+  discard fixupTypeVars(c, result)
+
 proc semGenericParamInInvocation(c: PContext, n: PNode): PType =
   result = semTypeNode(c, n, nil)
   n.typ = makeTypeDesc(c, result)
diff --git a/compiler/sem/sigmatch.nim b/compiler/sem/sigmatch.nim
index 0669d5c492b..faf78bb9d6d 100644
--- a/compiler/sem/sigmatch.nim
+++ b/compiler/sem/sigmatch.nim
@@ -3120,6 +3120,127 @@ proc matchesAux(c: PContext, n, nOrig: PNode, m: var TCandidate, marker: var Int
   m.error.firstMismatch.pos = a
   m.error.firstMismatch.formal = formal
 
+proc matchesType(c: PContext, n: PNode, m: var TCandidate,
+                 marker: var IntSet) =
+  ## Matches the arguments taken from invocation expression `n` against the
+  ## ``tyGenericBody`` callee and fills `m` with the results. `marker` is
+  ## updated with the matched-against formal positions.
+  m.state = csMatch # until proven otherwise
+  m.error.firstMismatch = MismatchInfo()
+
+  # pre-pass: make sure the AST is valid. `n` is production AST, so it can be
+  # modified in-place
+  var hasError = false
+  for i in 1..<n.len:
+    if n[i].kind == nkExprEqExpr:
+      let (ident, err) = considerQuotedIdent(c, n[i][0])
+      if err != nil:
+        n[i][0] = err
+        hasError = true
+      else:
+        n[i][0] = newIdentNode(ident, n[i][0].info)
+
+  if hasError:
+    # abort early
+    m.state = csNoMatch
+    m.call = c.config.wrapError(n)
+    return
+
+  m.call = newNodeI(n.kind, n.info, m.callee.len)
+  m.call[0] = n[0]
+
+  var f = 0
+  var i = 1
+  var formal: PSym
+
+  while i < n.len:
+    # select the formal parameter:
+    var operand: PNode
+    case n[i].kind
+    of nkExprEqExpr:
+      # explicit parameter
+      formal = getNamedParamFromList(m.callee.n, n[i][0].ident)
+      if formal.isNil:
+        m.error.firstMismatch.kind = kUnknownNamedParam
+        break
+
+      operand = n[i][1]
+    elif f < m.callee.n.len:
+      # implicit parameter
+      formal = m.callee.n[f].sym
+      operand = n[i]
+    else:
+      m.error.firstMismatch.kind = kExtraArg
+      break
+
+    if containsOrIncl(marker, formal.position):
+      m.error.firstMismatch.kind = kAlreadyGiven
+      break
+
+    # reset the per-parameter state:
+    m.typedescMatched = false
+
+    m.error.firstMismatch.kind = kTypeMismatch
+
+    # match the argument against the formal type:
+    var arg: PNode
+
+    if (tfHasStatic in formal.typ.skipTypes({tyDistinct}).flags or
+        formal.typ.kind == tyStatic) and c.hasUnresolvedArgs(c, operand):
+      # the expression depends on not-yet resolved generic parameters,
+      # ``semOperand`` won't work
+      operand = c.semGenericExpr(c, operand)
+      if operand.kind == nkError or operand.typ != nil:
+        arg = paramTypesMatch(m, formal.typ, operand.typ, operand)
+      elif formal.typ.kind == tyStatic:
+        # some expression that's more complex than just being a generic
+        # parameter symbol
+        if formal.typ.base.kind == tyNone:
+          # no constraints
+          arg = copyNodeWithKids(operand)
+          arg.typ = makeTypeFromExpr(c, operand)
+        else:
+          # the static is constrained. We don't know the argument's type yet,
+          # so we cannot know up-front whether the expression will fit once
+          # all type variables it depends on are resolved
+          # XXX: to support this at least somewhat, the argument is wrapped
+          #      in a conversion to the expected type. If the types are
+          #      wholly incompatible, later analysis of the conversion will
+          #      yield an error. Non-exact matches where the types have a
+          #      "convertible" relationship will not result in an error
+          arg = newTreeI(nkConv, operand.info,
+                         newNodeIT(nkType, operand.info, formal.typ.base),
+                         operand)
+          arg.typ = makeTypeFromExpr(c, copyNodeWithKids(arg))
+      else:
+        # we don't know the argument's type, nor can we enforce that it'll
+        # match the formal type later -> type mismatch
+        m.call[formal.position + 1] = copyNodeWithKids(operand)
+        m.call[formal.position + 1].typ = makeTypeFromExpr(c, operand)
+        break
+    else:
+      operand = m.c.semOperand(m.c, operand)
+      arg = paramTypesMatch(m, formal.typ, operand.typ, operand)
+
+    if arg != nil:
+      # errors don't need to be considered here; they're handled through
+      # `fauxMatch`
+      m.call[formal.position + 1] = arg
+    else:
+      # legacy error handling
+      m.call[formal.position + 1] = operand
+      break
+
+    f = max(formal.position + 1, f + 1)
+    inc i
+
+  if i < n.len:
+    # an error occurred
+    m.state = csNoMatch
+    m.error.firstMismatch.pos = i
+    m.error.firstMismatch.arg = n[i]
+    m.error.firstMismatch.formal = formal
+
 proc semFinishOperands*(c: PContext, n: PNode) =
   # this needs to be called to ensure that after overloading resolution every
   # argument has been sem'checked:
@@ -3155,7 +3276,10 @@ proc matches*(c: PContext, n, nOrig: PNode, m: var TCandidate) =
     return
   
   var marker = initIntSet()
-  matchesAux(c, n, nOrig, m, marker)
+  if m.callee.kind == tyGenericBody:
+    matchesType(c, n, m, marker)
+  else:
+    matchesAux(c, n, nOrig, m, marker)
 
   if m.state == csNoMatch:
     return
diff --git a/tests/lang_callable/generics/tdependent_operands_to_static.nim b/tests/lang_callable/generics/tdependent_operands_to_static.nim
new file mode 100644
index 00000000000..0c8de08e2b6
--- /dev/null
+++ b/tests/lang_callable/generics/tdependent_operands_to_static.nim
@@ -0,0 +1,27 @@
+discard """
+  description: '''
+    Various tests for operands to `static` constrained generic type parameters
+    where the operand's type depends on unresolved type variables.
+  '''
+"""
+
+type
+  Type1[T: static] = object ## only must be *some* static value
+  Type2[T: static int] = object ## must be a static int
+
+proc eval[T](x: T): T {.compileTime.} =
+  x
+
+proc p1[T](): Type1[eval(default(T))] = discard
+proc p2[T](): Type2[eval(default(T))] = discard
+# ^^ whether the ``Type2`` can be instantiated depends on the later
+# supplied `T`
+
+discard p1[int]()    # works
+discard p1[float]()  # works
+discard p1[string]() # works
+
+discard p2[int]()    # int is convertible to int -> works
+discard p2[float]()  # float is convertible to int -> works
+# string is not convertible to int -> instantiating ``Type2`` fails:
+doAssert not compiles(p2[string]())
diff --git a/tests/lang_callable/generics/tdependent_operands_to_static_2.nim b/tests/lang_callable/generics/tdependent_operands_to_static_2.nim
new file mode 100644
index 00000000000..9ef469e2061
--- /dev/null
+++ b/tests/lang_callable/generics/tdependent_operands_to_static_2.nim
@@ -0,0 +1,21 @@
+discard """
+  description: '''
+    Operands with a type not known upfront cannot be used as arguments to
+    complex static
+  '''
+  errormsg: "cannot instantiate Type"
+  line: 21
+  knownIssue: '''
+    `Type`s generic parameter is not detected as containing a `static`, thus
+    full analysis is not disabled (which subsequently fails)
+  '''
+"""
+
+type
+  Type[T: string | static float] = object ## must be a string or static float
+
+proc eval[T](x: T): T {.compileTime.} = x
+
+# the operand's type is not known and no concrete type can be derived from
+# the constraint -> reject early
+proc p[T](): Type[eval(default(T))] = discard

From a13f09b0853a1c4e09ebdb7cbd93b10cbff4ed8c Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Tue, 18 Jun 2024 04:29:17 +0000
Subject: [PATCH 124/169] build(deps): Bump dawidd6/action-download-artifact
 from 5 to 6 (#1348)

Bumps

[dawidd6/action-download-artifact](https://github.com/dawidd6/action-download-artifact)
from 5 to 6.
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a

href="https://github.com/dawidd6/action-download-artifact/releases">dawidd6/action-download-artifact's
releases</a>.</em></p>
<blockquote>
<h2>v6</h2>
<p><strong>Full Changelog</strong>: <a

href="https://github.com/dawidd6/action-download-artifact/compare/v5...v6">https://github.com/dawidd6/action-download-artifact/compare/v5...v6</a></p>
</blockquote>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a

href="https://github.com/dawidd6/action-download-artifact/commit/bf251b5aa9c2f7eeb574a96ee720e24f801b7c11"><code>bf251b5</code></a>
node_modules: upgrade</li>
<li><a

href="https://github.com/dawidd6/action-download-artifact/commit/93c629661111aae296c04004b30ae3ba22ed46f3"><code>93c6296</code></a>
README: v5</li>
<li>See full diff in <a

href="https://github.com/dawidd6/action-download-artifact/compare/v5...v6">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility

score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=dawidd6/action-download-artifact&package-manager=github_actions&previous-version=5&new-version=6)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase` .

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 .github/workflows/publisher.yml | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/.github/workflows/publisher.yml b/.github/workflows/publisher.yml
index a5ad4533b79..61479c52ce0 100644
--- a/.github/workflows/publisher.yml
+++ b/.github/workflows/publisher.yml
@@ -30,7 +30,7 @@ jobs:
 
       # Download the latest instance of artifacts from a build done previously
       - name: Download generated docs
-        uses: dawidd6/action-download-artifact@v5
+        uses: dawidd6/action-download-artifact@v6
         with:
           workflow: ci.yml
           workflow_conclusion: success
@@ -40,7 +40,7 @@ jobs:
           path: doc/html
 
       - name: Download generated source archive
-        uses: dawidd6/action-download-artifact@v5
+        uses: dawidd6/action-download-artifact@v6
         with:
           workflow: ci.yml
           workflow_conclusion: success
@@ -50,7 +50,7 @@ jobs:
           path: release-staging
 
       - name: Download generated release binaries
-        uses: dawidd6/action-download-artifact@v5
+        uses: dawidd6/action-download-artifact@v6
         with:
           workflow: ci.yml
           workflow_conclusion: success
@@ -61,7 +61,7 @@ jobs:
           path: release-staging
 
       - name: Download release manifest tool
-        uses: dawidd6/action-download-artifact@v5
+        uses: dawidd6/action-download-artifact@v6
         with:
           workflow: ci.yml
           workflow_conclusion: success

From cdcf8f7c4608e67d638eb5411a3ea17fc331b943 Mon Sep 17 00:00:00 2001
From: alaviss <leorize+oss@disroot.org>
Date: Tue, 18 Jun 2024 15:24:22 -0500
Subject: [PATCH 125/169] openssl: support OpenSSL 3.0 and above (#1349)

## Summary
The only ABI change between version 1.1.1 and 3.0 for our usage is
`SSL_get_peer_certificate`  being split into
`SSL_get1_peer_certificate`  (which is compatible with the prior symbol)
and  `SSL_get0_peer_certificate` .

This PR modifies  `SSL_get_peer_certificate`  in the wrapper to use the
new symbol if available. No changes in other programs are required.

## Details
*  `SSL_get_peer_certificate`  will now select either
`SSL_get1_peer_certificate`  or  `SSL_get_peer_certificate`  depending
on which symbols are available.
* DLL names for OpenSSL 3.x have been added for macOS, Windows and
Linux.
* The symbols used for certificate verification are no longer
unconditionally hidden on Windows. They were hidden previously as Nim
ships old OpenSSL 1.0 which did not have these symbols.

Fixes https://github.com/nim-works/nimskull/issues/1160
---
 lib/wrappers/openssl.nim | 24 ++++++++++++++----------
 1 file changed, 14 insertions(+), 10 deletions(-)

diff --git a/lib/wrappers/openssl.nim b/lib/wrappers/openssl.nim
index cdc3969d0f6..38c5ac6f59e 100644
--- a/lib/wrappers/openssl.nim
+++ b/lib/wrappers/openssl.nim
@@ -63,19 +63,19 @@ elif useWinVersion:
         DLLUtilName* = "libeay32.dll"
   elif defined(cpu64):
     const
-      DLLSSLName* = "(libssl-1_1-x64|ssleay64|libssl64).dll"
-      DLLUtilName* = "(libcrypto-1_1-x64|libeay64).dll"
+      DLLSSLName* = "(libssl-3-x64|libssl-1_1-x64|ssleay64|libssl64).dll"
+      DLLUtilName* = "(libcrypto-3-x64|libcrypto-1_1-x64|libeay64).dll"
   else:
     const
-      DLLSSLName* = "(libssl-1_1|ssleay32|libssl32).dll"
-      DLLUtilName* = "(libcrypto-1_1|libeay32).dll"
+      DLLSSLName* = "(libssl-3|libssl-1_1|ssleay32|libssl32).dll"
+      DLLUtilName* = "(libcrypto-3|libcrypto-1_1|libeay32).dll"
 
   from std/winlean import SocketHandle
 else:
   when defined(osx):
-    const versions = "(.1.1|.38|.39|.41|.43|.44|.45|.46|.47|.48|.10|.1.0.2|.1.0.1|.1.0.0|.0.9.9|.0.9.8|)"
+    const versions = "(.3|.1.1|.38|.39|.41|.43|.44|.45|.46|.47|.48|.10|.1.0.2|.1.0.1|.1.0.0|.0.9.9|.0.9.8|)"
   else:
-    const versions = "(.1.1|.1.0.2|.1.0.1|.1.0.0|.0.9.9|.0.9.8|.48|.47|.46|.45|.44|.43|.41|.39|.38|.10|)"
+    const versions = "(.3|.1.1|.1.0.2|.1.0.1|.1.0.0|.0.9.9|.0.9.8|.48|.47|.46|.45|.44|.43|.41|.39|.38|.10|)"
 
   when defined(macosx):
     const
@@ -796,10 +796,14 @@ when defined(nimHasStyleChecks):
 
 # Certificate validation
 # On old openSSL version some of these symbols are not available
-when not defined(nimDisableCertificateValidation) and not defined(windows):
-
-  proc SSL_get_peer_certificate*(ssl: SslCtx): PX509{.cdecl, dynlib: DLLSSLName,
-      importc.}
+when not defined(nimDisableCertificateValidation):
+
+  proc SSL_get_peer_certificate*(ssl: SslCtx): PX509 {.gcsafe, tags: [].} =
+    {.cast(tags: []), cast(gcsafe).}:
+      let thisProc {.global.} = cast[proc (ssl: SslCtx): PX509 {.cdecl.}](
+        sslSymThrows("SSL_get1_peer_certificate", "SSL_get_peer_certificate")
+      )
+      if not thisProc.isNil: result = thisProc(ssl)
 
   proc X509_get_subject_name*(a: PX509): PX509_NAME{.cdecl, dynlib: DLLSSLName, importc.}
 

From fd7d2f5b46e236d039bc2e4633bfd0adbf44fa62 Mon Sep 17 00:00:00 2001
From: alaviss <leorize+oss@disroot.org>
Date: Tue, 18 Jun 2024 15:56:10 -0500
Subject: [PATCH 126/169] actions/setup-mingw: bump release-downloader to 1.10
 (#1350)

## Summary
No functional changes other than a bump to NodeJS 20 since 16 has been
deprecated by GitHub.

## Details
* GitHub has deprecated version 16 since Oct 2023:

https://github.blog/changelog/2023-09-22-github-actions-transitioning-from-node-16-to-node-20/
---
 .github/actions/setup-mingw/action.yml | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

diff --git a/.github/actions/setup-mingw/action.yml b/.github/actions/setup-mingw/action.yml
index 19c9baba6c6..3298a6e7ce0 100644
--- a/.github/actions/setup-mingw/action.yml
+++ b/.github/actions/setup-mingw/action.yml
@@ -18,7 +18,7 @@ runs:
 
     - name: Download from niXman/mingw-builds-binaries
       id: download
-      uses: robinraju/release-downloader@v1.8
+      uses: robinraju/release-downloader@v1.10
       with:
         repository: niXman/mingw-builds-binaries
         tag: ${{ inputs.mingw-version }}
@@ -31,8 +31,7 @@ runs:
         Join-Path $env:RUNNER_TEMP "mingw64" "bin" | Out-File -Append $env:GITHUB_PATH
       shell: pwsh
       env:
-        MINGW_ARCHIVE:
-          ${{ fromJson(steps.download.outputs.downloaded_files)[0] }}
+        MINGW_ARCHIVE: ${{ fromJson(steps.download.outputs.downloaded_files)[0] }}
       working-directory: ${{ runner.temp }}
 
     - name: Print GCC version

From 73e775542624083bfd40a15175eb0c5bcab9a332 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Wed, 19 Jun 2024 16:12:58 +0200
Subject: [PATCH 127/169] make the REPL (`nim secret`) work again (#1351)

## Summary

Properly configure the compiler when running the `nim secret`
command, making the compiler built-in REPL usable again.

## Details

* the compiler is configured for the VM backend when the
  `cmdInteractive` command is active
* `echo` output is no longer prefixed by `>>>`
* a test is added to ensure the basic REPL functionality works
* the standard output stream is flushed after writing `>>>` or `...`,
  so that the test is able to read the output
---
 compiler/ast/llstream.nim        |  1 +
 compiler/front/cli_reporter.nim  |  3 +-
 compiler/front/main.nim          |  6 ++--
 tests/compilerfeatures/trepl.nim | 55 ++++++++++++++++++++++++++++++++
 4 files changed, 61 insertions(+), 4 deletions(-)
 create mode 100644 tests/compilerfeatures/trepl.nim

diff --git a/compiler/ast/llstream.nim b/compiler/ast/llstream.nim
index 0fd5c53eba6..eaf484cc921 100644
--- a/compiler/ast/llstream.nim
+++ b/compiler/ast/llstream.nim
@@ -75,6 +75,7 @@ when not declared(readLineFromStdin):
   # fallback implementation:
   proc readLineFromStdin(prompt: string, line: var string): bool =
     stdout.write(prompt)
+    stdout.flushFile()
     result = readLine(stdin, line)
     if not result:
       stdout.write("\n")
diff --git a/compiler/front/cli_reporter.nim b/compiler/front/cli_reporter.nim
index 08508dfa28d..3272f533b79 100644
--- a/compiler/front/cli_reporter.nim
+++ b/compiler/front/cli_reporter.nim
@@ -2617,8 +2617,7 @@ To create a stacktrace, rerun compilation with './koch temp $1 <file>'
       )
 
     of rintEchoMessage:
-      result = if conf.cmd == cmdInteractive: ">>> " & r.msg
-               else:                          r.msg
+      result = r.msg
 
     of rintCannotOpenFile, rintWarnCannotOpenFile:
       result = "cannot open file: $1" % r.file
diff --git a/compiler/front/main.nim b/compiler/front/main.nim
index 42cea67b373..f7b8f70835a 100644
--- a/compiler/front/main.nim
+++ b/compiler/front/main.nim
@@ -505,7 +505,7 @@ proc mainCommand*(graph: ModuleGraph) =
 
   ## command prepass
   if conf.cmd == cmdCrun: conf.incl {optRun, optUseNimcache}
-  if conf.cmd notin cmdBackends + {cmdTcc, cmdNimscript}:
+  if conf.cmd notin cmdBackends + {cmdTcc, cmdNimscript, cmdInteractive}:
     customizeForBackend(graph, conf, backendC)
   if conf.outDir.isEmpty:
     # doc like commands can generate a lot of files (especially with --project)
@@ -675,7 +675,9 @@ proc mainCommand*(graph: ModuleGraph) =
     wantMainModule(conf)
     commandView(graph)
     #msgWriteln(conf, "Beware: Indentation tokens depend on the parser's state!")
-  of cmdInteractive: commandInteractive(graph)
+  of cmdInteractive:
+    customizeForBackend(graph, conf, backendNimVm)
+    commandInteractive(graph)
   of cmdNimscript:
     if conf.inputMode == pimFile and not fileExists(conf.projectFull):
       localReport(conf, InternalReport(
diff --git a/tests/compilerfeatures/trepl.nim b/tests/compilerfeatures/trepl.nim
new file mode 100644
index 00000000000..cdad8e87c82
--- /dev/null
+++ b/tests/compilerfeatures/trepl.nim
@@ -0,0 +1,55 @@
+discard """
+  description: "Ensure that the basic REPL functionality works"
+  targets: native
+  timeout: "5"
+"""
+
+import std/[streams, os, osproc]
+
+const Compiler = getCurrentCompilerExe()
+
+let
+  repl = startProcess(Compiler, args=["secret"], options={poStdErrToStdOut})
+  output = repl.inputStream()  # the REPL's stdin; written to by the test
+  input  = repl.outputStream() # the REPL's stdout+stderr; read by the test
+
+template expectLine(expect: string) =
+  var line: string
+  doAssert readLine(input, line)
+  doAssert line == expect, "got: " & line
+
+template expect(expect: static string) =
+  var got = readStr(input, expect.len)
+  doAssert got == expect, "got: " & got
+
+template writeLine(line: string) =
+  writeLine(output, line)
+  flush(output)
+
+expect ">>> "
+# okay, startup was successful; no error was reported
+
+# test a simple echo statement
+writeLine "echo \"hello\""
+expectLine "hello"
+
+# test a simple procedure definition
+expect ">>> "
+writeLine "proc p() ="
+expect "... "
+writeLine "  echo \"here\""
+expect "... "
+writeLine ""
+expect ">>> "
+writeLine "p()" # call the procedure
+expectLine "here"
+
+# quit the REPL
+expect ">>> "
+writeLine "quit()"
+
+# make sure shutdown worked without an error
+let code = waitForExit(repl)
+doAssert code == 0, "non-zero exit code: " & $code
+
+repl.close()

From 251c073c01c042d974d13ab7a2082a195d6090f0 Mon Sep 17 00:00:00 2001
From: alaviss <leorize+oss@disroot.org>
Date: Wed, 19 Jun 2024 10:03:55 -0500
Subject: [PATCH 128/169] ci: replace vcpkg-action with simpler setup-vcpkg
 (#1352)

## Summary
johnwason/vcpkg-action depends on various other actions that are now
out-of-date and is using deprecated NodeJS 16. Given that vcpkg
configuration and bootstrap is very simple, replace our usage with a
simpler homemade setup-vcpkg instead.

## Details
* Added a new  `setup-vcpkg`  action. This action is rather simple and
consists only of exporting environment variables to configure vcpkg.
* Replace usage of `johnwason/vcpkg-action` with `setup-vcpkg`.
---
 .github/actions/setup-vcpkg/action.yml | 62 ++++++++++++++++++++++++++
 .github/workflows/ci.yml               | 32 ++++++-------
 2 files changed, 78 insertions(+), 16 deletions(-)
 create mode 100644 .github/actions/setup-vcpkg/action.yml

diff --git a/.github/actions/setup-vcpkg/action.yml b/.github/actions/setup-vcpkg/action.yml
new file mode 100644
index 00000000000..19b0a27b0f8
--- /dev/null
+++ b/.github/actions/setup-vcpkg/action.yml
@@ -0,0 +1,62 @@
+name: Setup vcpkg
+description: Clone and setup vcpkg
+inputs:
+  triplet:
+    description: Specify the target triplet
+    required: false
+  host-triplet:
+    description: Specify the host triplet
+    required: false
+  overlay-triplets:
+    description: Additional directories to search for triplets, one entry per line
+    required: false
+  revision:
+    description: The revision of the vcpkg registry to be used
+    required: false
+
+runs:
+  using: composite
+
+  steps:
+    - name: Clone vcpkg
+      uses: actions/checkout@v4
+      with:
+        repository: microsoft/vcpkg
+        ref: ${{ inputs.revision }}
+        filter: tree:0
+        path: vcpkg
+
+    - name: Setup environment variables
+      uses: actions/github-script@v7
+      with:
+        script: |
+          // Configuration for GitHub Actions cache
+          core.exportVariable('ACTIONS_CACHE_URL', process.env.ACTIONS_CACHE_URL || '');
+          core.exportVariable('ACTIONS_RUNTIME_TOKEN', process.env.ACTIONS_RUNTIME_TOKEN || '');
+
+          // vcpkg configuration
+          const path = require('node:path');
+          const vcpkg_root = path.join(process.env.GITHUB_WORKSPACE, 'vcpkg');
+          core.exportVariable('VCPKG_ROOT', vcpkg_root);
+          core.addPath(vcpkg_root);
+
+          core.exportVariable('VCPKG_BINARY_SOURCES', 'clear;x-gha,readwrite');
+          const triplet = process.env.AINPUT_TRIPLET;
+          if (triplet) {
+            core.exportVariable('VCPKG_DEFAULT_TRIPLET', triplet);
+          }
+          const hostTriplet = process.env.AINPUT_HOST_TRIPLET;
+          if (hostTriplet) {
+            core.exportVariable('VCPKG_DEFAULT_HOST_TRIPLET', hostTriplet);
+          }
+          const tripletOverlays = process.env.AINPUT_OVERLAY_TRIPLETS?.replace(/\r?\n/g, path.delimiter);
+          if (tripletOverlays) {
+            core.exportVariable('VCPKG_OVERLAY_TRIPLETS', tripletOverlays);
+          }
+      env:
+        AINPUT_TRIPLET: ${{ inputs.triplet }}
+        AINPUT_HOST_TRIPLET: ${{ inputs.host-triplet }}
+        AINPUT_OVERLAY_TRIPLETS: ${{ inputs.overlay-triplets }}
+
+    - run: ./vcpkg/bootstrap-vcpkg.sh
+      shell: bash
diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
index 6d3f31af1a3..9674bfec052 100644
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@@ -135,18 +135,18 @@ jobs:
         if: runner.os == 'Windows'
         uses: ./.github/actions/setup-mingw
 
-      - name: Install dependencies (Windows)
+      - name: Setup vcpkg (Windows)
         if: runner.os == 'Windows'
-        uses: johnwason/vcpkg-action@v6
+        uses: ./.github/actions/setup-vcpkg
         with:
-          pkgs: >-
-            pcre
-            sqlite3
           triplet: x64-mingw-dynamic-release
-          extra-args: --overlay-triplets=${{ github.workspace }}/tools/vcpkg/triplets --host-triplet=x64-mingw-dynamic-release
+          host-triplet: x64-mingw-dynamic-release
           revision: 2024.01.12
-          github-binarycache: true
-          token: ${{ github.token }}
+          overlay-triplets: ${{ github.workspace }}/tools/vcpkg/triplets
+
+      - name: Install dependencies (Windows)
+        if: runner.os == 'Windows'
+        run: vcpkg install pcre sqlite3
 
       - name: Download CA certificates (Windows)
         if: runner.os == 'Windows'
@@ -393,18 +393,18 @@ jobs:
           # Pipe from zstd to tar because macOS' tar does not support unpacking zstd
           zstd -c -d "$archive" | tar -xf - --strip-components 1
 
-      - name: Install dependencies (Windows)
+      - name: Setup vcpkg (Windows)
         if: runner.os == 'Windows'
-        uses: johnwason/vcpkg-action@v6
+        uses: ./git-src/.github/actions/setup-vcpkg
         with:
-          pkgs: >-
-            pcre
-            sqlite3
           triplet: x64-mingw-dynamic-release
-          extra-args: --overlay-triplets=${{ github.workspace }}/tools/vcpkg/triplets --host-triplet=x64-mingw-dynamic-release
+          host-triplet: x64-mingw-dynamic-release
           revision: 2024.01.12
-          github-binarycache: true
-          token: ${{ github.token }}
+          overlay-triplets: ${{ github.workspace }}/tools/vcpkg/triplets
+
+      - name: Install dependencies (Windows)
+        if: runner.os == 'Windows'
+        run: vcpkg install pcre sqlite3
 
       - name: Add DLLs to PATH (Windows)
         if: runner.os == 'Windows'

From 6cfebd9bece9cb0c0a5f997936e8ab3e75008ed7 Mon Sep 17 00:00:00 2001
From: alaviss <leorize+oss@disroot.org>
Date: Wed, 19 Jun 2024 14:17:03 -0500
Subject: [PATCH 129/169] Produce a meaningful error message for invalid module
 name (#1354)

## Summary
While the AST form of the error generated by  `modules/modulepaths`  is
handled in  `cli_reporter` , the symbol form was not, creating terrible
error messages such as:

    Error: invalid module name '<nil tree>'

This PR makes cli_reporter aware of the symbol form generated by
`modules/modules` , fixing the bad error message.

## Details
*  `cli_reporter`  now handles the symbol form of
`rsemInvalidModuleName`  correctly.
*  `modules/modules`  now raises  `rsemInvalidModuleName`  with line
information, allowing users and tools to know which file the error
originated from.

Fixes https://github.com/nim-works/nimskull/issues/720

---------

Co-authored-by: zerbina <100542850+zerbina@users.noreply.github.com>
---
 compiler/front/cli_reporter.nim | 5 ++++-
 compiler/modules/modules.nim    | 6 +++++-
 tests/errmsgs/tinvalid-name.nim | 6 ++++++
 3 files changed, 15 insertions(+), 2 deletions(-)
 create mode 100644 tests/errmsgs/tinvalid-name.nim

diff --git a/compiler/front/cli_reporter.nim b/compiler/front/cli_reporter.nim
index 3272f533b79..f5ea7744a7e 100644
--- a/compiler/front/cli_reporter.nim
+++ b/compiler/front/cli_reporter.nim
@@ -1636,7 +1636,10 @@ proc reportBody*(conf: ConfigRef, r: SemReport): string =
       result = "using '.' instead of '/' in import paths is deprecated"
 
     of rsemInvalidModuleName:
-      result = "invalid module name: '$1'" % r.ast.render
+      if r.sym != nil:
+        result = "invalid module name: '$1'" % r.symstr
+      else:
+        result = "invalid module name: '$1'" % r.ast.render
 
     of rsemInvalidMethodDeclarationOrder:
       result = "invalid declaration order; cannot attach '" & r.symbols[0].name.s &
diff --git a/compiler/modules/modules.nim b/compiler/modules/modules.nim
index 28b4b70772f..1a438fe5844 100644
--- a/compiler/modules/modules.nim
+++ b/compiler/modules/modules.nim
@@ -104,7 +104,11 @@ proc newModule(graph: ModuleGraph; fileIdx: FileIndex): PSym =
                 name: getModuleIdent(graph, filename),
                 info: newLineInfo(fileIdx, 1, 1))
   if not isNimIdentifier(result.name.s):
-    localReport(graph.config, reportSym(rsemInvalidModuleName, result))
+    localReport(
+      graph.config,
+      newLineInfo(fileIdx, 0, -1),
+      reportSym(rsemInvalidModuleName, result)
+    )
 
   partialInitModule(result, graph, fileIdx, filename)
   graph.registerModule(result)
diff --git a/tests/errmsgs/tinvalid-name.nim b/tests/errmsgs/tinvalid-name.nim
new file mode 100644
index 00000000000..e0706cae043
--- /dev/null
+++ b/tests/errmsgs/tinvalid-name.nim
@@ -0,0 +1,6 @@
+discard """
+  description: '''
+    Test that a proper error message is printed for a module with invalid name
+  '''
+  errormsg: "invalid module name: 'tinvalid-name'"
+"""

From de5ff57b1899c5d75474a28bfa2f8b335c69055c Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Thu, 20 Jun 2024 03:33:33 +0200
Subject: [PATCH 130/169] fix incorrect typing in closure-iterator C code-gen
 (#1355)

## Summary

Fix the C code generator emitting incorrectly typed code for
closure-iterators, which recent, stricter C compilers report errors
for.

Fixes https://github.com/nim-works/nimskull/issues/1353.

## Details

When computing the environment for a closure iterator where the
iterator closes over some outer locals, there's already a symbol in
the hidden parameter slot, using the environment type of the enclosing
routine.

The symbol is retyped during closure iterator environment computation,
but the *node* referencing it was not updated. `cgen` used the MIR
local's type for the definition, but the *node's* type (which was still
the enclosing procedure's environment type) for the cast, resulting in
a pointer type mismatch.

The node referencing the symbol is now also updated, and an assertion
to make sure the types match is added in `cgen`.
---
 compiler/backend/cgen.nim      | 1 +
 compiler/sem/lambdalifting.nim | 2 ++
 2 files changed, 3 insertions(+)

diff --git a/compiler/backend/cgen.nim b/compiler/backend/cgen.nim
index 02627a31d1e..1b3f39a32fd 100644
--- a/compiler/backend/cgen.nim
+++ b/compiler/backend/cgen.nim
@@ -683,6 +683,7 @@ proc closureSetup(p: BProc, prc: PSym) =
   # prc.ast[paramsPos].last contains the type we're after:
   var ls = lastSon(prc.ast[paramsPos])
   p.config.internalAssert(ls.kind == nkSym, prc.info, "closure generation failed")
+  p.config.internalAssert(ls.typ == ls.sym.typ) # sanity check
   var env = ls.sym.position + 1 # parameters start at ID 1
 
   let n = newLocalRef(LocalId(env), ls.info, ls.typ)
diff --git a/compiler/sem/lambdalifting.nim b/compiler/sem/lambdalifting.nim
index e26d7eb50eb..6d37a2532de 100644
--- a/compiler/sem/lambdalifting.nim
+++ b/compiler/sem/lambdalifting.nim
@@ -769,6 +769,8 @@ proc liftLambdas*(g: ModuleGraph; fn: PSym, body: PNode;
       param = getHiddenParam(g, fn)
     else:
       param.typ = t # replace with the correct type
+      # also update the symbol *node's* type
+      fn.ast[paramsPos][^1].typ = t
 
     prepareInnerRoutines(d, idgen, t, fn.info)
     # the environment instance is not setup here; that's done at the iterator's

From 8d1dae2c8ff03b48bf5a4b8dabd83fa832b31ef3 Mon Sep 17 00:00:00 2001
From: Adam Sherwood <43248857+theSherwood@users.noreply.github.com>
Date: Mon, 24 Jun 2024 13:50:41 -0600
Subject: [PATCH 131/169] sem: fix crash when `sizeof` is called on generic
 type (#1328)

## Summary
* Changes  `semSizeof`  to check that the argument to  `sizeof`  is a
concrete type and report an error if that is not the case
* Fixes issue in which  `sizeof`  is called with a generic type, causing
the compiler to crash

## Details

Fixes: https://github.com/nim-works/nimskull/issues/1317

* The following code was causing the compiler to crash. Now it should
cause the compiler to print an error message about concrete types.
```nim
type
  GenericType[K, V] = object
    field: (K, V)

let size = sizeof(GenericType)
```
* adds  `adSemTIsNotAConcreteType`  and maps it to
`rsemTIsNotAConcreteType`
* adds minimal test featuring the snippet above
---
 compiler/ast/ast_types.nim                    |  2 ++
 compiler/front/cli_reporter.nim               |  1 +
 compiler/front/msgs.nim                       |  1 +
 compiler/sem/semexprs.nim                     | 13 +------------
 compiler/sem/semmagic.nim                     | 19 ++++++++++++++++++-
 .../generics/tsizeof_generic_error.nim        | 10 ++++++++++
 .../tsizeof_generic_error_overloaded.nim      | 13 +++++++++++++
 7 files changed, 46 insertions(+), 13 deletions(-)
 create mode 100644 tests/lang_callable/generics/tsizeof_generic_error.nim
 create mode 100644 tests/lang_callable/generics/tsizeof_generic_error_overloaded.nim

diff --git a/compiler/ast/ast_types.nim b/compiler/ast/ast_types.nim
index d271d0fba8f..58770d82c61 100644
--- a/compiler/ast/ast_types.nim
+++ b/compiler/ast/ast_types.nim
@@ -1075,6 +1075,7 @@ type
     # type
     adSemTypeMismatch
     adSemTypeNotAllowed
+    adSemTIsNotAConcreteType
     # lookup
     adSemUndeclaredIdentifier
     adSemConflictingExportnims
@@ -1410,6 +1411,7 @@ type
     of adSemAsmEmitExpectsStringLiteral:
       unexpectedKind*: TNodeKind
     of adSemRaisesPragmaExpectsObject,
+        adSemTIsNotAConcreteType,
         adSemCannotInferTypeOfLiteral,
         adSemProcHasNoConcreteType,
         adSemCannotCastToNonConcrete,
diff --git a/compiler/front/cli_reporter.nim b/compiler/front/cli_reporter.nim
index f5ea7744a7e..2f450495650 100644
--- a/compiler/front/cli_reporter.nim
+++ b/compiler/front/cli_reporter.nim
@@ -3391,6 +3391,7 @@ func astDiagToLegacyReport(conf: ConfigRef, diag: PAstDiag): Report {.inline.} =
               "contains '$1'" % $diag.unexpectedKind,
         ast: diag.wrongNode)
   of adSemRaisesPragmaExpectsObject,
+      adSemTIsNotAConcreteType,
       adSemCannotInferTypeOfLiteral,
       adSemProcHasNoConcreteType,
       adSemCannotAssignTo:
diff --git a/compiler/front/msgs.nim b/compiler/front/msgs.nim
index 01a3540303a..d59bc03a49d 100644
--- a/compiler/front/msgs.nim
+++ b/compiler/front/msgs.nim
@@ -424,6 +424,7 @@ func astDiagToLegacyReportKind*(
   of adWrappedError: rsemWrappedError
   of adSemTypeMismatch: rsemTypeMismatch
   of adSemTypeNotAllowed: rsemTypeNotAllowed
+  of adSemTIsNotAConcreteType: rsemTIsNotAConcreteType
   of adSemUndeclaredIdentifier: rsemUndeclaredIdentifier
   of adSemConflictingExportnims: rsemConflictingExportnims
   of adSemAmbiguousIdent: rsemAmbiguousIdent
diff --git a/compiler/sem/semexprs.nim b/compiler/sem/semexprs.nim
index 455fdeb0b6f..a810fd6033d 100644
--- a/compiler/sem/semexprs.nim
+++ b/compiler/sem/semexprs.nim
@@ -2823,17 +2823,6 @@ proc setMs(n: PNode, s: PSym): PNode =
   n[0] = newSymNode(s)
   n[0].info = n.info
 
-proc semSizeof(c: PContext, n: PNode): PNode =
-  case n.len
-  of 2:
-    #restoreOldStyleType(n[1])
-    n[1] = semExprWithType(c, n[1])
-    n.typ = getSysType(c.graph, n.info, tyInt)
-    result = foldSizeOf(c.config, n, n)
-  else:
-    result = c.config.newError(n, PAstDiag(kind: adSemMagicExpectTypeOrValue,
-                                            magic: mSizeOf))
-
 proc semMagic(c: PContext, n: PNode, s: PSym, flags: TExprFlags): PNode =
   # this is a hotspot in the compiler!
   result = n
@@ -2917,7 +2906,7 @@ proc semMagic(c: PContext, n: PNode, s: PSym, flags: TExprFlags): PNode =
       result = c.graph.emptyNode
   of mSizeOf:
     markUsed(c, n.info, s)
-    result = semSizeof(c, setMs(n, s))
+    result = semSizeOf(c, setMs(n, s))
   else:
     result = semDirectOp(c, n, flags)
 
diff --git a/compiler/sem/semmagic.nim b/compiler/sem/semmagic.nim
index a4e6bdf1122..663d2ea7870 100644
--- a/compiler/sem/semmagic.nim
+++ b/compiler/sem/semmagic.nim
@@ -44,6 +44,23 @@ proc semTypeOf(c: PContext; n: PNode): PNode =
   else:
     result.typ = makeTypeDesc(c, typExpr.typ)
 
+proc semSizeOf(c: PContext, n: PNode): PNode =
+  case n.len
+  of 2:
+    #restoreOldStyleType(n[1])
+    n[1] = semExprWithType(c, n[1])
+    if containsGenericType(n[1].typ):
+      # report the type, not the typedesc
+      n[1] = c.config.newError(n[1], PAstDiag(kind: adSemTIsNotAConcreteType,
+                                              wrongType: n[1].typ[0]))
+      result = n
+    else:
+      n.typ = getSysType(c.graph, n.info, tyInt)
+      result = foldSizeOf(c.config, n, n)
+  else:
+    result = c.config.newError(n, PAstDiag(kind: adSemMagicExpectTypeOrValue,
+                                            magic: mSizeOf))
+
 type
   SemAsgnMode = enum asgnNormal, noOverloadedSubscript, noOverloadedAsgn
 
@@ -403,7 +420,7 @@ proc magicsAfterOverloadResolution(c: PContext, n: PNode,
   of mTypeOf:
     result = semTypeOf(c, n)
   of mSizeOf:
-    result = foldSizeOf(c.config, n, n)
+    result = semSizeOf(c, n)
   of mAlignOf:
     result = foldAlignOf(c.config, n, n)
   of mOffsetOf:
diff --git a/tests/lang_callable/generics/tsizeof_generic_error.nim b/tests/lang_callable/generics/tsizeof_generic_error.nim
new file mode 100644
index 00000000000..fa0d7659f90
--- /dev/null
+++ b/tests/lang_callable/generics/tsizeof_generic_error.nim
@@ -0,0 +1,10 @@
+discard """
+  errormsg: "'GenericType' is not a concrete type"
+  line: 10
+"""
+
+type
+  GenericType[K, V] = object
+    field: (K, V)
+
+let size = sizeof(GenericType)
diff --git a/tests/lang_callable/generics/tsizeof_generic_error_overloaded.nim b/tests/lang_callable/generics/tsizeof_generic_error_overloaded.nim
new file mode 100644
index 00000000000..41c06c68142
--- /dev/null
+++ b/tests/lang_callable/generics/tsizeof_generic_error_overloaded.nim
@@ -0,0 +1,13 @@
+discard """
+  errormsg: "'GenericType' is not a concrete type"
+  line: 13
+"""
+
+type
+  GenericType[K, V] = object
+    field: (K, V)
+
+# Overload sizeof
+proc sizeof(a, b: int) = discard
+
+let size = sizeof(GenericType)

From 9e4bdb0b79362236bf5472ed168d635875df33e2 Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Wed, 26 Jun 2024 18:01:18 +0000
Subject: [PATCH 132/169] build(deps): Bump softprops/action-gh-release from
 2.0.5 to 2.0.6 (#1356)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bumps

[softprops/action-gh-release](https://github.com/softprops/action-gh-release)
from 2.0.5 to 2.0.6.
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a

href="https://github.com/softprops/action-gh-release/releases">softprops/action-gh-release's
releases</a>.</em></p>
<blockquote>
<h2>v2.0.6</h2>
<p>maintenance release with updated dependencies</p>
</blockquote>
</details>
<details>
<summary>Changelog</summary>
<p><em>Sourced from <a

href="https://github.com/softprops/action-gh-release/blob/master/CHANGELOG.md">softprops/action-gh-release's
changelog</a>.</em></p>
<blockquote>
<h2>2.0.6</h2>
<ul>
<li>maintenance release with updated dependencies</li>
</ul>
</blockquote>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a

href="https://github.com/softprops/action-gh-release/commit/a74c6b72af54cfa997e81df42d94703d6313a2d0"><code>a74c6b7</code></a>
update changelog</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/b909f761f0367defeee0c2804db31a81c41dd81e"><code>b909f76</code></a>
update dist/index.js</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/e49d08fa3245e75166ef8eb8bc9d7521d34658eb"><code>e49d08f</code></a>
chore(deps): bump glob from 8.0.3 to 10.4.2</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/f12ad255e1c9d5cfd57d1ea9dca3e3001392be35"><code>f12ad25</code></a>
chore(deps): bump <code>@​octokit/plugin-throttling</code> from 4.3.2 to
9.3.0</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/7039a825a7b0413e21c08b679d39690ada00386f"><code>7039a82</code></a>
chore: release 2.0.6</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/f9c2b6ca3738015453adef1caa20347e8ac0fa6d"><code>f9c2b6c</code></a>
chore: update deps and run build</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/73738a629386c54e67bc26a1e14437a5d0b686a0"><code>73738a6</code></a>
chore(deps): bump node dep and <code>@types/node</code></li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/a500a35279e4ba77e64279527fb2a91bfc538dbe"><code>a500a35</code></a>
Bump ts-jest from 29.0.3 to 29.1.4 (<a

href="https://redirect.github.com/softprops/action-gh-release/issues/459">#459</a>)</li>
<li>See full diff in <a

href="https://github.com/softprops/action-gh-release/compare/v2.0.5...v2.0.6">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility

score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=softprops/action-gh-release&package-manager=github_actions&previous-version=2.0.5&new-version=2.0.6)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase` .

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 .github/workflows/publisher.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/publisher.yml b/.github/workflows/publisher.yml
index 61479c52ce0..ae4eb4b8884 100644
--- a/.github/workflows/publisher.yml
+++ b/.github/workflows/publisher.yml
@@ -101,7 +101,7 @@ jobs:
 
       - id: release
         name: Create pre-release
-        uses: softprops/action-gh-release@v2.0.5
+        uses: softprops/action-gh-release@v2.0.6
         with:
           prerelease: true
           files: ${{ steps.release-files.outputs.result }}

From e0ad8b193a9c501c54eae09f962ab53841c92744 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Wed, 26 Jun 2024 20:30:30 +0200
Subject: [PATCH 133/169] deprecate the `.codegenDecl` pragma (#1358)

## Summary

The `.codegenDecl` pragma is going to be removed eventually. For a
transition period, a deprecation warning is now reported when using it.
---
 compiler/ast/report_enums.nim   | 1 +
 compiler/front/cli_reporter.nim | 4 ++++
 compiler/sem/pragmas.nim        | 2 ++
 3 files changed, 7 insertions(+)

diff --git a/compiler/ast/report_enums.nim b/compiler/ast/report_enums.nim
index 4b4afeeef41..9c8a2956ebd 100644
--- a/compiler/ast/report_enums.nim
+++ b/compiler/ast/report_enums.nim
@@ -734,6 +734,7 @@ type
     rsemLockLevelMismatch        = "LockLevel"
     rsemTypelessParam            = "TypelessParam"
     rsemOwnedTypeDeprecated
+    rsemCodegenDeclDeprecated    = "Deprecated"
 
     rsemWarnUnlistedRaises = "Effect" ## `sempass2.checkRaisesSpec` had
     ## `emitWarnings: bool` parameter which was supposedly used to control
diff --git a/compiler/front/cli_reporter.nim b/compiler/front/cli_reporter.nim
index 2f450495650..d4d2242b57b 100644
--- a/compiler/front/cli_reporter.nim
+++ b/compiler/front/cli_reporter.nim
@@ -428,6 +428,10 @@ proc reportBody*(conf: ConfigRef, r: SemReport): string =
     of rsemOwnedTypeDeprecated:
       result = "the `owned` type-operator is deprecated and treated as a no-op"
 
+    of rsemCodegenDeclDeprecated:
+      result = "the `.codegenDecl` pragma is deprecated; support for it " &
+               "will be removed in the future"
+
     of rsemLinterReport:
       result.addf("'$1' should be: '$2'", r.linterFail.got, r.linterFail.wanted)
 
diff --git a/compiler/sem/pragmas.nim b/compiler/sem/pragmas.nim
index 58b479b0be3..486439bdf25 100644
--- a/compiler/sem/pragmas.nim
+++ b/compiler/sem/pragmas.nim
@@ -299,6 +299,8 @@ proc processCodegenDecl(c: PContext, n: PNode, sym: PSym): PNode =
   ## the string literal from `n`
   result = getStrLitNode(c, n)
   sym.constraint = result
+  # issue a deprecation warning:
+  c.config.localReport(n.info, reportSem(rsemCodegenDeclDeprecated))
 
 proc processMagic(c: PContext, n: PNode, s: PSym): PNode =
   ## produces an error if `n` is not a pragmacall kinds, otherwise `n` is

From a21c4db569067f4d9a5f8feee553af1af582f5d1 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Thu, 27 Jun 2024 07:54:56 +0200
Subject: [PATCH 134/169] fix incorrect removal of self-assignments (#1357)

## Summary

Fix a bug with the MIR-based alias analysis that caused assignments
like `arr[x][1] = arr[y][1]` to be considered self-assignments and
therefore removed.

## Details

Change `compare` to not regress the 'overlap' state from `maybe` back
to `yes` when the compared array indices are the same. The regression
caused expressions of the same shape, where the outermost array access
uses the same static index, to be treated as referring to the same
location (even when they don't).

`injectdestructors` uses the `aliasanalysis` results to remove self-
assignments, causing the erroneous removal of assignments. All other
uses of `aliasanalysis` are for disabling optimizations, so
observable behaviour was not affected there.

---------

Co-authored-by: Saem Ghani <saemghani+github@gmail.com>
---
 compiler/sem/aliasanalysis.nim          |  9 ++++++--
 tests/assign/tarray_expr_assignment.nim | 28 +++++++++++++++++++++++++
 2 files changed, 35 insertions(+), 2 deletions(-)
 create mode 100644 tests/assign/tarray_expr_assignment.nim

diff --git a/compiler/sem/aliasanalysis.nim b/compiler/sem/aliasanalysis.nim
index 8906d6bc5b4..efab582f858 100644
--- a/compiler/sem/aliasanalysis.nim
+++ b/compiler/sem/aliasanalysis.nim
@@ -205,9 +205,14 @@ proc compare*(body: MirTree, a, b: Path): CmpLocsResult =
         break
 
     of pikIndex:
-      overlaps = sameIndex(na, nb)
-      if overlaps == no:
+      case sameIndex(na, nb)
+      of no:
+        overlaps = no
         break
+      of yes:
+        discard "don't change back to 'yes'"
+      of maybe:
+        overlaps = maybe
 
     inc i
 
diff --git a/tests/assign/tarray_expr_assignment.nim b/tests/assign/tarray_expr_assignment.nim
new file mode 100644
index 00000000000..43a7b7dcfdc
--- /dev/null
+++ b/tests/assign/tarray_expr_assignment.nim
@@ -0,0 +1,28 @@
+discard """
+  description: '''
+    Regression test for an alias-analysis bug that caused expressions involving
+    array-subscript expressions to erroneously be eliminated in some cases
+  '''
+  targets: c js vm
+"""
+
+type
+  Object = object
+    val: int
+  Type = array[2, array[2, Object]]
+
+# important: the bug only affected code in procedures that work with destructor-
+# having types
+proc `=destroy`(x: var Object) =
+  discard
+
+proc test(x, y: int) {.noinline.} =
+  var a = [[Object(val: 1), Object(val: 2)], [Object(val: 3), Object(val: 4)]]
+  # whether the two expressions refer to the same location is unknown; the
+  # assignment must not be removed
+  a[x][1] = a[y][1]
+  # note: the common trailing [1] sub-expressions are important for this test
+
+  doAssert a[0][1].val == 4
+
+test(0, 1)

From 0ae0cd51b6b9505c27ca35dca4a143fc366f6a63 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Thu, 27 Jun 2024 22:16:34 +0200
Subject: [PATCH 135/169] lower `string`/`float` case statements with MIR pass
 (#1360)

## Summary

Use an MIR pass to lower `string` and `float` case statements into `if`
chains, replacing the C code generator logic.

## Details

* add the `lowerCase` pass to `mirpasses`
* it's currently only enabled for the C target
* the lowering is a straightforward MIR port of the code generation
  previously implemented by `cgen` for `string`/`float` case statements
* the `cgen` handling for `string` and `float` case statements is
  removed

---------

Co-authored-by: Saem Ghani <saemghani+github@gmail.com>
---
 compiler/backend/ccgstmts.nim |  61 +--------------
 compiler/mir/mirconstr.nim    |   4 +
 compiler/mir/mirpasses.nim    | 139 ++++++++++++++++++++++++++++++++++
 compiler/mir/mirtrees.nim     |   7 +-
 4 files changed, 150 insertions(+), 61 deletions(-)

diff --git a/compiler/backend/ccgstmts.nim b/compiler/backend/ccgstmts.nim
index bd918b3d4f2..81dbebafc39 100644
--- a/compiler/backend/ccgstmts.nim
+++ b/compiler/backend/ccgstmts.nim
@@ -12,8 +12,6 @@
 const
   RangeExpandLimit = 256      # do not generate ranges
                               # over 'RangeExpandLimit' elements
-  stringCaseThreshold = 8
-    # above X strings a hash-switch for strings is generated
 
 proc startBlockInternal(p: BProc) =
   let result = p.blocks.len
@@ -213,52 +211,6 @@ template genIfForCaseUntil(p: BProc, t: CgNode,
     else:
       linefmt(p, cpsStmts, "goto $1;$n", [t[i][^1].label])
 
-template genCaseGeneric(p: BProc, t: CgNode,
-                    rangeFormat, eqFormat: FormatStr) =
-  var a: TLoc
-  initLocExpr(p, t[0], a)
-  genIfForCaseUntil(p, t, rangeFormat, eqFormat, t.len-1, a)
-
-proc genCaseStringBranch(p: BProc, b: CgNode, e: TLoc, labl: BlockId,
-                         branches: var openArray[Rope]) =
-  var x: TLoc
-  for i in 0..<b.len - 1:
-    assert(b[i].kind != cnkRange)
-    initLocExpr(p, b[i], x)
-    assert(b[i].kind == cnkStrLit)
-    var j = int(hashString(p.config, getString(p, b[i])) and high(branches))
-    appcg(p.module, branches[j], "if (#eqStrings($1, $2)) goto $3;$n",
-         [rdLoc(e), rdLoc(x), labl])
-
-proc genStringCase(p: BProc, t: CgNode) =
-  # count how many constant strings there are in the case:
-  var strings = 0
-  for i in 1..<t.len:
-    if isOfBranch(t[i]): inc(strings, t[i].len - 1)
-  if strings > stringCaseThreshold:
-    var bitMask = math.nextPowerOfTwo(strings) - 1
-    var branches: seq[Rope]
-    newSeq(branches, bitMask + 1)
-    var a: TLoc
-    initLocExpr(p, t[0], a) # fist pass: generate ifs+goto:
-    for i in 1..<t.len:
-      if isOfBranch(t[i]):
-        genCaseStringBranch(p, t[i], a, t[i][^1].label, branches)
-      else:
-        # else statement: nothing to do yet
-        discard
-    linefmt(p, cpsStmts, "switch (#hashString($1) & $2) {$n",
-            [rdLoc(a), bitMask])
-    for j in 0..high(branches):
-      if branches[j] != "":
-        lineF(p, cpsStmts, "case $1: $n$2break;$n",
-             [intLiteral(j), branches[j]])
-    lineF(p, cpsStmts, "}$n", []) # else statement:
-    if not isOfBranch(t[^1]):
-      lineCg(p, cpsStmts, "goto $1;$n", [t[^1][0].label])
-
-  else:
-    genCaseGeneric(p, t, "", "if (#eqStrings($1, $2)) goto $3;$n")
 
 proc branchHasTooBigRange(b: CgNode): bool =
   for it in b:
@@ -332,17 +284,10 @@ proc genOrdinalCase(p: BProc, n: CgNode) =
 
 proc genCase(p: BProc, t: CgNode) =
   genLineDir(p, t)
-  case skipTypes(t[0].typ, abstractVarRange).kind
-  of tyString:
-    genStringCase(p, t)
-  of tyFloat..tyFloat64:
-    genCaseGeneric(p, t, "if ($1 >= $2 && $1 <= $3) goto $4;$n",
-                         "if ($1 == $2) goto $3;$n")
+  if t[0].kind == cnkLocal and sfGoto in p.body[t[0].local].flags:
+    genGotoForCase(p, t)
   else:
-    if t[0].kind == cnkLocal and sfGoto in p.body[t[0].local].flags:
-      genGotoForCase(p, t)
-    else:
-      genOrdinalCase(p, t)
+    genOrdinalCase(p, t)
 
 proc bodyCanRaise(p: BProc; n: CgNode): bool =
   case n.kind
diff --git a/compiler/mir/mirconstr.nim b/compiler/mir/mirconstr.nim
index 3b22dcc2105..2be7aeb3bc7 100644
--- a/compiler/mir/mirconstr.nim
+++ b/compiler/mir/mirconstr.nim
@@ -452,6 +452,10 @@ func join*(bu: var MirBuilder, label: LabelId) =
   bu.subTree mnkJoin:
     bu.add MirNode(kind: mnkLabel, label: label)
 
+func goto*(bu: var MirBuilder, label: LabelId) =
+  bu.subTree mnkGoto:
+    bu.add MirNode(kind: mnkLabel, label: label)
+
 template pathNamed*(bu: var MirBuilder, t: TypeId, f: int32, body: untyped) =
   ## Emits a ``mnkPathNamed`` expression.
   bu.subTree MirNode(kind: mnkPathNamed, typ: t):
diff --git a/compiler/mir/mirpasses.nim b/compiler/mir/mirpasses.nim
index c9b3d498899..40c438431a3 100644
--- a/compiler/mir/mirpasses.nim
+++ b/compiler/mir/mirpasses.nim
@@ -38,6 +38,9 @@ import
     idioms
   ]
 
+from std/math import nextPowerOfTwo
+from compiler/backend/ccgutils import hashString
+
 # for type-based alias analysis
 from compiler/sem/aliases import isPartOf, TAnalysisResult
 
@@ -58,6 +61,10 @@ const
   LocSkip = abstractRange + tyUserTypeClasses
     ## types to skip to arrive at the underlying concrete value type
 
+template addCompilerProc(env: var MirEnv, graph: ModuleGraph,
+                         name: string): ProcedureId =
+  env.procedures.add(graph.getCompilerProc(name))
+
 template subTree(bu: var MirBuilder, k: MirNodeKind, t: TypeId,
                  body: untyped) =
   bu.subTree MirNode(kind: k, typ: t):
@@ -652,6 +659,137 @@ proc lowerMove(tree: MirTree, changes: var Changeset) =
     else:
       discard "not relevant"
 
+proc lowerCase(tree: MirTree, graph: ModuleGraph, env: var MirEnv,
+               changes: var Changeset) =
+  ## Lowers case statements with string or float selectors. For large string-
+  ## case statements, a hash-table optimization is used.
+  const stringCaseThreshold = 8
+    ## above X strings a hash-switch for strings is generated
+
+  iterator targets(tree: MirTree, n: NodePosition): (LabelId, NodePosition) =
+    ## Returns all comparison candidate together with their associated jump
+    ## target.
+    for it in tree.subNodes(n, 1):
+      let target = tree[tree.last(it)].label
+      var x = tree.child(it, 0)
+      for _ in 0..<(tree[it].len - 1): # -1 for the label node
+        yield (target, x)
+        x = tree.sibling(x)
+
+  proc genericCase(bu: var MirBuilder, tree: MirTree, n: NodePosition,
+                   eq: TMagic, sel: Value) {.nimcall.} =
+    for (target, it) in tree.targets(n):
+      if tree[it].kind == mnkRange:
+        # only float case-statements can use ranges, so we know that the
+        # operands are floats here
+        var cond = bu.wrapTemp BoolType:
+          bu.buildMagicCall mLeF64, BoolType:
+            bu.emitByVal bu.inline(tree, tree.child(it, 0))
+            bu.emitByVal sel
+
+        bu.buildIf (;bu.use cond):
+          cond = bu.wrapTemp BoolType:
+            bu.buildMagicCall mLeF64, BoolType:
+              bu.emitByVal sel
+              bu.emitByVal bu.inline(tree, tree.child(it, 1))
+
+          # jump to the branch body if the run-time value is within the given
+          # range
+          bu.buildIf (;bu.use cond):
+            bu.goto target
+      else:
+        # single comparison
+        let cond = bu.wrapTemp BoolType:
+          bu.buildMagicCall eq, BoolType:
+            bu.emitByVal sel
+            bu.emitByVal bu.inline(tree, it)
+
+        bu.buildIf (;bu.use cond):
+          bu.goto target
+
+    bu.goto tree[tree.last(tree.last(n))].label # jump to else branch
+
+  for n in search(tree, {mnkCase}):
+    case env.types[tree[n, 0].typ].skipTypes(abstractInst).kind
+    of tyFloat, tyFloat64, tyFloat32:
+      # simple: use the generic lowering
+      changes.replaceMulti(tree, n, bu):
+        let sel = bu.inline(tree, tree.child(n, 0))
+        genericCase(bu, tree, n, mEqF64, sel)
+    of tyString:
+      # count the number of strings:
+      var numStrings = 0
+      for it in tree.subNodes(n, start=1):
+        numStrings += (tree.len(it) - 1) # -1 for the target label
+
+      if numStrings < stringCaseThreshold:
+        # compare against every string
+        changes.replaceMulti(tree, n, bu):
+          let sel = bu.inline(tree, tree.child(n, 0))
+          genericCase(bu, tree, n, mEqStr, sel)
+      else:
+        # reduce the number of string comparisons through usage of a hash
+        # table
+        changes.replaceMulti(tree, n, bu):
+          let bitMask = nextPowerOfTwo(numStrings) - 1
+          var branches: seq[tuple[label: LabelId,
+                                  strings: seq[(NodePosition, LabelId)]]]
+          branches.newSeq(bitMask + 1)
+
+          # sort the string operands into buckets (`branches`) based on their
+          # hash:
+          for (target, it) in tree.targets(n):
+            let bI = hashString(graph.config, env[tree[it].strVal]) and bitMask
+            if branches[bI].strings.len == 0:
+              # the label is allocated on demand
+              branches[bI].label = bu.allocLabel()
+
+            branches[bI].strings.add (it, target)
+
+          let
+            elseLabel = tree[tree.last(tree.last(n))].label
+            typ  = env.types.sizeType
+            sel  = bu.inline(tree, tree.child(n, 0))
+          var hash: Value
+
+          # emit the hash computation:
+          hash = bu.wrapTemp typ:
+            bu.buildCall env.addCompilerProc(graph, "hashString"), typ:
+              bu.emitByVal sel
+          hash = bu.wrapTemp typ:
+            bu.buildMagicCall mBitandI, typ:
+              bu.emitByVal hash
+              bu.emitByVal:
+                literal(mnkIntLit, env.getOrIncl(BiggestInt bitMask), typ)
+
+          # emit the dispatcher over the hash value:
+          bu.subTree mnkCase:
+            bu.use hash
+            for i, b in branches.pairs:
+              bu.subTree mnkBranch:
+                bu.use literal(mnkIntLit, env.getOrIncl(BiggestInt i), typ)
+                if b.strings.len == 0:
+                  bu.add MirNode(kind: mnkLabel, label: elseLabel)
+                else:
+                  bu.add MirNode(kind: mnkLabel, label: b.label)
+
+          # emit the string comparisons:
+          for b in branches.items:
+            if b.strings.len > 0:
+              bu.join b.label
+              for (str, target) in b.strings.items:
+                let cond = bu.wrapTemp BoolType:
+                  bu.buildMagicCall mEqStr, BoolType:
+                    bu.emitByVal sel
+                    bu.emitByVal bu.inline(tree, str)
+
+                bu.buildIf (;bu.use cond):
+                  bu.goto target
+
+              bu.goto elseLabel # jump to the 'else' branch
+    else:
+      discard "keep as is"
+
 proc applyPasses*(body: var MirBody, prc: PSym, env: var MirEnv,
                   graph: ModuleGraph, target: TargetBackend) =
   ## Applies all applicable MIR passes to the body (`tree` and `source`) of
@@ -687,6 +825,7 @@ proc applyPasses*(body: var MirBody, prc: PSym, env: var MirEnv,
       lowerNew(body.code, graph, env, c)
       lowerChecks(body, graph, env, c)
       injectStrPreparation(body.code, graph, env, c)
+      lowerCase(body.code, graph, env, c)
 
   # instrument the body with profiler calls after all lowerings, but before
   # optimization
diff --git a/compiler/mir/mirtrees.nim b/compiler/mir/mirtrees.nim
index 00f9b5b70e5..ad27128e6a8 100644
--- a/compiler/mir/mirtrees.nim
+++ b/compiler/mir/mirtrees.nim
@@ -550,10 +550,11 @@ iterator pairs*(tree: MirTree): (NodePosition, lent MirNode) =
     yield (i.NodePosition, tree[i])
     inc i
 
-iterator subNodes*(tree: MirTree, n: NodePosition): NodePosition =
-  ## Iterates over and yields all direct child nodes of `n`
+iterator subNodes*(tree: MirTree, n: NodePosition; start = 0): NodePosition =
+  ## Returns in order of apperance all direct child nodes of `n`, starting with
+  ## `start`.
   let L = tree[n].len
-  var n = tree.child(n, 0)
+  var n = tree.child(n, start)
   for _ in 0..<L:
     yield n
     n = tree.sibling(n)

From d7353ba6faee6510474541bc95f07bec940c5def Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sat, 29 Jun 2024 02:51:25 +0200
Subject: [PATCH 136/169] sem: correctly type empty containers in macro calls
 (#1361)

## Summary

Internal-only issue. Empty container values passed to `static` macro/
template parameters used empty container types. Now they're converted
to the formal parameter's type.

## Details

* wrap the arguments to `static` macro/template parameters in
  implicit conversions, if needed for the match
* use post-match argument fitting for macro calls
* for a smaller impact, template calls still don't use post-match
  argument fitting
* remove the `vmserialize` workaround for empty set types (which no
  longer reach there now)
---
 compiler/sem/semexprs.nim   |  8 ++++++--
 compiler/sem/sigmatch.nim   | 24 ++++++++++++++++++++----
 compiler/vm/vmserialize.nim |  6 +-----
 3 files changed, 27 insertions(+), 11 deletions(-)

diff --git a/compiler/sem/semexprs.nim b/compiler/sem/semexprs.nim
index a810fd6033d..e9ae4293edd 100644
--- a/compiler/sem/semexprs.nim
+++ b/compiler/sem/semexprs.nim
@@ -1182,8 +1182,12 @@ proc afterCallActions(c: PContext; n: PNode, flags: TExprFlags): PNode =
   result = n
   let callee = result[0].sym
   case callee.kind
-  of skMacro: result = semMacroExpr(c, result, callee, flags)
-  of skTemplate: result = semTemplateExpr(c, result, callee, flags)
+  of skMacro:
+    result = fitArgTypesPostMatch(c, result)
+    if result.kind != nkError:
+      result = semMacroExpr(c, result, callee, flags)
+  of skTemplate:
+    result = semTemplateExpr(c, result, callee, flags)
   else:
     semFinishOperands(c, result)
     activate(c, result)
diff --git a/compiler/sem/sigmatch.nim b/compiler/sem/sigmatch.nim
index faf78bb9d6d..e14d99681bf 100644
--- a/compiler/sem/sigmatch.nim
+++ b/compiler/sem/sigmatch.nim
@@ -2311,10 +2311,26 @@ proc paramTypesMatchAux(m: var TCandidate, f, a: PType,
       of tyTyped, tyTypeDesc:
         arg
       of tyStatic:
-        if arg.typ.n.isNil:  # no value on the type
-          argSemantized
-        else:                # value on the type
-          arg.typ.n
+        let n =
+          if arg.typ.n.isNil:  # no value on the type
+            argSemantized
+          else:                # value on the type
+            arg.typ.n
+
+        # XXX: the implicit conversion handling is duplicated from the non-
+        #      template/non-macro path. Template and macro arguments shouldn't
+        #      be special-cased like this
+        case r
+        of isEqual: n
+        of isGeneric:
+          if n.typ.isEmptyContainer:
+            implicitConv(nkHiddenStdConv, f[0], n, m, c)
+          else:
+            n
+        of isSubtype:
+          implicitConv(nkHiddenSubConv, f[0], n, m, c)
+        else:
+          implicitConv(nkHiddenStdConv, f[0], n, m, c)
       else:
         argSemantized
     return
diff --git a/compiler/vm/vmserialize.nim b/compiler/vm/vmserialize.nim
index 88f59328e39..ae4b29a558f 100644
--- a/compiler/vm/vmserialize.nim
+++ b/compiler/vm/vmserialize.nim
@@ -94,11 +94,7 @@ proc initFromExpr(dest: LocHandle, tree: MirTree, n: var int, env: MirEnv,
       # subtract the first element's value to make all values zero-based
       toInt(val - first)
 
-    let first =
-      if tree[n].len > 0: firstOrd(c.config, env[tree[n].typ])
-      else:               Zero
-    # XXX: ^^ ``set[empty]``-typed literals reach here, but they shouldn't. The
-    #      len guard works around the issue
+    let first = firstOrd(c.config, env[tree[n].typ])
     iterTree(j):
       let node = next()
       if node.kind == mnkRange:

From 8184c8552f90b60acf70ad544076a2b464e7af21 Mon Sep 17 00:00:00 2001
From: alaviss <leorize+oss@disroot.org>
Date: Sat, 29 Jun 2024 17:36:19 -0500
Subject: [PATCH 137/169] nversion: read version from text file (#1362)

## Summary
Instead of statically encoding the version as a structure, read it from
a text file. This allows tools to modify the version string without
creating invalid NimSkull, and allows for easier rearrangement of the
code in the future.

## Details
* Added validation for version string suffix according to SemVer rules.
* Compiler (base) version is now stored in text form in
  `compiler/version.txt`.
---
 compiler/utils/nversion.nim | 36 ++++++++++++++++++++++++++----------
 compiler/version.txt        |  1 +
 2 files changed, 27 insertions(+), 10 deletions(-)
 create mode 100644 compiler/version.txt

diff --git a/compiler/utils/nversion.nim b/compiler/utils/nversion.nim
index c29ec1787c7..92c010f91bb 100644
--- a/compiler/utils/nversion.nim
+++ b/compiler/utils/nversion.nim
@@ -10,7 +10,7 @@
 # This module contains Nim's version. It is the only place where it needs
 # to be changed.
 
-import std/strscans
+import std/[strscans, strutils]
 
 type
   Version* = object
@@ -18,6 +18,17 @@ type
     suffix*: string ## Optional suffix
     major*, minor*, patch*: int
 
+func isValidSuffix(s: string): bool =
+  ## Return whether `s` represents a valid version suffix.
+  # The validation rules are derived from SemVer's grammar, albeit relaxed.
+  result = true
+  if s.len > 0 and s[0] notin {'+', '-'}:
+    return false
+
+  for ch in s.items:
+    if ch notin {'a'..'z', 'A'..'Z', '0'..'9', '+', '-', '.'}:
+      return false
+
 func `$`*(v: Version): string =
   ## Return a string describing `v`.
   result.addInt v.major
@@ -32,19 +43,24 @@ func parse*(s: string): Version =
   if not scanf(
     s, "$i.$i.$i$*$.",
     result.major, result.minor, result.patch, result.suffix
-  ):
+  ) or not result.suffix.isValidSuffix:
     raise newException(ValueError):
-      "Invalid version string: " & s
+      "Invalid version string: " & s.escape()
+
+const CompilerVersionSuffix* {.strdefine.} = ""
+  ## The suffix to attach to the compiler version. This is meant to be
+  ## declared by build tools to signify development version for example.
+
+proc parseStatic(): Version {.compileTime.} =
+  ## Obtain the compiler version from the version file.
+  result = parse(staticRead("../version.txt").strip())
+  doAssert result.suffix == "", "Compiler version in `version.txt' should not have any suffix"
+  doAssert isValidSuffix(CompilerVersionSuffix)
+  result.suffix = CompilerVersionSuffix
 
 const
   MaxSetElements* = 1 shl 16  # (2^16) to support unicode character sets?
-  CompilerVersionSuffix* {.strdefine.} = ""
-    ## The suffix to attach to the compiler version. This is meant to be
-    ## declared by build tools to signify development version for example.
-  CompilerVersion* = Version(
-    major: 0, minor: 1, patch: 0,
-    suffix: CompilerVersionSuffix
-  )
+  CompilerVersion* = parseStatic()
     ## The compiler version.
   VersionAsString* = $CompilerVersion
   RodFileVersion* = "1223"       # modify this if the rod-format changes!
diff --git a/compiler/version.txt b/compiler/version.txt
new file mode 100644
index 00000000000..6e8bf73aa55
--- /dev/null
+++ b/compiler/version.txt
@@ -0,0 +1 @@
+0.1.0

From eb5fa688e7f7949d26e1b788172f54b095c906aa Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sun, 30 Jun 2024 01:44:31 +0200
Subject: [PATCH 138/169] remove the `.goto` pragma/feature (#1363)

## Summary

The `.goto` pragma is neither documented nor tested, and most of the
compiler is unaware of it. Everything related to the feature is removed
from the compiler.

## Details

* the `.goto` pragma could be used on variables of enum type,
  turning all assignments to the variable into jumps to branches of an
  associated `case` statement
* remove the `sfGoto` symbol flag
* remove the reports associated with the `.goto` pragma
* keep the `wGoto` enum; it's part of the C keyword set
---
 compiler/ast/ast_types.nim      |  1 -
 compiler/ast/report_enums.nim   |  2 --
 compiler/backend/ccgstmts.nim   | 37 ++-------------------------------
 compiler/front/cli_reporter.nim |  6 ------
 compiler/sem/pragmas.nim        |  6 +-----
 5 files changed, 3 insertions(+), 49 deletions(-)

diff --git a/compiler/ast/ast_types.nim b/compiler/ast/ast_types.nim
index 58770d82c61..4bba6e9b78a 100644
--- a/compiler/ast/ast_types.nim
+++ b/compiler/ast/ast_types.nim
@@ -433,7 +433,6 @@ const
 
   sfNoForward*     = sfRegister       ## forward declarations are not required (per module)
   sfExperimental*  = sfOverriden      ## module uses the .experimental switch
-  sfGoto*          = sfOverriden      ## var is used for 'goto' code generation
   sfWrittenTo*     = sfBorrow         ## param is assigned to
   sfEscapes*       = sfProcvar        ## param escapes
   sfBase*          = sfDiscriminant
diff --git a/compiler/ast/report_enums.nim b/compiler/ast/report_enums.nim
index 9c8a2956ebd..6889e5befcf 100644
--- a/compiler/ast/report_enums.nim
+++ b/compiler/ast/report_enums.nim
@@ -630,9 +630,7 @@ type
     # Codegen
     rsemRttiRequestForIncompleteObject
     rsemExpectedNimcallProc
-    rsemDisallowedRangeForComputedGoto
     rsemExpectedParameterForJsPattern
-    rsemExpectedLiteralForGoto
     rsemRequiresDeepCopyEnabled
     rsemDisallowedOfForPureObjects
     rsemCannotCodegenCompiletimeProc
diff --git a/compiler/backend/ccgstmts.nim b/compiler/backend/ccgstmts.nim
index 81dbebafc39..7e49197cea6 100644
--- a/compiler/backend/ccgstmts.nim
+++ b/compiler/backend/ccgstmts.nim
@@ -62,24 +62,11 @@ proc endBlock(p: BProc) =
   blockEnd.addf("}$n", [])
   endBlock(p, blockEnd)
 
-proc genGotoVar(p: BProc; value: CgNode) =
-  case value.kind
-  of cnkIntLit, cnkUIntLit:
-    lineF(p, cpsStmts, "goto NIMSTATE_$#;$n", [value.intVal.rope])
-  else:
-    localReport(p.config, value.info, reportSem rsemExpectedLiteralForGoto)
-
 proc genBracedInit(p: BProc, n: CgNode; optionalType: PType): Rope
 
 proc genSingleVar(p: BProc, vn, value: CgNode) =
   ## Generates and emits the C code for the definition statement of a local.
   let v = vn.local
-
-  if sfGoto in p.body[v].flags:
-    # translate 'var state {.goto.} = X' into 'goto LX':
-    genGotoVar(p, value)
-    return
-
   assignLocalVar(p, vn)
   # default-initialize the local if no initial value is supplied. Automatic
   # initialization is also ommitted when the `value` expression is a
@@ -108,20 +95,6 @@ proc genIf(p: BProc, n: CgNode) =
   lineF(p, cpsStmts, "if ($1)$n", [rdLoc(a)])
   startBlock(p)
 
-proc genGotoForCase(p: BProc; caseStmt: CgNode) =
-  for i in 1..<caseStmt.len:
-    startBlock(p)
-    let it = caseStmt[i]
-    for j in 0..<it.len-1:
-      if it[j].kind == cnkRange:
-        localReport(p.config, it.info, reportSem rsemDisallowedRangeForComputedGoto)
-        return
-      let val = getOrdValue(it[j])
-      lineF(p, cpsStmts, "NIMSTATE_$#:$n", [val.rope])
-
-    lineCg(p, cpsStmts, "goto $1;$n", [it[^1].label])
-    endBlock(p)
-
 proc exit(n: CgNode): CgNode =
   # XXX: exists as a convenience for overflow check, index check, etc.
   #      code gen. Should be removed once those are fully lowered prior
@@ -284,10 +257,7 @@ proc genOrdinalCase(p: BProc, n: CgNode) =
 
 proc genCase(p: BProc, t: CgNode) =
   genLineDir(p, t)
-  if t[0].kind == cnkLocal and sfGoto in p.body[t[0].local].flags:
-    genGotoForCase(p, t)
-  else:
-    genOrdinalCase(p, t)
+  genOrdinalCase(p, t)
 
 proc bodyCanRaise(p: BProc; n: CgNode): bool =
   case n.kind
@@ -429,10 +399,7 @@ when false:
     expr(p, call, d)
 
 proc genAsgn(p: BProc, e: CgNode) =
-  if e[0].kind == cnkLocal and sfGoto in p.body[e[0].local].flags:
-    genLineDir(p, e)
-    genGotoVar(p, e[1])
-  else:
+  if true:
     let le = e[0]
     let ri = e[1]
     var a: TLoc
diff --git a/compiler/front/cli_reporter.nim b/compiler/front/cli_reporter.nim
index d4d2242b57b..73c692a24b2 100644
--- a/compiler/front/cli_reporter.nim
+++ b/compiler/front/cli_reporter.nim
@@ -1993,16 +1993,10 @@ proc reportBody*(conf: ConfigRef, r: SemReport): string =
     of rsemRequiresDeepCopyEnabled:
       result = "for --gc:arc|orc 'deepcopy' support has to be enabled with --deepcopy:on"
 
-    of rsemExpectedLiteralForGoto:
-      result = "'goto' target must be a literal value"
-
     of rsemExpectedParameterForJsPattern:
       result =  "wrong importjs pattern; expected parameter at position " &
         $r.countMismatch.expected & " but got only: " & $r.countMismatch.got
 
-    of rsemDisallowedRangeForComputedGoto:
-      result = "range notation not available for computed goto"
-
     of rsemExpectedNimcallProc:
       result = r.symstr & " needs to have the 'nimcall' calling convention"
 
diff --git a/compiler/sem/pragmas.nim b/compiler/sem/pragmas.nim
index 486439bdf25..92b07857d56 100644
--- a/compiler/sem/pragmas.nim
+++ b/compiler/sem/pragmas.nim
@@ -119,7 +119,7 @@ const
     wMagic, wHeader, wCompilerProc, wCore, wDynlib,
     wNoInit, wCompileTime, wGlobal,
     wGensym, wInject,
-    wGuard, wGoto, wCursor, wNoalias, wAlign}
+    wGuard, wCursor, wNoalias, wAlign}
   constPragmas* = declPragmas + {wHeader, wMagic,
     wGensym, wInject,
     wIntDefine, wStrDefine, wBoolDefine, wCompilerProc, wCore}
@@ -1446,10 +1446,6 @@ proc applySymbolPragma(c: PContext, sym: PSym, it: PNode): PNode =
             result = sym.guard.ast
           else:
             result = it
-      of wGoto:
-        result = noVal(c, it)
-        assert sym.kind in {skVar, skLet}
-        sym.flags.incl sfGoto
       of wExportNims:
           # XXX: modifying the module graph during application of a symbol
           #      operator doesn't seem like a good idea...

From 6aa257c1f777cfa92d15d3a4a01be6e9a0bbb0ac Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Mon, 1 Jul 2024 01:24:25 +0200
Subject: [PATCH 139/169] mirbodies: track next label in `MirBody` (#1365)

## Summary

Track the ID to use for new labels in `MirBody`. This greatly reduces
the overhead of `Changeset` creation, since the source body doesn't
have to be scanned.

## Details

* track the next label ID with `MirBody.nextLabel`
* on creation, the `Changeset` next label ID is initialized from the ID
  stored with the `MirBody`
* add the `createBody` routine for creating a proper `MirBody` from a
  `MirBuilder` instance
* use `createBody` to replace manual `MirBody` construction

### Performance

Compile times are effectively unaffected. A small improvement of a few
milliseconds is measurable, but it's insignificant. However, using more
batches in the future will make the improvement more pronounced.
---
 compiler/backend/backends.nim  | 19 ++++++++-----------
 compiler/mir/mirbodies.nim     |  4 ++++
 compiler/mir/mirchangesets.nim | 11 +++--------
 compiler/mir/mirconstr.nim     |  8 +++++++-
 compiler/mir/mirgen.nim        |  7 ++-----
 5 files changed, 24 insertions(+), 25 deletions(-)

diff --git a/compiler/backend/backends.nim b/compiler/backend/backends.nim
index 157300f4aa1..c9ab7bde9a2 100644
--- a/compiler/backend/backends.nim
+++ b/compiler/backend/backends.nim
@@ -420,13 +420,13 @@ proc produceFragmentsForGlobals(
       bu.setSource(m.add(n))
       bu.subTree mnkScope: discard
 
-  func finish(bu: sink MirBuilder, m: var SourceMap, n: PNode
-             ): auto {.nimcall.} =
+  func finish(bu: sink MirBuilder, n: PNode, body: var MirBody) {.nimcall.} =
+    var map = move body.source
     if bu.front.len > 0:
-      bu.setSource(m.add(n))
+      bu.setSource(map.add(n))
       bu.subTree mnkEndScope: discard
-    # we're creating a body here, so there is no list of locals yet
-    result = finish(bu, default(Store[LocalId, Local]))
+
+    body = createBody(bu, map)
 
   var init, deinit, threadDeinit: MirBuilder
 
@@ -459,12 +459,9 @@ proc produceFragmentsForGlobals(
           # also emit a destructor into the thread-deinit fragment:
           destroyOp(threadDeinit, result.threadDeinit.source)
 
-  (result.init.code, result.init.locals) =
-    finish(init, result.init.source, graph.emptyNode)
-  (result.deinit.code, result.deinit.locals) =
-    finish(deinit, result.deinit.source, graph.emptyNode)
-  (result.threadDeinit.code, result.threadDeinit.locals) =
-    finish(threadDeinit, result.threadDeinit.source, graph.emptyNode)
+  finish(init, graph.emptyNode, result.init)
+  finish(deinit, graph.emptyNode, result.deinit)
+  finish(threadDeinit, graph.emptyNode, result.threadDeinit)
 
 # ----- dynlib handling -----
 
diff --git a/compiler/mir/mirbodies.nim b/compiler/mir/mirbodies.nim
index 1105b95b1ae..9650546d89b 100644
--- a/compiler/mir/mirbodies.nim
+++ b/compiler/mir/mirbodies.nim
@@ -45,6 +45,10 @@ type
     ## associated with a body, such as how far the lowering is along.
     locals*: Locals
       ## all locals part of the body
+    nextLabel*: LabelId
+      ## the ID to use for a new label. Incremented when allocating a new
+      ## label
+
     source*: SourceMap
     code*: MirTree
 
diff --git a/compiler/mir/mirchangesets.nim b/compiler/mir/mirchangesets.nim
index c629e725a41..ceca8770e88 100644
--- a/compiler/mir/mirchangesets.nim
+++ b/compiler/mir/mirchangesets.nim
@@ -50,14 +50,8 @@ template remove*(c: var Changeset, tree: MirTree, at: NodePosition) =
 func initChangeset*(body: MirBody): Changeset =
   ## Sets up a changeset for `body`. The changeset either needs to be
   ## discarded, or applied to the same ``MirBody`` instance it was created for.
-  result = Changeset(locals: fork(body.locals))
-  # compute the next ID to use for new labels:
-  for i, n in body.code.pairs:
-    case n.kind
-    of mnkLabel:
-      result.nextLabel = max(n.label.uint32 + 1, result.nextLabel)
-    else:
-      discard
+  Changeset(locals: fork(body.locals),
+            nextLabel: body.nextLabel.uint32)
 
 func initBuilder(c: var Changeset, buffer: var MirNodeSeq,
                  info: SourceId): MirBuilder =
@@ -99,3 +93,4 @@ func apply*(body: var MirBody, c: sink Changeset) =
   ## Applies the changeset `c` to `body`.
   apply(body.code, prepare(move c.inner))
   join(body.locals, move c.locals)
+  body.nextLabel = LabelId(c.nextLabel)
diff --git a/compiler/mir/mirconstr.nim b/compiler/mir/mirconstr.nim
index 2be7aeb3bc7..8f0b61a1817 100644
--- a/compiler/mir/mirconstr.nim
+++ b/compiler/mir/mirconstr.nim
@@ -7,7 +7,8 @@ import
   ],
   compiler/mir/[
     mirtrees,
-    mirbodies
+    mirbodies,
+    sourcemaps
   ],
   compiler/utils/[
     containers,
@@ -558,3 +559,8 @@ func finish*(bu: sink MirBuilder, locals: sink Store[LocalId, Local]): auto =
   result = (tree, move locals)
   # join the partial store into the base store:
   join(result[1], partial)
+
+proc createBody*(builder: sink MirBuilder, sm: sink SourceMap): MirBody =
+  ## Creates a MIR body from `builder` and `sm`.
+  result = MirBody(nextLabel: builder.nextLabel.LabelId, source: sm)
+  (result.code, result.locals) = builder.finish(default Store[LocalId, Local])
diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index 1ec2b007290..9392ae1a948 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -2395,9 +2395,7 @@ proc generateCode*(graph: ModuleGraph, env: var MirEnv, owner: PSym,
 
   env = c.env
 
-  # move the buffers into the result body
-  let (code, locals) = finish(move c.builder, default(Store[LocalId, Local]))
-  MirBody(locals: locals, source: move c.sp.map, code: code)
+  createBody(move c.builder, move c.sp.map)
 
 proc exprToMir*(graph: ModuleGraph, env: var MirEnv,
                 config: TranslationConfig, e: PNode): MirBody =
@@ -2428,8 +2426,7 @@ proc exprToMir*(graph: ModuleGraph, env: var MirEnv,
 
   env = move c.env
 
-  let (code, locals) = finish(move c.builder, default(Store[LocalId, Local]))
-  MirBody(locals: locals, source: move c.sp.map, code: code)
+  createBody(move c.builder, move c.sp.map)
 
 proc constDataToMir*(env: var MirEnv, n: PNode): MirTree =
   ## Translates the construction expression AST `n` representing some

From 216a5598a322d5cfd79028728158963bbdf73b67 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Mon, 1 Jul 2024 01:32:29 +0200
Subject: [PATCH 140/169] mirpasses: split assignments with MIR pass (#1366)

## Summary

* use a MIR pass to split assignments involving potentially raising calls
* for the C backend, the compiler employing RVO no longer affects
  observable behaviour

## Details

* add the `splitAssignments` MIR pass and enable it for the C backend
* the condition of when to split assignments is the same as
  `ccgcalls.isHarmlessStore`, with the difference that
  `splitAssignments` also considers projections of locals when
  optimizing away a split (not only unprojected locals)
* `ccgcalls` can now assume that all assignments are safe; everything
  related to assignment splitting is removed

### Observable stores

When the RHS of an assignment was an RVO-using call, the assignment was
*not* split, resulting in an "observable store" if the call raised an
exception after having modified its `result` variable.

The `splitAssignments` pass splits *all* qualifying assignments,
regardless of whether the call uses RVO. This incurs an additional
memory copy for RVO-using calls but also makes the behaviour "correct".
`reportObservableStore` is obsolete and thus removed.
---
 compiler/backend/ccgcalls.nim   | 98 +--------------------------------
 compiler/mir/mirpasses.nim      | 34 ++++++++++++
 tests/exception/tassignment.nim | 13 +----
 3 files changed, 39 insertions(+), 106 deletions(-)

diff --git a/compiler/backend/ccgcalls.nim b/compiler/backend/ccgcalls.nim
index b2796ada2df..c1a7ecba453 100644
--- a/compiler/backend/ccgcalls.nim
+++ b/compiler/backend/ccgcalls.nim
@@ -10,70 +10,6 @@
 
 ## included from cgen.nim
 
-proc reportObservableStore(p: BProc; le, ri: CgNode) =
-  ## Reports the ``rsemObservableStores`` hint when the called procedure can
-  ## exit with an exception and `le` is something to which an assignment is
-  ## observable in the exception-raised case.
-  proc locationEscapes(p: BProc; le: CgNode; inTryStmt: bool): bool =
-    var n = le
-    while true:
-      # do NOT follow ``cnkDerefView`` here!
-      case n.kind
-      of cnkGlobal:
-        # mutation of a global -> the mutation escapes
-        return true
-      of cnkLocal:
-        # if the local is used within an 'except' or 'finally', a mutation of
-        # it through a procedure that eventually raises is also an observable
-        # store
-        return inTryStmt and sfUsedInFinallyOrExcept in p.body[n.local].flags
-      of cnkFieldAccess, cnkArrayAccess, cnkTupleAccess:
-        n = n[0]
-      of cnkObjUpConv, cnkObjDownConv, cnkLvalueConv:
-        n = n.operand
-      else:
-        # cannot analyse the location; assume the worst
-        return true
-
-  # XXX: this whole procedure needs to be removed; RVO calls must only be used
-  #      if safe
-  var inTryStmt = false
-  # analyse the target to check whether a local exception handler or finally
-  # is reached
-  case ri[^1].kind
-  of cnkLabel:
-    inTryStmt = true
-  of cnkTargetList:
-    for it in ri[^1].items:
-      if it.kind == cnkLabel:
-        inTryStmt = true
-        break
-  else:
-    discard "no local exception handler or finally is reached"
-
-  if le != nil and locationEscapes(p, le, inTryStmt):
-    localReport(p.config, le.info, reportSem rsemObservableStores)
-
-proc observableInExcept(n: CgNode): bool =
-  ## Computes whether the call expression `n` has an exceptional exit
-  ## that leads to an exception handler within the current procedure.
-  let target = n[^1]
-  case target.kind
-  of cnkLabel:      true # can only be an exception handler (of finally)
-  of cnkTargetList: target[^1].kind == cnkLabel
-  else:
-    unreachable()
-
-proc isHarmlessStore(p: BProc; ri: CgNode, d: TLoc): bool =
-  if d.k in {locTemp, locNone} or ri.kind != cnkCheckedCall:
-    result = true
-  elif d.k == locLocalVar and not observableInExcept(ri):
-    # we cannot observe a store to a local variable if the current proc
-    # has no error handler:
-    result = true
-  else:
-    result = false
-
 proc exitCall(p: BProc, call: CgNode) =
   ## Emits the exceptional control-flow related post-call logic.
   let isNoReturn = call[0].kind == cnkProc and
@@ -103,7 +39,6 @@ proc exitCall(p: BProc, call: CgNode) =
 
 proc fixupCall(p: BProc, le, ri: CgNode, d: var TLoc,
                callee, params: Rope) =
-  let canRaise = ri.kind == cnkCheckedCall
   genLineDir(p, ri)
   var pl = callee & ~"(" & params
   # getUniqueType() is too expensive here:
@@ -114,9 +49,6 @@ proc fixupCall(p: BProc, le, ri: CgNode, d: var TLoc,
       # the destination is guaranteed to be either a temporary or an lvalue
       # that can be modified in-place
       if true:
-        if d.k notin {locTemp, locNone} and canRaise:
-          reportObservableStore(p, le, ri)
-
         # resetting the result location is the responsibility of the called
         # procedure
         if d.k == locNone:
@@ -127,7 +59,7 @@ proc fixupCall(p: BProc, le, ri: CgNode, d: var TLoc,
         exitCall(p, ri)
     else:
       pl.add(~")")
-      if isHarmlessStore(p, ri, d):
+      if true:
         if d.k == locNone: getTemp(p, typ[0], d)
         assert(d.t != nil)        # generate an assignment to d:
         var list: TLoc
@@ -135,15 +67,6 @@ proc fixupCall(p: BProc, le, ri: CgNode, d: var TLoc,
         list.r = pl
         genAssignment(p, d, list)
         exitCall(p, ri)
-      else:
-        var tmp: TLoc
-        getTemp(p, typ[0], tmp)
-        var list: TLoc
-        initLoc(list, locCall, d.lode, OnUnknown)
-        list.r = pl
-        genAssignment(p, tmp, list)
-        exitCall(p, ri)
-        genAssignment(p, d, tmp)
   else:
     pl.add(~");$n")
     line(p, cpsStmts, pl)
@@ -284,16 +207,12 @@ proc genClosureCall(p: BProc, le, ri: CgNode, d: var TLoc) =
       lineF(p, cpsStmts, PatProc & ";$n", [rdLoc(op), pl, pl.addComma, rawProc])
 
   let rawProc = getClosureType(p.module, typ, clHalf)
-  let canRaise = ri.kind == cnkCheckedCall
   if typ[0] != nil:
     if isInvalidReturnType(p.config, typ[0]):
       if numArgs(ri) > 0: pl.add(~", ")
       # the destination is guaranteed to be either a temporary or an lvalue
       # that can be modified in-place
       if true:
-        if d.k notin {locTemp, locNone} and canRaise:
-          reportObservableStore(p, le, ri)
-
         # resetting the result location is the responsibility of the called
         # procedure
         if d.k == locNone:
@@ -301,7 +220,7 @@ proc genClosureCall(p: BProc, le, ri: CgNode, d: var TLoc) =
         pl.add(addrLoc(p.config, d))
         genCallPattern()
         exitCall(p, ri)
-    elif isHarmlessStore(p, ri, d):
+    else:
       if d.k == locNone: getTemp(p, typ[0], d)
       assert(d.t != nil)        # generate an assignment to d:
       var list: TLoc
@@ -312,19 +231,6 @@ proc genClosureCall(p: BProc, le, ri: CgNode, d: var TLoc) =
         list.r = PatProc % [rdLoc(op), pl, pl.addComma, rawProc]
       genAssignment(p, d, list)
       exitCall(p, ri)
-    else:
-      var tmp: TLoc
-      getTemp(p, typ[0], tmp)
-      assert(d.t != nil)        # generate an assignment to d:
-      var list: TLoc
-      initLoc(list, locCall, d.lode, OnUnknown)
-      if tfIterator in typ.flags:
-        list.r = PatIter % [rdLoc(op), pl, pl.addComma, rawProc]
-      else:
-        list.r = PatProc % [rdLoc(op), pl, pl.addComma, rawProc]
-      genAssignment(p, tmp, list)
-      exitCall(p, ri)
-      genAssignment(p, d, tmp)
   else:
     genCallPattern()
     exitCall(p, ri)
diff --git a/compiler/mir/mirpasses.nim b/compiler/mir/mirpasses.nim
index 40c438431a3..cbb5ab38bf8 100644
--- a/compiler/mir/mirpasses.nim
+++ b/compiler/mir/mirpasses.nim
@@ -790,6 +790,38 @@ proc lowerCase(tree: MirTree, graph: ModuleGraph, env: var MirEnv,
     else:
       discard "keep as is"
 
+proc splitAssignments(tree: MirTree, changes: var Changeset) =
+  ## Turns assignments such as:
+  ##   x = call(...) -> [L1]
+  ## into:
+  ##   def _1 = call(...) -> [L1]
+  ##   x = move _1
+  ##
+  ## The idea is to allow for code generators using error-flag-based exception
+  ## handling to rely on assigning the call result directly to the destination
+  ## being safe (as in, not affecting observable behaviour).
+  for n in search(tree, {mnkCheckedCall}):
+    let p = tree.parent(n)
+    if tree[p].kind in {mnkAsgn, mnkInit, mnkSwitch}:
+      let target = tree.last(n)
+      const Locals = {mnkTemp, mnkLocal}
+      # * is the destination not a local?
+      # * if the destination is a local, does the exceptional path enter a
+      #   local exception handler?
+      if tree[tree.getRoot(tree.operand(p, 0))].kind notin Locals or
+         tree[target].kind != mnkTargetList or
+         tree[tree.last(target)].kind != mnkResume:
+        # future direction: this can be optimized. The assignment only needs to
+        # be split if the assignment destination's value is observed on the
+        # exceptional control-flow path
+        var tmp: Value
+        changes.insert(tree, tree.getStmt(n), n, bu):
+          tmp = bu.wrapTemp tree[n].typ:
+            bu.emitFrom(tree, n)
+        changes.replaceMulti(tree, n, bu):
+          bu.subTree mnkMove:
+            bu.use tmp
+
 proc applyPasses*(body: var MirBody, prc: PSym, env: var MirEnv,
                   graph: ModuleGraph, target: TargetBackend) =
   ## Applies all applicable MIR passes to the body (`tree` and `source`) of
@@ -802,6 +834,8 @@ proc applyPasses*(body: var MirBody, prc: PSym, env: var MirEnv,
       apply(body, c)
 
   if target == targetC:
+    batch:
+      splitAssignments(body.code, c)
     batch:
       # only the C code generator employs the return-value optimization (=RVO)
       # at the moment
diff --git a/tests/exception/tassignment.nim b/tests/exception/tassignment.nim
index ef8877389aa..ca974e83ea7 100644
--- a/tests/exception/tassignment.nim
+++ b/tests/exception/tassignment.nim
@@ -18,16 +18,9 @@ block unobservable_rvo_assignment:
     try:
       x = raiseEx(x)
     except CatchableError:
-      when defined(c):
-        # XXX: the C backend is the only one using RVO at the moment
-        doAssert x[0] == 1, "the behaviour is correct now; fix the assert"
-      else:
-        doAssert x[0] == 0, "handler observed changed value"
-
-    when defined(c):
-      doAssert x[0] == 1, "the behaviour is correct now; fix the assert"
-    else:
-      doAssert x[0] == 0, "following statement observed changed value"
+      doAssert x[0] == 0, "handler observed changed value"
+
+    doAssert x[0] == 0, "following statement observed changed value"
 
   test()
 

From 35509cb01616cfad032822d249cf16ee03a67005 Mon Sep 17 00:00:00 2001
From: Adam Sherwood <43248857+theSherwood@users.noreply.github.com>
Date: Mon, 1 Jul 2024 15:41:43 -0600
Subject: [PATCH 141/169] sem: proper error when alignof is called on generic
 type (#1367)

## Summary
* `alignof` calls on generic arguments resulted in
  `Fatal: Internal unreachable code executed` (C backend)
* This fix causes the compiler to report a proper error in such cases:
  `<type> is not a concrete type`

## Details
* To do this we have to check that the argument to `alignof` is a
  concrete type before it reaches the backend.
* We add `semAlignOf` to do this.
* Handles overloaded `alignof`.
---
 compiler/sem/semmagic.nim                           | 11 ++++++++++-
 .../generics/talignof_generic_error.nim             | 10 ++++++++++
 .../generics/talignof_generic_error_overloaded.nim  | 13 +++++++++++++
 3 files changed, 33 insertions(+), 1 deletion(-)
 create mode 100644 tests/lang_callable/generics/talignof_generic_error.nim
 create mode 100644 tests/lang_callable/generics/talignof_generic_error_overloaded.nim

diff --git a/compiler/sem/semmagic.nim b/compiler/sem/semmagic.nim
index 663d2ea7870..7c30b089356 100644
--- a/compiler/sem/semmagic.nim
+++ b/compiler/sem/semmagic.nim
@@ -61,6 +61,15 @@ proc semSizeOf(c: PContext, n: PNode): PNode =
     result = c.config.newError(n, PAstDiag(kind: adSemMagicExpectTypeOrValue,
                                             magic: mSizeOf))
 
+proc semAlignOf(c: PContext, n: PNode): PNode =
+  if containsGenericType(n[1].typ):
+    # report the type, not the typedesc
+    n[1] = c.config.newError(n[1], PAstDiag(kind: adSemTIsNotAConcreteType,
+                                            wrongType: n[1].typ[0]))
+    result = c.config.wrapError(n)
+  else:
+    result = foldAlignOf(c.config, n, n)
+
 type
   SemAsgnMode = enum asgnNormal, noOverloadedSubscript, noOverloadedAsgn
 
@@ -422,7 +431,7 @@ proc magicsAfterOverloadResolution(c: PContext, n: PNode,
   of mSizeOf:
     result = semSizeOf(c, n)
   of mAlignOf:
-    result = foldAlignOf(c.config, n, n)
+    result = semAlignOf(c, n)
   of mOffsetOf:
     result = foldOffsetOf(c.config, n, n)
   of mArrGet:
diff --git a/tests/lang_callable/generics/talignof_generic_error.nim b/tests/lang_callable/generics/talignof_generic_error.nim
new file mode 100644
index 00000000000..c4242990b81
--- /dev/null
+++ b/tests/lang_callable/generics/talignof_generic_error.nim
@@ -0,0 +1,10 @@
+discard """
+  errormsg: "'GenericType' is not a concrete type"
+  line: 10
+"""
+
+type
+  GenericType[K, V] = object
+    field: (K, V)
+
+let alignment = alignof(GenericType)
diff --git a/tests/lang_callable/generics/talignof_generic_error_overloaded.nim b/tests/lang_callable/generics/talignof_generic_error_overloaded.nim
new file mode 100644
index 00000000000..e7f8c43471a
--- /dev/null
+++ b/tests/lang_callable/generics/talignof_generic_error_overloaded.nim
@@ -0,0 +1,13 @@
+discard """
+  errormsg: "'GenericType' is not a concrete type"
+  line: 13
+"""
+
+type
+  GenericType[K, V] = object
+    field: (K, V)
+
+# Overload alignof
+proc alignof(a, b: int) = discard
+
+let alignment = alignof(GenericType)

From 70d59b544f11cccf5e9a570e23f133b70a740a82 Mon Sep 17 00:00:00 2001
From: alaviss <leorize+oss@disroot.org>
Date: Tue, 2 Jul 2024 13:29:43 -0500
Subject: [PATCH 142/169] publisher: use actions/download-artifact directly
 (#1364)

## Summary
Instead of depending on a third-party action to download built
artifacts, use GitHub's CLI to search for the wanted ID and first-party
actions to download the wanted artifacts.

## Details
* Replaced usage of  `dawidd6/action-download-artifact`  with
`actions/download-artifact` .

---------

Co-authored-by: zerbina <100542850+zerbina@users.noreply.github.com>
---
 .github/workflows/publisher.yml | 58 ++++++++++++++++++++-------------
 1 file changed, 35 insertions(+), 23 deletions(-)

diff --git a/.github/workflows/publisher.yml b/.github/workflows/publisher.yml
index ae4eb4b8884..f940fb7a183 100644
--- a/.github/workflows/publisher.yml
+++ b/.github/workflows/publisher.yml
@@ -28,47 +28,64 @@ jobs:
       # Publish action needs a checkout
       - uses: actions/checkout@v4
 
+      - name: Obtain latest successful run id
+        id: finder
+        run: |
+          run_id=$(gh run list \
+            -c "$COMMIT" \
+            -w "$WORKFLOW" \
+            -s "$CONCLUSION" \
+            --limit 1 \
+            --json databaseId \
+            --jq '.[].databaseId')
+          if [[ -z $run_id ]]; then
+            echo "::error::Could not find any CI run for commit $COMMIT"
+            exit 1
+          fi
+          echo "run_id=$run_id" >> "$GITHUB_OUTPUT"
+        env:
+          COMMIT: ${{ github.event.after }}
+          WORKFLOW: ci.yml
+          CONCLUSION: success
+          GH_TOKEN: ${{ github.token }}
+
       # Download the latest instance of artifacts from a build done previously
       - name: Download generated docs
-        uses: dawidd6/action-download-artifact@v6
+        uses: actions/download-artifact@v4
         with:
-          workflow: ci.yml
-          workflow_conclusion: success
-          commit: ${{ github.event.after }}
+          run-id: ${{ steps.finder.outputs.run_id }}
           # Keep up-to-date with ci.yml
           name: Generated docs
           path: doc/html
+          github-token: ${{ github.token }}
 
       - name: Download generated source archive
-        uses: dawidd6/action-download-artifact@v6
+        uses: actions/download-artifact@v4
         with:
-          workflow: ci.yml
-          workflow_conclusion: success
-          commit: ${{ github.event.after }}
+          run-id: ${{ steps.finder.outputs.run_id }}
           # Keep up-to-date with ci.yml
           name: source archive
           path: release-staging
+          github-token: ${{ github.token }}
 
       - name: Download generated release binaries
-        uses: dawidd6/action-download-artifact@v6
+        uses: actions/download-artifact@v4
         with:
-          workflow: ci.yml
-          workflow_conclusion: success
-          commit: ${{ github.event.after }}
+          run-id: ${{ steps.finder.outputs.run_id }}
           # Keep up-to-date with ci.yml
-          name: release binaries.*
-          name_is_regexp: true
+          pattern: release binaries *
+          merge-multiple: "true"
           path: release-staging
+          github-token: ${{ github.token }}
 
       - name: Download release manifest tool
-        uses: dawidd6/action-download-artifact@v6
+        uses: actions/download-artifact@v4
         with:
-          workflow: ci.yml
-          workflow_conclusion: success
-          commit: ${{ github.event.after }}
+          run-id: ${{ steps.finder.outputs.run_id }}
           # Keep up-to-date with ci.yml
           name: release manifest tool
           path: release-staging
+          github-token: ${{ github.token }}
 
       - name: Publish docs
         uses: JamesIves/github-pages-deploy-action@v4.6.1
@@ -79,11 +96,6 @@ jobs:
       - id: release-files
         name: Create release manifest
         run: |
-          # Move the release binaries to the current folder
-          for d in "release binaries "*; do
-            mv -v "$d"/* .
-          done
-
           # Github Artifacts strip executable permissions so it has to be set again
           chmod 755 release_manifest
           # Create a new release manifest

From 3328b9eea4584f025b88e471a6c7138443b3d642 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Fri, 5 Jul 2024 03:03:44 +0200
Subject: [PATCH 143/169] annotate more compiler stacktraces (#1371)

## Summary

Stacktraces from within `mirgen` and `transf` are now also annotated
with the line information of the currently processed node, providing
more context for compiler crashes when using `nim_dbg`.
---
 compiler/mir/mirgen.nim | 6 ++++++
 compiler/sem/transf.nim | 6 ++++++
 2 files changed, 12 insertions(+)

diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index 9392ae1a948..8b6651ae0fc 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -98,6 +98,9 @@ import
 
 import std/options as std_options
 
+when defined(nimCompilerStacktraceHints):
+  import compiler/utils/debugutils
+
 type
   DestFlag = enum
     ## Extra information about an assignment destination. The flags are used to
@@ -400,6 +403,9 @@ proc exprToPmir(c: var TCtx, n: PNode, sink, mutable: bool): PMirExpr =
              n, sink, mutable)
 
 proc genx(c: var TCtx, n: PNode; consume: bool = false) =
+  when defined(nimCompilerStacktraceHints):
+    frameMsg(c.graph.config, n)
+
   let e = exprToPmir(c, n, consume, false)
   genx(c, e, e.high)
 
diff --git a/compiler/sem/transf.nim b/compiler/sem/transf.nim
index ac52b2d65bd..7b96ae60e67 100644
--- a/compiler/sem/transf.nim
+++ b/compiler/sem/transf.nim
@@ -54,6 +54,9 @@ import
 
 from compiler/sem/semdata import makeVarType
 
+when defined(nimCompilerStacktraceHints):
+  import compiler/utils/debugutils
+
 type
   PTransCon = ref object # part of TContext; stackable
     mapping: TIdNodeTable     # mapping from symbols to nodes
@@ -1205,6 +1208,9 @@ proc commonOptimizations*(g: ModuleGraph; idgen: IdGenerator; c: PSym, n: PNode)
       result = n
 
 proc transform(c: PTransf, n: PNode): PNode =
+  when defined(nimCompilerStacktraceHints):
+    frameMsg(c.graph.config, n)
+
   when false:
     var oldDeferAnchor: PNode
     if n.kind in {nkElifBranch, nkOfBranch, nkExceptBranch, nkElifExpr,

From bd3d3dc99680c23b38317d0ca39fce408d1c9a16 Mon Sep 17 00:00:00 2001
From: alaviss <leorize+oss@disroot.org>
Date: Thu, 4 Jul 2024 21:11:45 -0500
Subject: [PATCH 144/169] ci: split docs deployment from publisher and deploy
 directly to pages (#1370)

## Summary
Documentation will now be built using a separate workflow that will be
run whenever publisher finishes. This allows us to use the latest page
deployment code regardless of the commit that triggered publisher.

## Details
* Added  `get`  sub-command to  `release_manifest` , which allows one to
extract binary archive name from a release manifest.
* "Generated docs" artifacts are now removed. Instead the generated
documentation will be obtained from the release tarball for Linux amd64.
This allows docs publishing to run regardless of whether the artifact
for the latest release has expired or not.
* Documentation deployment will now skip  `gh-pages`  branch and deploy
directly using  `actions/deploy-pages` . This allows us to drop the
heavyweight  `gh-pages`  branch and remove the latency between push and
page being deployed.
* Documentation deployment can now be triggered on-demand in case of a
prior failure.
* Documentation deployment will now always be done using latest code in
`devel` .
* Development documentation is also pushed to  `/devel`  sub-folder.
This is preliminary setup for versioned docs in the future.

---------

Co-authored-by: Saem Ghani <saemghani+github@gmail.com>
---
 .github/workflows/ci.yml          |  9 ----
 .github/workflows/deploy-docs.yml | 86 +++++++++++++++++++++++++++++++
 .github/workflows/publisher.yml   | 19 +------
 doc/ci.rst                        | 25 +++++++--
 tools/release_manifest.nim        | 40 ++++++++++++++
 5 files changed, 147 insertions(+), 32 deletions(-)
 create mode 100644 .github/workflows/deploy-docs.yml

diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
index 9674bfec052..0a75e1a04e9 100644
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@@ -549,15 +549,6 @@ jobs:
           echo "archive=$archive" >> $GITHUB_OUTPUT
           echo "metadata=$metadata" >> $GITHUB_OUTPUT
 
-      - name: Upload docs to artifacts
-        if: matrix.target.shared_builder
-        uses: actions/upload-artifact@v4
-        with:
-          # If this name is updated, tweak publisher.yml
-          name: Generated docs
-          path: doc/html/
-          if-no-files-found: error
-
       - name: Upload release package to artifacts
         uses: actions/upload-artifact@v4
         with:
diff --git a/.github/workflows/deploy-docs.yml b/.github/workflows/deploy-docs.yml
new file mode 100644
index 00000000000..64aa5991f93
--- /dev/null
+++ b/.github/workflows/deploy-docs.yml
@@ -0,0 +1,86 @@
+name: Deploy documentation
+on:
+  # Automatically run after any completed publish
+  workflow_run:
+    workflows:
+      - Publish built artifacts
+    types:
+      - completed
+
+  # For manual triggers
+  workflow_dispatch:
+
+# Run every script action in bash
+defaults:
+  run:
+    shell: bash
+
+concurrency: doc-publisher
+
+jobs:
+  deploy:
+    runs-on: ubuntu-latest
+
+    permissions:
+      id-token: write
+      pages: write
+
+    environment:
+      name: github-pages
+      url: ${{ steps.deploy.outputs.page_url }}
+
+    env:
+      # Triplet to obtain docs from
+      DOC_TARGET: x86_64-linux-gnu
+
+    steps:
+      - uses: actions/checkout@v4
+
+      - name: Setup latest compiler
+        uses: nim-works/setup-nimskull@0.1.2
+        with:
+          nimskull-version: "*" # Grab the latest nimskull-version
+
+      - name: Compile release_manifest
+        run: nim c -d:release -o:release_manifest tools/release_manifest.nim
+
+      - id: versions
+        name: Grab latest release version
+        run: |
+          # Stolen from asdf-nimskull
+          sort_versions() {
+            sed 'h; s/[+-]/./g; s/$/.z/; G; s/\n/ /' |
+              LC_ALL=C sort -t. -k 1,1n -k 2,2n -k 3,3n -k 4,4 -k 5,5n | awk '{print $2}'
+          }
+
+          all_tags=$(gh release list --json tagName --jq '.[] | .tagName')
+          latest=$(sort_versions <<<"$all_tags" | tail -n 1)
+
+          echo "Latest devel is: $latest"
+          echo "devel=$latest" >> "$GITHUB_OUTPUT"
+        env:
+          GH_TOKEN: ${{ github.token }}
+
+      - name: Construct devel docs
+        run: |
+          tmpdir=$(mktemp -dp "$RUNNER_TEMP" devel.XXXXXXXXXX)
+          # Get the name of the binary archive for the documentation target
+          release_archive=$(gh release download "$DEVEL" -p manifest.json -O - | ./release_manifest -f /dev/stdin get "$DOC_TARGET")
+          # Download the latest release binary
+          gh release download "$DEVEL" -p "$release_archive" -O "$tmpdir/$release_archive"
+          # Extract and remove the top-level directory
+          tar -C "$tmpdir" -xf "$tmpdir/$release_archive" --strip-components=1
+
+          mkdir -p built-docs
+          cp -rT "$tmpdir/doc/html" built-docs/devel
+          cp -rT "$tmpdir/doc/html" built-docs
+        env:
+          GH_TOKEN: ${{ github.token }}
+          DEVEL: ${{ steps.versions.outputs.devel }}
+
+      - uses: actions/upload-pages-artifact@v3
+        with:
+          path: built-docs/
+
+      - id: deploy
+        uses: actions/deploy-pages@v4
diff --git a/.github/workflows/publisher.yml b/.github/workflows/publisher.yml
index f940fb7a183..5d0125ed76a 100644
--- a/.github/workflows/publisher.yml
+++ b/.github/workflows/publisher.yml
@@ -25,9 +25,6 @@ jobs:
       url: ${{ steps.release.outputs.url }}
 
     steps:
-      # Publish action needs a checkout
-      - uses: actions/checkout@v4
-
       - name: Obtain latest successful run id
         id: finder
         run: |
@@ -48,17 +45,9 @@ jobs:
           WORKFLOW: ci.yml
           CONCLUSION: success
           GH_TOKEN: ${{ github.token }}
+          GH_REPO: ${{ github.repository }}
 
       # Download the latest instance of artifacts from a build done previously
-      - name: Download generated docs
-        uses: actions/download-artifact@v4
-        with:
-          run-id: ${{ steps.finder.outputs.run_id }}
-          # Keep up-to-date with ci.yml
-          name: Generated docs
-          path: doc/html
-          github-token: ${{ github.token }}
-
       - name: Download generated source archive
         uses: actions/download-artifact@v4
         with:
@@ -87,12 +76,6 @@ jobs:
           path: release-staging
           github-token: ${{ github.token }}
 
-      - name: Publish docs
-        uses: JamesIves/github-pages-deploy-action@v4.6.1
-        with:
-          branch: gh-pages
-          folder: doc/html
-
       - id: release-files
         name: Create release manifest
         run: |
diff --git a/doc/ci.rst b/doc/ci.rst
index 7accfb59c84..b27c7273a69 100644
--- a/doc/ci.rst
+++ b/doc/ci.rst
@@ -96,8 +96,11 @@ was developed to leverage this.
 4. Assuming that the staging branch passes all tests, ``devel`` is
    fast-forwarded to the staging branch head commit.
 
-5. The "Publish" pipeline deploys the rendered documentation and binaries
-   generated by the testing pipeline earlier in the staging branch.
+5. The "Publish" pipeline deploys the binaries generated by the testing pipeline
+   earlier in the staging branch.
+
+6. The "Deploy documentation" pipeline deploys the latest documentation to GitHub
+   Pages.
 
 Assumptions in CI design
 ------------------------
@@ -161,9 +164,6 @@ which are used by other pipelines, these artifacts are:
 
 * "source archive": generated from the git clone.
 
-* "Generated docs": HTML documentation generated from source. This is the
-  ``doc/html`` folder after a ``koch docs`` run.
-
 Changes to how these artifacts are packaged must be reviewed carefully to
 ensure that dependent pipelines will still function.
 
@@ -245,6 +245,21 @@ Only one instance of this pipeline might be run at any given time, due to its
 mutating nature. Currently Github Action's ``concurrency`` feature is used to
 block multiple runs.
 
+"Deploy documentation"
+----------------------
+
+As the name suggests, this pipeline constructs and deploys the documentation
+website. This pipeline is dependent on the
+`Release manifest tool <#tools-release-manifest-tool>`_.
+
+Unlike other pipelines, the code run will always be that of the latest commit
+in ``devel`` branch. This means that the code should always be aware of
+differences between versions of |NimSkull| being deployed.
+
+Currently, only one instance of this pipeline might be run at any given time
+to prevent races. GitHub Actions's ``concurrency`` feature is used to
+serialize the runs.
+
 Development guidelines
 ======================
 
diff --git a/tools/release_manifest.nim b/tools/release_manifest.nim
index 89e32cc1baf..5d1c14aaad9 100644
--- a/tools/release_manifest.nim
+++ b/tools/release_manifest.nim
@@ -255,6 +255,23 @@ proc addCommand(manifest: string, archiveData: varargs[string]) =
   # Serialize a new manifest
   writeFile(manifest, $database.serialize())
 
+proc getCommand(manifest, target: string): int =
+  ## Implementation for the `get` subcommand; returns 1 if `target` is unknown.
+  ##
+  ## :manifest:
+  ##   The filename of the release manifest to inspect.
+  ##
+  ## :target:
+  ##   The triplet of interest.
+  let database = json.parseFile(manifest).deserialize()
+
+  let idx = database.triplet.find(target)
+  if idx < 0:
+    stderr.writeLine("error: target $1 could not be found in database" % target)
+    return 1
+
+  stdout.writeLine(database.file[idx])
+
 func escapeDataForGithubActions(s: string): string =
   ## Escape the string `s` so that it can be used as data for workflow commands.
   # The list is obtained from here:
@@ -314,6 +331,7 @@ type
     Help = "help"
     Add = "add"
     FilesToUpload = "files-to-upload"
+    Get = "get"
     Version = "version"
 
   Flag {.pure.} = enum
@@ -363,6 +381,7 @@ Usage: $app <command> [args]...
 Commands:
   add              Add artifacts to the manifest
   files-to-upload  List the files to be uploaded
+  get              Get release artifact for a target
   version          Print the release version
   help             Display help for any subcommand
 
@@ -393,6 +412,15 @@ Options:
                                   format such that it can be used in workflow
                                   commands (ie. set-output) without losing data.
 
+$globalOpt
+"""
+
+  GetHelp = """
+Usage: $app get [options] [--] <target>
+
+Print the artifact file name of the given target triplet. An error will be raised
+if no artifact can be found for the given target.
+
 $globalOpt
 """
 
@@ -432,6 +460,8 @@ proc printHelp(action: Action) =
     stdout.write(AddHelp % defaultHelpFormat)
   of FilesToUpload:
     stdout.write(FilesToUploadHelp % defaultHelpFormat)
+  of Get:
+    stdout.write(GetHelp % defaultHelpFormat)
   of Version:
     stdout.write(VersionHelp % defaultHelpFormat)
 
@@ -504,6 +534,16 @@ proc dispatch(cli: Cli): int =
           result = 1
         else:
           filesToUploadCommand(manifest, format.get)
+      of Get:
+        let manifest = cli.flags.getOrDefault(Flag.File, DefaultManifestFile)
+        if cli.args.len == 1:
+          result = getCommand(manifest, cli.args[0])
+        else:
+          # Zero or more than one target was given; print the help text and set failure.
+          if cli.args.len > 1:
+            stderr.writeLine("error: only one target is expected")
+          printHelp(cli.action)
+          result = 1
       of Version:
         let manifest = cli.flags.getOrDefault(Flag.File, DefaultManifestFile)
         versionCommand(manifest)

From aaba3c54dffdbb1d2c4dc397b13c2bf9d36f7428 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sat, 6 Jul 2024 21:30:34 +0200
Subject: [PATCH 145/169] sem: fix crash due to incorrect error handling
 (#1372)

## Summary

Wrap usage of erroneous symbols in quiet errors, so that error
propagation works as expected. This fixes compiler/nimsuggest crashes
when the iterable expression in `for` loops has an error.

Fixes https://github.com/nim-works/nimskull/issues/1369.

## Details

### The Problem

If the iterable slot of a `for` loop is an error, `tyError` is assigned
as the forvars' type. When such a forvar appears as an argument in a call
expression, the error is not propagated properly, which crashes the
compiler (or nimsuggest).

### The Solution

* add the `adWrappedSymError` diagnostic, which is a quiet diagnostic
  like `adWrappedError`, meaning that it's only used for error
  propagation and never reported
* move `newSymNode2` from `ast` to `sem` and change it so that it
  creates `adWrappedSymError` error nodes for symbols where the
  definition has an error
* rename `newSymNode2` to `newSymNodeOrError`
* update the few usages of `newSymNode2`
* add test for the `for`-loop-related compiler crash to the new
  `error_propagation` category

The introduction of `adWrappedSymError` is meant to be a foundational
work for changing `skError` to only represent errors (instead of both
errors and symbols whose definition has an error).
---
 compiler/ast/ast.nim                        | 26 ---------------------
 compiler/ast/ast_types.nim                  |  3 ++-
 compiler/ast/errorhandling.nim              |  2 +-
 compiler/front/cli_reporter.nim             |  2 +-
 compiler/front/msgs.nim                     |  1 +
 compiler/sem/sem.nim                        | 14 +++++++++++
 compiler/sem/semexprs.nim                   | 13 ++++-------
 compiler/sem/semstmts.nim                   |  4 ++--
 tests/error_propagation/tfor_loop_error.nim | 12 ++++++++++
 9 files changed, 37 insertions(+), 40 deletions(-)
 create mode 100644 tests/error_propagation/tfor_loop_error.nim

diff --git a/compiler/ast/ast.nim b/compiler/ast/ast.nim
index 3665b29341d..f0ad4625253 100644
--- a/compiler/ast/ast.nim
+++ b/compiler/ast/ast.nim
@@ -193,32 +193,6 @@ proc newIdentNode*(ident: PIdent, info: TLineInfo): PNode =
   result.ident = ident
   result.info = info
 
-proc newSymNode2*(sym: PSym): PNode =
-  ## creates a new `nkSym` node, unless sym.kind is an skError where an nkError
-  ## is extracted from the sym and returned instead.
-  ## NB: not a `newSymNode` replacement, it's for when symbol sem fails
-  if sym.isError:
-    result = sym.ast
-  else:
-    result = newNode(nkSym)
-    result.sym = sym
-    result.typ = sym.typ
-    result.info = sym.info
-
-proc newSymNode2*(sym: PSym, info: TLineInfo): PNode =
-  ## creates a new `nkSym` node, unless sym.kind is an skError where an nkError
-  ## is extracted from the sym and returned instead. In either case sets the
-  ## node info to the one provided
-  ## NB: not a `newSymNode` replacement, it's for when symbol sem fails
-  if sym.isError:
-    result = sym.ast
-    result.info = info
-  else:
-    result = newNode(nkSym)
-    result.sym = sym
-    result.typ = sym.typ
-    result.info = info
-
 proc newSymNodeIT*(sym: PSym, info: TLineInfo, typ: PType): PNode =
   ## create a new sym node with the supplied `info` and `typ`
   result = newNodeIT(nkSym, info, typ)
diff --git a/compiler/ast/ast_types.nim b/compiler/ast/ast_types.nim
index 4bba6e9b78a..83d76336cb3 100644
--- a/compiler/ast/ast_types.nim
+++ b/compiler/ast/ast_types.nim
@@ -1070,6 +1070,7 @@ type
   AstDiagKind* = enum
     # general
     adWrappedError
+    adWrappedSymError
     adCyclicTree
     # type
     adSemTypeMismatch
@@ -1279,7 +1280,7 @@ type
     location*: TLineInfo        # TODO: `wrongNode` already has this, move to
                                 #       variant or handle in display/rendering
     case kind*: AstDiagKind
-    of adWrappedError:
+    of adWrappedError, adWrappedSymError:
       discard
     of adSemTypeMismatch,
         adSemIllegalConversion,
diff --git a/compiler/ast/errorhandling.nim b/compiler/ast/errorhandling.nim
index eb34e2e75a2..e54e38ab409 100644
--- a/compiler/ast/errorhandling.nim
+++ b/compiler/ast/errorhandling.nim
@@ -189,7 +189,7 @@ iterator walkErrors*(config: ConfigRef; n: PNode): PNode =
   for i in 0..<errNodes.len:
     # reverse index so we go from the innermost to outermost
     let e = errNodes[i]
-    if e.diag.kind == adWrappedError:
+    if e.diag.kind in {adWrappedError, adWrappedSymError}:
       continue
 
     assert(
diff --git a/compiler/front/cli_reporter.nim b/compiler/front/cli_reporter.nim
index 73c692a24b2..18b37d8ae3f 100644
--- a/compiler/front/cli_reporter.nim
+++ b/compiler/front/cli_reporter.nim
@@ -3143,7 +3143,7 @@ func astDiagToLegacyReport(conf: ConfigRef, diag: PAstDiag): Report {.inline.} =
     vmRep: VMReport
 
   case diag.kind
-  of adWrappedError:
+  of adWrappedError, adWrappedSymError:
     semRep = SemReport(
         location: some diag.location,
         reportInst: diag.instLoc.toReportLineInfo,
diff --git a/compiler/front/msgs.nim b/compiler/front/msgs.nim
index d59bc03a49d..3e043f00a6f 100644
--- a/compiler/front/msgs.nim
+++ b/compiler/front/msgs.nim
@@ -422,6 +422,7 @@ func astDiagToLegacyReportKind*(
   ## very broad categories and they'll no longer map to "reports".
   case diag
   of adWrappedError: rsemWrappedError
+  of adWrappedSymError: rsemWrappedError
   of adSemTypeMismatch: rsemTypeMismatch
   of adSemTypeNotAllowed: rsemTypeNotAllowed
   of adSemTIsNotAConcreteType: rsemTIsNotAConcreteType
diff --git a/compiler/sem/sem.nim b/compiler/sem/sem.nim
index dae720efd1f..fe7efbefa1c 100644
--- a/compiler/sem/sem.nim
+++ b/compiler/sem/sem.nim
@@ -151,6 +151,20 @@ proc wrapErrorAndUpdate(c: ConfigRef, n: PNode, s: PSym): PNode =
   result = c.wrapError(n)
   s.ast = result
 
+proc newSymNodeOrError(c: ConfigRef, sym: PSym, info: TLineInfo): PNode =
+  ## Creates a new `nkSym` node, unless `sym` either represents an error
+  ## itself or refers to an erroneous entity. In the latter two cases, an
+  ## error node is returned.
+  ## NB: not a `newSymNode` replacement, it's for when symbol sem fails
+  if sym.isError:
+    result = sym.ast
+    result.info = info
+  elif sym.ast.isError or (sym.typ != nil and sym.typ.kind == tyError):
+    result = c.newError(newSymNode(sym, info),
+                        PAstDiag(kind: adWrappedSymError))
+  else:
+    result = newSymNode(sym, info)
+
 template semIdeForTemplateOrGenericCheck(conf, n, cursorInBody) =
   # use only for idetools support; detecting cursor in generic or template body
   # if so call `semIdeForTemplateOrGeneric` for semantic checking
diff --git a/compiler/sem/semexprs.nim b/compiler/sem/semexprs.nim
index e9ae4293edd..d65a5aac4cc 100644
--- a/compiler/sem/semexprs.nim
+++ b/compiler/sem/semexprs.nim
@@ -1631,7 +1631,7 @@ proc semSym(c: PContext, n: PNode, sym: PSym, flags: TExprFlags): PNode =
       localReport(c.config, n, reportSem rsemIllegalNimvmContext)
 
     markUsed(c, n.info, s)
-    result = newSymNode2(s, n.info)
+    result = newSymNodeOrError(c.config, s, n.info)
     # We cannot check for access to outer vars for example because it's still
     # not sure the symbol really ends up being used:
     # var len = 0 # but won't be called
@@ -1662,14 +1662,9 @@ proc semSym(c: PContext, n: PNode, sym: PSym, flags: TExprFlags): PNode =
       c.config.internalAssert s.owner != nil
     result = newSymNode(s, n.info)
   else:
-    if s.kind == skError and not s.ast.isNil and s.ast.kind == nkError:
-      # XXX: at the time of writing only `lookups.qualifiedlookup` sets up the
-      #      PSym so the error is in the ast field
-      result = s.ast
-    else:
-      let info = getCallLineInfo(n)
-      markUsed(c, info, s)
-      result = newSymNode(s, info)
+    let info = getCallLineInfo(n)
+    markUsed(c, info, s)
+    result = newSymNodeOrError(c.config, s, info)
 
 proc tryReadingGenericParam(c: PContext, n: PNode, i: PIdent, t: PType): PNode =
   case t.kind
diff --git a/compiler/sem/semstmts.nim b/compiler/sem/semstmts.nim
index ae74be1efa4..1036ba9e8cf 100644
--- a/compiler/sem/semstmts.nim
+++ b/compiler/sem/semstmts.nim
@@ -839,7 +839,7 @@ proc semNormalizedLetOrVar(c: PContext, n: PNode, symkind: TSymKind): PNode =
           c.config.newError(r, PAstDiag(kind: adSemIllegalCompileTime))
 
     if v.isError:
-      producedDecl[i] = newSymNode2(v)
+      producedDecl[i] = v.ast # ast is an error AST
       hasError = true
 
       continue # refactor: remove the need to continue
@@ -1202,7 +1202,7 @@ proc semNormalizedConst(c: PContext, n: PNode): PNode =
           localReport(c.config, defPart.info, reportSem(rsemResultShadowed))
 
     if v.isError:
-      producedDecl[i] = newSymNode2(v)
+      producedDecl[i] = v.ast # ast is an error AST
       hasError = true
 
       continue # refactor: remove the need to continue
diff --git a/tests/error_propagation/tfor_loop_error.nim b/tests/error_propagation/tfor_loop_error.nim
new file mode 100644
index 00000000000..7143d9c419b
--- /dev/null
+++ b/tests/error_propagation/tfor_loop_error.nim
@@ -0,0 +1,12 @@
+discard """
+  description: '''
+    Ensure for-loop vars are usable in call expressions when the iterable slot
+    has an error.
+  '''
+  matrix: "--errorMax:100"
+  errormsg: "undeclared identifier: 'unknown'"
+  line: 11
+"""
+
+for x in unknown:
+  echo x

From 91464de37b3846ea02e895c575fd0172f72051f3 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sun, 7 Jul 2024 20:33:21 +0200
Subject: [PATCH 146/169] clean up symbol error reporting (#1373)

## Summary

* don't report "cannot call" error when using symbol of routines
  where the definition has an error
* don't report "only identifier found is an error" when using `let`/
  `var`/`const` symbol where the initializer expression has an error
* these errors don't provide any additional information and only
  clutter compiler and nimsuggest output

## Details

* use a common erroneous symbol handling path in `semSym`
* don't turn `skLet`, `skVar`, and `skConst` into `skError`s when the
  definition AST has an error
* use the silent `adWrappedSymError` diagnostic for erroneous callees
* remove the `CalleeHasAnError` diagnostic and report
* add tests to make sure the new error reporting behaviour works
* adjust the `tpointerprocs.nim`, which is affected by the different
  error reporting
---
 compiler/ast/ast_types.nim                    |  3 ---
 compiler/ast/report_enums.nim                 |  1 -
 compiler/front/cli_reporter.nim               | 11 -----------
 compiler/front/msgs.nim                       |  1 -
 compiler/sem/semcall.nim                      |  8 +++++---
 compiler/sem/semexprs.nim                     | 19 ++++++++++---------
 compiler/sem/semstmts.nim                     |  9 ---------
 tests/error_propagation/tproc_with_error.nim  | 15 +++++++++++++++
 .../tvar_let_const_with_error.nim             | 17 +++++++++++++++++
 .../lang_callable/generics/tpointerprocs.nim  |  4 ++--
 10 files changed, 49 insertions(+), 39 deletions(-)
 create mode 100644 tests/error_propagation/tproc_with_error.nim
 create mode 100644 tests/error_propagation/tvar_let_const_with_error.nim

diff --git a/compiler/ast/ast_types.nim b/compiler/ast/ast_types.nim
index 83d76336cb3..f42fcc825af 100644
--- a/compiler/ast/ast_types.nim
+++ b/compiler/ast/ast_types.nim
@@ -1154,7 +1154,6 @@ type
     adSemUndeclaredField
     adSemCannotInstantiate
     adSemWrongNumberOfGenericParams
-    adSemCalleeHasAnError
     # sem
     adSemExpressionHasNoType
     adSemDefNameSym   ## when creating a sym node from `nkIdentKinds`
@@ -1461,8 +1460,6 @@ type
     of adSemWrongNumberOfGenericParams:
       countMismatch*: tuple[expected, got: int]
       gnrcCallLineInfo*: TLineInfo
-    of adSemCalleeHasAnError:
-      callee*: PSym
     of adSemIllformedAstExpectedOneOf:
       expectedKinds*: TNodeKinds
     of adSemImplementationExpected:
diff --git a/compiler/ast/report_enums.nim b/compiler/ast/report_enums.nim
index 6889e5befcf..b2f17deb930 100644
--- a/compiler/ast/report_enums.nim
+++ b/compiler/ast/report_enums.nim
@@ -417,7 +417,6 @@ type
     rsemIsOperatorTakes2Args
     rsemWrongNumberOfVariables
     rsemWrongNumberOfGenericParams
-    rsemCalleeHasAnError
     rsemNoGenericParamsAllowed
     rsemAmbiguousCall
     rsemCallingConventionMismatch
diff --git a/compiler/front/cli_reporter.nim b/compiler/front/cli_reporter.nim
index 18b37d8ae3f..f06d5b9cff4 100644
--- a/compiler/front/cli_reporter.nim
+++ b/compiler/front/cli_reporter.nim
@@ -1836,10 +1836,6 @@ proc reportBody*(conf: ConfigRef, r: SemReport): string =
         $r.countMismatch.expected
       )
 
-    of rsemCalleeHasAnError:
-      result = "cannot call '$1'; its definition has an error [defined at '$2']" %
-               [r.symstr, conf.toFileLineCol(r.sym.info)]
-
     of rsemNoGenericParamsAllowed:
       result = "no generic parameters allowed for $1" % r.symstr
 
@@ -3512,13 +3508,6 @@ func astDiagToLegacyReport(conf: ConfigRef, diag: PAstDiag): Report {.inline.} =
       kind: rsemWrongNumberOfGenericParams,
       ast: diag.wrongNode,
       countMismatch: diag.countMismatch)
-  of adSemCalleeHasAnError:
-    semRep = SemReport(
-      location: some diag.location,
-      reportInst: diag.instLoc.toReportLineInfo,
-      kind: rsemCalleeHasAnError,
-      ast: diag.wrongNode,
-      sym: diag.callee)
   of adSemIllformedAstExpectedPragmaOrIdent:
     semRep = SemReport(
       location: some diag.location,
diff --git a/compiler/front/msgs.nim b/compiler/front/msgs.nim
index 3e043f00a6f..e3fd21da753 100644
--- a/compiler/front/msgs.nim
+++ b/compiler/front/msgs.nim
@@ -500,7 +500,6 @@ func astDiagToLegacyReportKind*(
   of adSemUndeclaredField: rsemUndeclaredField
   of adSemCannotInstantiate: rsemCannotInstantiate
   of adSemWrongNumberOfGenericParams: rsemWrongNumberOfGenericParams
-  of adSemCalleeHasAnError: rsemCalleeHasAnError
   of adSemExpressionHasNoType: rsemExpressionHasNoType
   of adSemTypeExpected: rsemTypeExpected
   of adSemStringRangeNotAllowed: rsemStringRangeNotAllowed
diff --git a/compiler/sem/semcall.nim b/compiler/sem/semcall.nim
index 62eb231b1a6..f9646ed0352 100644
--- a/compiler/sem/semcall.nim
+++ b/compiler/sem/semcall.nim
@@ -602,9 +602,11 @@ proc semOverloadedCall(c: PContext, n, nOrig: PNode,
     result =
       case r.calleeSym.ast.kind
       of nkError:
-        # the symbol refers to an erroneous entity
-        c.config.newError(r.call):
-          PAstDiag(kind: adSemCalleeHasAnError, callee: r.calleeSym)
+        # the definition has an error; don't attempt to fully resolve the call
+        let x = r.call
+        x[0] = newSymNodeOrError(c.config, r.calleeSym, getCallLineInfo(x[0]))
+        #      ^^ will return an error node
+        c.config.wrapError(x)
       else:
         semResolvedCall(c, r, n, flags)
 
diff --git a/compiler/sem/semexprs.nim b/compiler/sem/semexprs.nim
index d65a5aac4cc..62e53f41943 100644
--- a/compiler/sem/semexprs.nim
+++ b/compiler/sem/semexprs.nim
@@ -1565,6 +1565,13 @@ proc readTypeParameter(c: PContext, typ: PType,
 
 proc semSym(c: PContext, n: PNode, sym: PSym, flags: TExprFlags): PNode =
   let s = getGenSym(c, sym)
+  # handle symbols whose definition have an error:
+  if s.kind != skError and (s.ast.isError or s.typ.isError):
+    # still mark the symbol as used
+    markUsed(c, n.info, s)
+    return c.config.newError(newSymNode(s, n.info),
+                             PAstDiag(kind: adWrappedSymError))
+
   case s.kind
   of skConst:
     markUsed(c, n.info, s)
@@ -1596,20 +1603,14 @@ proc semSym(c: PContext, n: PNode, sym: PSym, flags: TExprFlags): PNode =
     else:
       result = newSymNode(s, n.info)
   of skMacro:
-    if s.ast.kind == nkError:
-      result = c.config.newError(n,
-        PAstDiag(kind: adSemCalleeHasAnError, callee: s))
-    elif efNoEvaluateGeneric in flags and s.ast[genericParamsPos].safeLen > 0 or
+    if efNoEvaluateGeneric in flags and s.ast[genericParamsPos].safeLen > 0 or
        (n.kind notin nkCallKinds and s.requiredParams > 0):
       markUsed(c, n.info, s)
       result = symChoice(c, n, s, scClosed)
     else:
       result = semMacroExpr(c, n, s, flags)
   of skTemplate:
-    if s.ast.kind == nkError:
-      result = c.config.newError(n,
-        PAstDiag(kind: adSemCalleeHasAnError, callee: s))
-    elif efNoEvaluateGeneric in flags and s.ast[genericParamsPos].safeLen > 0 or
+    if efNoEvaluateGeneric in flags and s.ast[genericParamsPos].safeLen > 0 or
        (n.kind notin nkCallKinds and s.requiredParams > 0) or
        sfCustomPragma in sym.flags:
       let info = getCallLineInfo(n)
@@ -1631,7 +1632,7 @@ proc semSym(c: PContext, n: PNode, sym: PSym, flags: TExprFlags): PNode =
       localReport(c.config, n, reportSem rsemIllegalNimvmContext)
 
     markUsed(c, n.info, s)
-    result = newSymNodeOrError(c.config, s, n.info)
+    result = newSymNode(s, n.info)
     # We cannot check for access to outer vars for example because it's still
     # not sure the symbol really ends up being used:
     # var len = 0 # but won't be called
diff --git a/compiler/sem/semstmts.nim b/compiler/sem/semstmts.nim
index 1036ba9e8cf..5acc11c8df9 100644
--- a/compiler/sem/semstmts.nim
+++ b/compiler/sem/semstmts.nim
@@ -882,9 +882,6 @@ proc semNormalizedLetOrVar(c: PContext, n: PNode, symkind: TSymKind): PNode =
       else:
         internalError(c.config, "should never happen")
 
-    if v.ast.isError:
-      v.transitionToError(v.ast)
-
     # set the symbol type and add the symbol to the production
     producedDecl[i] = setSymType(c, r, v, vTyp)
 
@@ -1226,12 +1223,6 @@ proc semNormalizedConst(c: PContext, n: PNode): PNode =
       else:
         internalError(c.config, "should never happen")
 
-    if v.ast.isError:
-      # XXX: although this mirrors the behaviour of ``semNormalizedLetOrVar``,
-      #      it seems wrong. For example, the type of the symbol is set to a
-      #      valid type instead of ``tyError``
-      v.transitionToError(v.ast)
-
     # set the symbol type and add the symbol to the production
     producedDecl[i] = setSymType(c, r, v, vTyp)
 
diff --git a/tests/error_propagation/tproc_with_error.nim b/tests/error_propagation/tproc_with_error.nim
new file mode 100644
index 00000000000..715ce32c14f
--- /dev/null
+++ b/tests/error_propagation/tproc_with_error.nim
@@ -0,0 +1,15 @@
+discard """
+  cmd: "nim check --hints:off $options $file"
+  action: reject
+  nimoutFull: true
+  nimout: '''
+tproc_with_error.nim(11, 11) Error: undeclared identifier: 'missing'
+'''
+"""
+
+proc p() =
+  discard missing # <- error
+
+# calling the procedure doesn't result in errors being reported to the
+# programmer
+p()
diff --git a/tests/error_propagation/tvar_let_const_with_error.nim b/tests/error_propagation/tvar_let_const_with_error.nim
new file mode 100644
index 00000000000..ac0212d84b3
--- /dev/null
+++ b/tests/error_propagation/tvar_let_const_with_error.nim
@@ -0,0 +1,17 @@
+discard """
+  cmd: "nim check --hints:off $options $file"
+  action: reject
+  nimoutFull: true
+  nimout: '''
+tvar_let_const_with_error.nim(12, 12) Error: undeclared identifier: 'missing'
+tvar_let_const_with_error.nim(13, 12) Error: undeclared identifier: 'missing'
+tvar_let_const_with_error.nim(14, 12) Error: undeclared identifier: 'missing'
+'''
+"""
+
+var va   = missing
+let le   = missing
+const co = missing
+
+# using the symbols doesn't result in errors being reported to the programmer
+echo va, le, co
diff --git a/tests/lang_callable/generics/tpointerprocs.nim b/tests/lang_callable/generics/tpointerprocs.nim
index 3000a3359ac..16e98746936 100644
--- a/tests/lang_callable/generics/tpointerprocs.nim
+++ b/tests/lang_callable/generics/tpointerprocs.nim
@@ -3,11 +3,11 @@ cmd: "nim check $options --hints:off $file"
 action: "reject"
 nimout:'''
 tpointerprocs.nim(14, 11) Error: 'foo' doesn't have a concrete type, due to unspecified generic parameters.
-tpointerprocs.nim(15, 11) Error: identifier 'bar' found but it has errors, see: tpointerprocs.nim(14, 5)
 tpointerprocs.nim(26, 11) Error: cannot instantiate: 'foo[int]'; got 1 typeof(s) but expected 2
-tpointerprocs.nim(27, 11) Error: identifier 'bar' found but it has errors, see: tpointerprocs.nim(26, 5)
 '''
 """
+
+
 block:
   proc foo(x: int | float): float = result = 1.0
   let

From 8b2b72ee7c07b32fa39400bf93648f67df69db0c Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Wed, 10 Jul 2024 00:24:55 +0200
Subject: [PATCH 147/169] Report error for foreign forward declared generic
 (#1374)

## Summary

Fix the compiler or backend crashing when using an incomplete generic
procedure from another module. A proper compiler error is now reported
in this case.

Fixes https://github.com/nim-works/nimskull/issues/1368.

## Details

The issues can only occur in the presence of cyclic imports.
Instantiating a generic routine registers it in the instantiating
module, preventing its body from being patched when the generic routine
is complete. Using the instantiation cache when completing a forward-
declared generic won't work, since the module an instantiation comes
from might be closed already.

Instead, this situation is now detected and an error is reported. No
error is reported if no instantiation takes place (i.e., because the
instantiation was cached already), meaning that previously working
code stays working.
---
 compiler/ast/report_enums.nim                 |  1 +
 compiler/front/cli_reporter.nim               |  4 ++++
 compiler/sem/seminst.nim                      |  5 +++++
 .../generics/mgeneric_cycle_forward.nim       |  5 +++++
 .../generics/tgeneric_cycle_forward.nim       | 20 +++++++++++++++++++
 5 files changed, 35 insertions(+)
 create mode 100644 tests/lang_callable/generics/mgeneric_cycle_forward.nim
 create mode 100644 tests/lang_callable/generics/tgeneric_cycle_forward.nim

diff --git a/compiler/ast/report_enums.nim b/compiler/ast/report_enums.nim
index b2f17deb930..80471922f3a 100644
--- a/compiler/ast/report_enums.nim
+++ b/compiler/ast/report_enums.nim
@@ -360,6 +360,7 @@ type
 
     rsemCannotInstantiate
     rsemCannotInstantiateWithParameter
+    rsemCannotInstantiateForwarded
     rsemCannotGenerateGenericDestructor
     rsemUndeclaredField
     rsemExpectedOrdinal
diff --git a/compiler/front/cli_reporter.nim b/compiler/front/cli_reporter.nim
index f06d5b9cff4..e9e9616839e 100644
--- a/compiler/front/cli_reporter.nim
+++ b/compiler/front/cli_reporter.nim
@@ -790,6 +790,10 @@ proc reportBody*(conf: ConfigRef, r: SemReport): string =
           r.ownerSym.name.s
         )
 
+    of rsemCannotInstantiateForwarded:
+      result = "cannot instantiate generic procedure forward-declared in " &
+               "another module"
+
     of rsemTypeKindMismatch:
       result = r.str
       result.add  " got '$1'" % typeToString(r.actualType)
diff --git a/compiler/sem/seminst.nim b/compiler/sem/seminst.nim
index a47e0fea606..985785ecade 100644
--- a/compiler/sem/seminst.nim
+++ b/compiler/sem/seminst.nim
@@ -401,6 +401,11 @@ proc generateInstance(c: PContext, fn: PSym, pt: TIdTable,
   n[genericParamsPos] = c.graph.emptyNode
   var oldPrc = genericCacheGet(c.graph, fn, entry[], c.compilesContextId)
   if oldPrc == nil:
+    if sfForward in fn.flags and fn.itemId.module != c.module.itemId.module:
+      localReport(c.config, info, reportSem(rsemCannotInstantiateForwarded))
+      # don't abort instantiation; let it complete for the sake of error
+      # correction (check/suggest)
+
     # we MUST not add potentially wrong instantiations to the caching mechanism.
     # This means recursive instantiations behave differently when in
     # a ``compiles`` context but this is the lesser evil. See
diff --git a/tests/lang_callable/generics/mgeneric_cycle_forward.nim b/tests/lang_callable/generics/mgeneric_cycle_forward.nim
new file mode 100644
index 00000000000..22bef725b8e
--- /dev/null
+++ b/tests/lang_callable/generics/mgeneric_cycle_forward.nim
@@ -0,0 +1,5 @@
+import tgeneric_cycle_forward
+
+forwarded[int]() # was already instantiated; works
+# try to instantiate the incomplete generic routine:
+forwarded[float]()
diff --git a/tests/lang_callable/generics/tgeneric_cycle_forward.nim b/tests/lang_callable/generics/tgeneric_cycle_forward.nim
new file mode 100644
index 00000000000..7f72e20fb18
--- /dev/null
+++ b/tests/lang_callable/generics/tgeneric_cycle_forward.nim
@@ -0,0 +1,20 @@
+discard """
+  description: '''
+    Ensure instantiating foreign, incomplete generic procedures leads to a
+    proper error.
+  '''
+  errormsg: "cannot instantiate generic procedure forward-declared in another module"
+  file: "mgeneric_cycle_forward.nim"
+  line: 5
+"""
+
+proc forwarded*[T]()
+
+# instantiate with `int` before starting the import cycle
+forwarded[int]()
+
+import mgeneric_cycle_forward # start the recursive import
+
+# complete the forward declaration:
+proc forwarded[T]() =
+  discard

From 759ee3976cd70dccfbe0ba7424561f5688c88cd6 Mon Sep 17 00:00:00 2001
From: alaviss <leorize+oss@disroot.org>
Date: Thu, 11 Jul 2024 15:35:25 -0500
Subject: [PATCH 148/169] ci: clean up workflows (#1378)

## Summary
This PR cleans up unnecessary dependencies and removes some (potentially)
unsafe usage of templating.

## Details
* Replaced `fkirc/skip-duplicate-actions` with the natively supported
`concurrency` feature.
* Replaced unsafe usage of templating with equivalent environment
variables.
* Replaced `tibdex/github-app-token` with the first-party
`actions/create-github-app-token`.
---
 .github/workflows/ci.yml                  | 34 ++++++++++-------------
 .github/workflows/slash-command-merge.yml |  6 ++--
 .github/workflows/slash-commands.yml      |  6 ++--
 3 files changed, 20 insertions(+), 26 deletions(-)

diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
index 0a75e1a04e9..64bd65060e7 100644
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@@ -32,6 +32,10 @@ defaults:
   run:
     shell: bash
 
+concurrency:
+  group: ci-${{ github.ref }}
+  cancel-in-progress: true
+
 jobs:
   pre_run:
     name: Provide additional context for the workflow
@@ -42,29 +46,17 @@ jobs:
       shared_builder: ${{ steps.matrix.outputs.shared }}
 
     steps:
-      - id: run_cond
-        uses: fkirc/skip-duplicate-actions@v5.3.1
-        with:
-          # Cancel CI on outdated commits
-          cancel_others: true
-          # Don't skip when a duplicated run (ie. from a PR) is done.
-          #
-          # Only CI in upstream has docs publishing rights.
-          skip_after_successful_duplicate: false
-          # Do not skip on push, dispatched or cron
-          do_not_skip: '["push", "workflow_dispatch", "schedule"]'
-
       - id: skip_result
         name: Whether to skip checks
         run: |
-          if [[ '${{ steps.run_cond.outputs.should_skip }}' == true ]]; then
-            echo "result=true" >> $GITHUB_OUTPUT
-          elif [[ '${{ github.event.pull_request.draft }}' == true ]]; then
+          if [[ $IS_DRAFT == true ]]; then
             echo "Pull request is in draft state, skipping"
             echo "result=true" >> $GITHUB_OUTPUT
           else
             echo "result=false" >> $GITHUB_OUTPUT
           fi
+        env:
+          IS_DRAFT: ${{ github.event.pull_request.draft }}
 
       - id: matrix
         name: Obtain build target matrix
@@ -248,7 +240,9 @@ jobs:
         shell: pwsh
 
       - name: Run tester
-        run: ./koch.py test --batch:'${{ matrix.batch }}_${{ matrix.total_batch }}' --tryFailing all
+        run: ./koch.py test --batch:"$TEST_BATCH" --tryFailing all
+        env:
+          TEST_BATCH: ${{ matrix.batch }}_${{ matrix.total_batch }}
 
       - name: Print all test errors
         if: failure()
@@ -428,8 +422,8 @@ jobs:
       - name: Build docs
         run: |
           ./koch.py doc \
-            --git.url:'https://github.com/${{ github.repository }}' \
-            --git.commit:'${{ github.sha }}' \
+            --git.url:"https://github.com/$GITHUB_REPOSITORY" \
+            --git.commit:"$GITHUB_SHA" \
             --git.devel:devel
 
           # Remove leftover nimskullcache
@@ -522,8 +516,8 @@ jobs:
       - name: Build docs
         run: |
           ./koch.py doc \
-            --git.url:'https://github.com/${{ github.repository }}' \
-            --git.commit:'${{ github.sha }}' \
+            --git.url:"https://github.com/$GITHUB_REPOSITORY" \
+            --git.commit:"$GITHUB_SHA" \
             --git.devel:devel
 
           # Remove leftover nimskullcache
diff --git a/.github/workflows/slash-command-merge.yml b/.github/workflows/slash-command-merge.yml
index 731aa2f9403..8dfc87dc871 100644
--- a/.github/workflows/slash-command-merge.yml
+++ b/.github/workflows/slash-command-merge.yml
@@ -117,10 +117,10 @@ jobs:
       - if: steps.pr-data.outputs.run
         id: token
         name: Create app token for merges
-        uses: tibdex/github-app-token@v2
+        uses: actions/create-github-app-token@v1
         with:
-          app_id: ${{ secrets.CHORE_APP_ID }}
-          private_key: ${{ secrets.CHORE_APP_KEY }}
+          app-id: ${{ secrets.CHORE_APP_ID }}
+          private-key: ${{ secrets.CHORE_APP_KEY }}
 
         # TODO: Switch to GitHub CLI once
         # https://github.com/cli/cli/issues/7213 is solved.
diff --git a/.github/workflows/slash-commands.yml b/.github/workflows/slash-commands.yml
index 76b313d72ed..1987cfd988c 100644
--- a/.github/workflows/slash-commands.yml
+++ b/.github/workflows/slash-commands.yml
@@ -12,10 +12,10 @@ jobs:
     runs-on: ubuntu-latest
     steps:
       - id: token
-        uses: tibdex/github-app-token@v2
+        uses: actions/create-github-app-token@v1
         with:
-          app_id: ${{ secrets.CHORE_APP_ID }}
-          private_key: ${{ secrets.CHORE_APP_KEY }}
+          app-id: ${{ secrets.CHORE_APP_ID }}
+          private-key: ${{ secrets.CHORE_APP_KEY }}
 
       - uses: peter-evans/slash-command-dispatch@v4
         with:

From 1a6e12581a5ed9e812b6a32b9bc184613ee27810 Mon Sep 17 00:00:00 2001
From: alaviss <leorize+oss@disroot.org>
Date: Thu, 11 Jul 2024 19:31:23 -0500
Subject: [PATCH 149/169] add changelog builder for release publishing (#1377)

## Summary
Add changelog builder to the publishing workflow. This allows us to
provide richer release information to users.

## Details
The changelog builder will tally all PRs merged between the previous tag
and the latest tag, then generate a categorized changelog for them. The
configuration for the builder can be found at `.github/changelog.json`.

In addition to this, a `/generate-changelog` PR command has been added,
which allows maintainers to generate a changelog based on the new
configuration within a given PR.

Usage:

/generate-changelog [from=<tag>] [to=<tag>] [no_prerelease=<true|false>]

Where:

- `from`: Specify the previous tag. If not provided, will be the first
tag older than `to`.
- `to`: Specify the latest tag. If not provided, will be the latest
tag in this repository.
- `no_prerelease`: Only applies when `from` is not provided. If set
to `true`, `from` is selected such that the older tag is /not/ a
pre-release. Defaults to `false`.
---
 .github/changelog.json                        | 90 +++++++++++++++++++
 .github/workflows/publisher.yml               | 23 ++++-
 .../slash-command-generate-changelog.yml      | 81 +++++++++++++++++
 .github/workflows/slash-commands.yml          |  1 +
 4 files changed, 193 insertions(+), 2 deletions(-)
 create mode 100644 .github/changelog.json
 create mode 100644 .github/workflows/slash-command-generate-changelog.yml

diff --git a/.github/changelog.json b/.github/changelog.json
new file mode 100644
index 00000000000..56a6a1529f6
--- /dev/null
+++ b/.github/changelog.json
@@ -0,0 +1,90 @@
+{
+  "categories": [
+    {
+      "title": "## 🚀 Features",
+      "labels": ["enhancement"],
+      "categories": [
+        {
+          "title": "### Compiler",
+          "labels": ["enhancement"],
+          "exhaustive": true,
+          "rules": [
+            {
+              "on_property": "labels",
+              "pattern": "compiler.*"
+            }
+          ]
+        },
+        {
+          "title": "### Standard Library",
+          "labels": ["enhancement", "stdlib"],
+          "exhaustive": true
+        },
+        {
+          "title": "### Tooling",
+          "labels": ["enhancement", "tools"],
+          "exhaustive": true
+        }
+      ]
+    },
+    {
+      "title": "## 🐛 Fixes",
+      "labels": ["bug"],
+      "categories": [
+        {
+          "title": "### Compiler",
+          "labels": ["bug"],
+          "exhaustive": true,
+          "rules": [
+            {
+              "on_property": "labels",
+              "pattern": "compiler.*"
+            }
+          ]
+        },
+        {
+          "title": "### Standard Library",
+          "labels": ["bug", "stdlib"],
+          "exhaustive": true
+        },
+        {
+          "title": "### Tooling",
+          "labels": ["bug", "tool"],
+          "exhaustive": true
+        }
+      ]
+    },
+    {
+      "title": "## 🔧 Refactorings",
+      "labels": ["refactor", "simplification"],
+      "categories": [
+        {
+          "title": "### Compiler",
+          "labels": ["refactor", "simplification"],
+          "exhaustive_rules": true,
+          "rules": [
+            {
+              "on_property": "labels",
+              "pattern": "compiler.*"
+            }
+          ]
+        },
+        {
+          "title": "### Standard Library",
+          "labels": ["refactor", "stdlib"],
+          "exhaustive": true
+        },
+        {
+          "title": "### Tooling",
+          "labels": ["refactor", "tool"],
+          "exhaustive": true
+        }
+      ]
+    }
+  ],
+  "template": "# What's Changed\n\n#{{CHANGELOG}}\n\n<details>\n<summary>\n\n## 💬 Other\n\n</summary>\n\n#{{UNCATEGORIZED}}\n\n</details>\n\n**Full Changelog**: #{{RELEASE_DIFF}}",
+  "empty_template": "**Full Changelog**: #{{RELEASE_DIFF}}",
+  "pr_template": "* #{{TITLE}} by @#{{AUTHOR}} in #{{URL}}",
+  "sort": "DSC",
+  "base_branches": ["devel"]
+}
diff --git a/.github/workflows/publisher.yml b/.github/workflows/publisher.yml
index 5d0125ed76a..2a39c9265b6 100644
--- a/.github/workflows/publisher.yml
+++ b/.github/workflows/publisher.yml
@@ -25,6 +25,13 @@ jobs:
       url: ${{ steps.release.outputs.url }}
 
     steps:
+      # Repository required for changelog builder
+      - uses: actions/checkout@v4
+        with:
+          fetch-depth: 0
+          sparse-checkout: |
+            .github
+
       - name: Obtain latest successful run id
         id: finder
         run: |
@@ -103,5 +110,17 @@ jobs:
           tag_name: ${{ steps.release-files.outputs.version }}
           fail_on_unmatched_files: true
           target_commitish: ${{ github.event.after }}
-          body: |
-            Continuous delivery for commit ${{ github.event.after }}
+
+      - id: changelog
+        name: Create release changelog
+        uses: mikepenz/release-changelog-builder-action@v5.0.0-a04
+        with:
+          configuration: ".github/changelog.json"
+          toTag: ${{ steps.release-files.outputs.version }}
+          failOnError: true
+
+      - name: Push changelog
+        uses: softprops/action-gh-release@v2.0.6
+        with:
+          tag_name: ${{ steps.release-files.outputs.version }}
+          body: ${{ steps.changelog.outputs.changelog }}
diff --git a/.github/workflows/slash-command-generate-changelog.yml b/.github/workflows/slash-command-generate-changelog.yml
new file mode 100644
index 00000000000..ce93cd85d3e
--- /dev/null
+++ b/.github/workflows/slash-command-generate-changelog.yml
@@ -0,0 +1,81 @@
+name: /generate-changelog handler
+
+on:
+  repository_dispatch:
+    types: [generate-changelog-command]
+
+permissions:
+  pull-requests: write
+
+concurrency: generate-changelog-handler-${{ github.event.client_payload.pull_request.node_id || github.run_id }}
+
+jobs:
+  changelog:
+    if: github.event.client_payload.pull_request != null
+    name: Generate changelog and comment
+
+    runs-on: ubuntu-latest
+    env:
+      PR: ${{ github.event.client_payload.pull_request.number }}
+    steps:
+      - if: github.event.client_payload.pull_request.merge_commit_sha == null
+        name: Report "No merge HEAD" found
+        uses: peter-evans/create-or-update-comment@v4
+        with:
+          issue-number: ${{ env.PR }}
+          body: |
+            Could not generate changelog using this PR as no GitHub merge commits are available.
+
+            This could be due to the PR being recently opened or there is a merge conflict. Please
+            try again after a few minutes.
+
+      - if: github.event.client_payload.pull_request.merge_commit_sha == null
+        name: Fail due to "No merge HEAD"
+        run: |
+          echo "::error::No merge HEAD found for PR #$PR"
+          exit 1
+
+      - name: "Checkout merge head for #${{ env.PR }}"
+        uses: actions/checkout@v4
+        with:
+          ref: ${{ github.event.client_payload.pull_request.merge_commit_sha }}
+          sparse-checkout: |
+            .github
+
+      - id: changelog
+        name: Create changelog
+        uses: mikepenz/release-changelog-builder-action@v5.0.0-a04
+        with:
+          configuration: ".github/changelog.json"
+          fromTag: ${{ github.event.client_payload.slash_command.args.named.from || '' }}
+          toTag: ${{ github.event.client_payload.slash_command.args.named.to || '' }}
+          ignorePreReleases: ${{ github.event.client_payload.slash_command.args.named.no_prerelease || false }}
+
+      - if: steps.changelog.outputs.failed == 'true'
+        name: Report failure
+        uses: peter-evans/create-or-update-comment@v4
+        with:
+          issue-number: ${{ env.PR }}
+          body: |
+            Error occurred while generating changelog using this PR.
+
+            See run log at ${{ github.server_url }}/${{ github.repository }}/actions/runs/${{ github.run_id }}.
+
+      - if: steps.changelog.outputs.failed == 'true'
+        name: Fail due to changelog
+        run: |
+          echo "::error::Error occurred while generating changelog using PR #$PR"
+          exit 1
+
+      - name: Comment with changelog
+        uses: peter-evans/create-or-update-comment@v4
+        with:
+          issue-number: ${{ env.PR }}
+          body: |
+            Changelog requested by: @${{ github.event.client_payload.github.payload.comment.user.login }}
+
+            Generated between ${{ steps.changelog.outputs.fromTag }} to ${{ steps.changelog.outputs.toTag }} using configuration provided by this PR.
+
+            ---
+
+            ${{ steps.changelog.outputs.changelog }}
diff --git a/.github/workflows/slash-commands.yml b/.github/workflows/slash-commands.yml
index 1987cfd988c..939366186df 100644
--- a/.github/workflows/slash-commands.yml
+++ b/.github/workflows/slash-commands.yml
@@ -23,5 +23,6 @@ jobs:
           reaction-token: ${{ steps.token.outputs.token }}
           commands: |
             merge
+            generate-changelog
           issue-type: pull-request
           permission: write

From 7a3226a65809873cf11c25d2d890d62107ef74db Mon Sep 17 00:00:00 2001
From: alaviss <leorize+oss@disroot.org>
Date: Sun, 14 Jul 2024 19:41:46 -0500
Subject: [PATCH 150/169] changelog: move "Other" into categories (#1380)

While this will no longer allow the category to be collapsible, it will
allow the category to be omitted when nothing goes there.

This addresses the empty "Other" section as seen in
https://github.com/nim-works/nimskull/releases/tag/0.1.0-dev.21377
---
 .github/changelog.json | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/.github/changelog.json b/.github/changelog.json
index 56a6a1529f6..71614a27971 100644
--- a/.github/changelog.json
+++ b/.github/changelog.json
@@ -80,9 +80,13 @@
           "exhaustive": true
         }
       ]
+    },
+    {
+      "title": "## 💬 Other",
+      "labels": []
     }
   ],
-  "template": "# What's Changed\n\n#{{CHANGELOG}}\n\n<details>\n<summary>\n\n## 💬 Other\n\n</summary>\n\n#{{UNCATEGORIZED}}\n\n</details>\n\n**Full Changelog**: #{{RELEASE_DIFF}}",
+  "template": "# What's Changed\n\n#{{CHANGELOG}}\n\n**Full Changelog**: #{{RELEASE_DIFF}}",
   "empty_template": "**Full Changelog**: #{{RELEASE_DIFF}}",
   "pr_template": "* #{{TITLE}} by @#{{AUTHOR}} in #{{URL}}",
   "sort": "DSC",

From d69d651052c9415089e7f3758aef0ed41d34663f Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Mon, 15 Jul 2024 18:21:57 +0200
Subject: [PATCH 151/169] IC: fix type-bound operator lookup (#1383)

## Summary

Fix the compiler crashing in some contrived situations when using
`--ic:on`.

## Details

* populate the `canonTypes` table in `ic/cbackend` before starting the
  mid-/back-end processing
* type instances that weren't processed by `createTypeBoundOps` (e.g.,
  type instances for parameters) need the `canonTypes` lookup table for
  looking up the type-bound hooks
* the added test provides more information about the circumstances of
  the crash

---------

Co-authored-by: Saem Ghani <saemghani+github@gmail.com>
---
 compiler/ic/cbackend.nim      | 22 ++++++++++++++++++++--
 tests/ic/tcanonical_types.nim | 23 +++++++++++++++++++++++
 2 files changed, 43 insertions(+), 2 deletions(-)
 create mode 100644 tests/ic/tcanonical_types.nim

diff --git a/compiler/ic/cbackend.nim b/compiler/ic/cbackend.nim
index a36f6d70b6b..8b0e990ebf4 100644
--- a/compiler/ic/cbackend.nim
+++ b/compiler/ic/cbackend.nim
@@ -13,7 +13,9 @@
 
 import
   std/[
-    packedsets, algorithm
+    algorithm,
+    packedsets,
+    tables
   ],
   compiler/ast/[
     ast,
@@ -42,7 +44,8 @@ import
     rodfiles
   ],
   compiler/sem/[
-    modulelowering
+    modulelowering,
+    sighashes
   ]
 
 import compiler/backend/cbackend as cbackend2
@@ -195,6 +198,21 @@ proc generateCode*(g: ModuleGraph) =
       mlist.modulesClosed.add(pos)
       break
 
+  # fill the table of canonical types; hook injection needs it during its
+  # lookup
+  for e in attachedAsgn..attachedTrace:
+    for item, sym in g.attachedOps[e].mpairs:
+      # retrieving the attached-to type from the symbol is easier than
+      # trying to map `item` to a PType
+      let resolved = loadSymFromId(g.config, g.cache, g.packed, sym.id.module,
+                                   sym.id.packed)
+      if resolved.typ != nil:
+        # XXX: for an unknown reason, some symbols don't have a type
+        let t = resolved.typ[1].skipTypes({tyVar})
+        # ignore types that don't have real type-bound operators
+        if tfHasAsgn in t.flags and t.kind notin {tyDistinct, tyObject}:
+          discard g.canonTypes.mgetOrPut(hashType(t, {CoDistinct, CoType}), t)
+
   # Fourth pass: Generate the code:
   cbackend2.generateCode(g, backend, mlist)
   g.backend = backend
diff --git a/tests/ic/tcanonical_types.nim b/tests/ic/tcanonical_types.nim
new file mode 100644
index 00000000000..0f89ca0e10e
--- /dev/null
+++ b/tests/ic/tcanonical_types.nim
@@ -0,0 +1,23 @@
+discard """
+  description: '''
+    Regression test for compiler crash due to missing hook attachments. The
+    test is contrived and depends on compiler implementation details.
+  '''
+"""
+
+proc f1(x: ref int): ref int =
+  # the assignment requires the =copy hook. `f1` is processed by hook lifting
+  # first, so the lifetime hooks are bound to the result variable's ``ref int``
+  # instance
+  result = x
+
+proc f2(x: ref int) =
+  discard
+
+# use `f2` first so that its ``ref int`` instance is registered with the
+# environment
+f2(nil)
+# then use `f1`. Its ``ref int`` instance is mapped to that of `f2`, and
+# since `f2`'s ``ref int`` *instance* has no hook attached, missing canonical
+# type mappings result in a crash (as no hook can be found)
+discard f1(nil)

From 4f95d2afbe4ca80f679065464c40feec3480921a Mon Sep 17 00:00:00 2001
From: "P. Starsider" <132208486+starsiderfox@users.noreply.github.com>
Date: Mon, 22 Jul 2024 01:46:35 +0200
Subject: [PATCH 152/169] sem, pragmas: fix fatal pragma (#1386)

## Summary

Using  `{.fatal:"...".}`  did not show any message to the user and it
didn't stop compilation.
This commit fixes both issues.

## Details

-  `adSemFatalError`  now carries a message just like
`adSemCustomUserError` .
- All reports of `fatal` severity abort compilation.
- Testament now also considers fatal errors to be errors.
- A simple test case has been included.
-  `isCompilerFatal`  has been removed as it seems it lost its purpose.
The check for  `rextCmdRequiresFile`  seems to be unnecessary. A fatal
report is produced elsewhere (the only place where
`rextCmdRequiresFile`  is used) before this function is ever called, so
the check was redundant and removing it doesn't break existing code.
---
 compiler/ast/ast_types.nim      |  3 +--
 compiler/front/cli_reporter.nim |  5 ++---
 compiler/front/msgs.nim         |  2 +-
 compiler/front/options.nim      | 10 ----------
 compiler/sem/pragmas.nim        |  7 ++++++-
 testament/testament.nim         |  2 +-
 tests/pragmas/tfatal.nim        |  4 ++++
 7 files changed, 15 insertions(+), 18 deletions(-)
 create mode 100644 tests/pragmas/tfatal.nim

diff --git a/compiler/ast/ast_types.nim b/compiler/ast/ast_types.nim
index f42fcc825af..e73893ba4fa 100644
--- a/compiler/ast/ast_types.nim
+++ b/compiler/ast/ast_types.nim
@@ -1324,7 +1324,6 @@ type
         adSemAlignRequiresPowerOfTwo,
         adSemNoReturnHasReturn,
         adSemMisplacedDeprecation,
-        adSemFatalError,
         adSemNoUnionForJs,
         adSemBitsizeRequiresPositive,
         adSemExperimentalRequiresToplevel,
@@ -1421,7 +1420,7 @@ type
       externName*: string
     of adSemPragmaRecursiveDependency:
       userPragma*: PSym
-    of adSemCustomUserError:
+    of adSemCustomUserError, adSemFatalError:
       errmsg*: string
     of adSemImplicitPragmaError:
       implicitPragma*: PSym
diff --git a/compiler/front/cli_reporter.nim b/compiler/front/cli_reporter.nim
index e9e9616839e..2031f03180c 100644
--- a/compiler/front/cli_reporter.nim
+++ b/compiler/front/cli_reporter.nim
@@ -3211,7 +3211,6 @@ func astDiagToLegacyReport(conf: ConfigRef, diag: PAstDiag): Report {.inline.} =
       adSemAlignRequiresPowerOfTwo,
       adSemNoReturnHasReturn,
       adSemMisplacedDeprecation,
-      adSemFatalError,
       adSemNoUnionForJs,
       adSemBitsizeRequiresPositive,
       adSemExperimentalRequiresToplevel,
@@ -3428,11 +3427,11 @@ func astDiagToLegacyReport(conf: ConfigRef, diag: PAstDiag): Report {.inline.} =
         kind: rsemPragmaRecursiveDependency,
         sym: diag.userPragma,
         ast: diag.wrongNode)
-  of adSemCustomUserError:
+  of adSemFatalError, adSemCustomUserError:
     semRep = SemReport(
         location: some diag.location,
         reportInst: diag.instLoc.toReportLineInfo,
-        kind: rsemCustomUserError,
+        kind: kind,
         str: diag.errmsg,
         ast: diag.wrongNode)
   of adSemImplicitPragmaError:
diff --git a/compiler/front/msgs.nim b/compiler/front/msgs.nim
index e3fd21da753..79b785b28da 100644
--- a/compiler/front/msgs.nim
+++ b/compiler/front/msgs.nim
@@ -294,7 +294,7 @@ proc errorActions(
     eh: TErrorHandling
   ): tuple[action: TErrorHandling, withTrace: bool] =
   result = (doNothing, false)
-  if conf.isCompilerFatal(report):
+  if report.severity == rsevFatal:
     # Fatal message such as ICE (internal compiler), errFatal,
     result = (doAbort, true)
   elif conf.isCodeError(report):
diff --git a/compiler/front/options.nim b/compiler/front/options.nim
index c90c6046a3d..fc100d0ce4e 100644
--- a/compiler/front/options.nim
+++ b/compiler/front/options.nim
@@ -615,16 +615,6 @@ template report*[R: ReportTypes](
   ## it's instantiation info with `instantiationInfo()` of the template.
   report(conf, wrap(inReport, instLoc(), tinfo))
 
-# REFACTOR: we shouldn't need to dig into the internalReport and query severity
-#           directly
-from compiler/ast/reports_internal import severity
-
-func isCompilerFatal*(conf: ConfigRef, report: Report): bool =
-  ## Check if report stores fatal compilation error
-  report.category == repInternal and
-  report.internalReport.severity() == rsevFatal or
-  report.kind == rextCmdRequiresFile
-
 func severity*(conf: ConfigRef, report: ReportTypes | Report): ReportSeverity =
   # style checking is a hint by default, but can be globally overriden to
   # be treated as error via `--styleCheck:error`, and this is handled in
diff --git a/compiler/sem/pragmas.nim b/compiler/sem/pragmas.nim
index 92b07857d56..547fb70cfce 100644
--- a/compiler/sem/pragmas.nim
+++ b/compiler/sem/pragmas.nim
@@ -1556,7 +1556,12 @@ proc applyStmtPragma(c: PContext, owner: PSym, it: PNode, k: TSpecialWord): PNod
           result = c.config.newError(
             it, PAstDiag(kind: adSemCustomUserError, errmsg: s.strVal))
   of wFatal:
-    result = c.config.newError(it, PAstDiag(kind: adSemFatalError))
+    let (s, err) = strLitToStrOrErr(c, it)
+    result =
+      if err.isNil:
+        c.config.newError(it, PAstDiag(kind: adSemFatalError, errmsg: s))
+      else:
+        err
   of wDefine:
     result = processDefine(c, it)
   of wUndef:
diff --git a/testament/testament.nim b/testament/testament.nim
index be47463c69b..f93cb4e71b2 100644
--- a/testament/testament.nim
+++ b/testament/testament.nim
@@ -316,7 +316,7 @@ proc verboseCmd(cmd: string) =
 
 let
   pegLineError =
-    peg"{[^(]*} '(' {\d+} ', ' {\d+} ') ' ('Error') ':' \s* {.*}"
+    peg"{[^(]*} '(' {\d+} ', ' {\d+} ') ' ('Error' / 'Fatal') ':' \s* {.*}"
   pegOtherError = peg"'Error:' \s* {.*}"
   pegOfInterest = pegLineError / pegOtherError
 
diff --git a/tests/pragmas/tfatal.nim b/tests/pragmas/tfatal.nim
new file mode 100644
index 00000000000..89a607841f6
--- /dev/null
+++ b/tests/pragmas/tfatal.nim
@@ -0,0 +1,4 @@
+discard """
+  errormsg: "user message"
+"""
+{.fatal:"user message".}

From f99307697c55189d33da98dd165cb6d15559dd06 Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Tue, 23 Jul 2024 04:44:46 +0000
Subject: [PATCH 153/169] build(deps): Bump softprops/action-gh-release from
 2.0.6 to 2.0.8 (#1387)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bumps

[softprops/action-gh-release](https://github.com/softprops/action-gh-release)
from 2.0.6 to 2.0.8.
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a

href="https://github.com/softprops/action-gh-release/releases">softprops/action-gh-release's
releases</a>.</em></p>
<blockquote>
<h2>v2.0.8</h2>

<h2>What's Changed</h2>
<h3>Other Changes 🔄</h3>
<ul>
<li>chore(deps): bump prettier from 2.8.0 to 3.3.3 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/480">softprops/action-gh-release#480</a></li>
<li>chore(deps): bump <code>@​types/node</code> from 20.14.9 to 20.14.11
by <a href="https://github.com/dependabot"><code>@​dependabot</code></a>
in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/483">softprops/action-gh-release#483</a></li>
<li>chore(deps): bump <code>@​octokit/plugin-throttling</code> from
9.3.0 to 9.3.1 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/484">softprops/action-gh-release#484</a></li>
<li>chore(deps): bump glob from 10.4.2 to 11.0.0 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/477">softprops/action-gh-release#477</a></li>
<li>refactor: write jest config in ts by <a
href="https://github.com/chenrui333"><code>@​chenrui333</code></a> in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/485">softprops/action-gh-release#485</a></li>
<li>chore(deps): bump <code>@​actions/github</code> from 5.1.1 to 6.0.0
by <a href="https://github.com/dependabot"><code>@​dependabot</code></a>
in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/470">softprops/action-gh-release#470</a></li>
</ul>
<p><strong>Full Changelog</strong>: <a

href="https://github.com/softprops/action-gh-release/compare/v2...v2.0.8">https://github.com/softprops/action-gh-release/compare/v2...v2.0.8</a></p>
<h2>v2.0.7</h2>
<!-- raw HTML omitted -->
<h2>What's Changed</h2>
<h3>Bug fixes 🐛</h3>
<ul>
<li>Fix missing update release body by <a

href="https://github.com/FirelightFlagboy"><code>@​FirelightFlagboy</code></a>
in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/365">softprops/action-gh-release#365</a></li>
</ul>
<h3>Other Changes 🔄</h3>
<ul>
<li>Bump <code>@​octokit/plugin-retry</code> from 4.0.3 to 7.1.1 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/443">softprops/action-gh-release#443</a></li>
<li>Bump typescript from 4.9.5 to 5.5.2 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/467">softprops/action-gh-release#467</a></li>
<li>Bump <code>@​types/node</code> from 20.14.6 to 20.14.8 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/469">softprops/action-gh-release#469</a></li>
<li>Bump <code>@​types/node</code> from 20.14.8 to 20.14.9 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/473">softprops/action-gh-release#473</a></li>
<li>Bump typescript from 5.5.2 to 5.5.3 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/472">softprops/action-gh-release#472</a></li>
<li>Bump ts-jest from 29.1.5 to 29.2.2 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/479">softprops/action-gh-release#479</a></li>
<li>docs: document that existing releases are updated by <a
href="https://github.com/jvanbruegge"><code>@​jvanbruegge</code></a> in
<a

href="https://redirect.github.com/softprops/action-gh-release/pull/474">softprops/action-gh-release#474</a></li>
</ul>
<h2>New Contributors</h2>
<ul>
<li><a
href="https://github.com/jvanbruegge"><code>@​jvanbruegge</code></a>
made their first contribution in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/474">softprops/action-gh-release#474</a></li>
<li><a

href="https://github.com/FirelightFlagboy"><code>@​FirelightFlagboy</code></a>
made their first contribution in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/365">softprops/action-gh-release#365</a></li>
</ul>
<p><strong>Full Changelog</strong>: <a

href="https://github.com/softprops/action-gh-release/compare/v2.0.6...v2.0.7">https://github.com/softprops/action-gh-release/compare/v2.0.6...v2.0.7</a></p>
</blockquote>
</details>
<details>
<summary>Changelog</summary>
<p><em>Sourced from <a

href="https://github.com/softprops/action-gh-release/blob/master/CHANGELOG.md">softprops/action-gh-release's
changelog</a>.</em></p>
<blockquote>
<h2>2.0.8</h2>
<h3>Other Changes 🔄</h3>
<ul>
<li>chore(deps): bump prettier from 2.8.0 to 3.3.3 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/480">softprops/action-gh-release#480</a></li>
<li>chore(deps): bump <code>@​types/node</code> from 20.14.9 to 20.14.11
by <a href="https://github.com/dependabot"><code>@​dependabot</code></a>
in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/483">softprops/action-gh-release#483</a></li>
<li>chore(deps): bump <code>@​octokit/plugin-throttling</code> from
9.3.0 to 9.3.1 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/484">softprops/action-gh-release#484</a></li>
<li>chore(deps): bump glob from 10.4.2 to 11.0.0 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/477">softprops/action-gh-release#477</a></li>
<li>refactor: write jest config in ts by <a
href="https://github.com/chenrui333"><code>@​chenrui333</code></a> in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/485">softprops/action-gh-release#485</a></li>
<li>chore(deps): bump <code>@​actions/github</code> from 5.1.1 to 6.0.0
by <a href="https://github.com/dependabot"><code>@​dependabot</code></a>
in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/470">softprops/action-gh-release#470</a></li>
</ul>
<h2>2.0.7</h2>
<h3>Bug fixes 🐛</h3>
<ul>
<li>Fix missing update release body by <a

href="https://github.com/FirelightFlagboy"><code>@​FirelightFlagboy</code></a>
in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/365">softprops/action-gh-release#365</a></li>
</ul>
<h3>Other Changes 🔄</h3>
<ul>
<li>Bump <code>@​octokit/plugin-retry</code> from 4.0.3 to 7.1.1 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/443">softprops/action-gh-release#443</a></li>
<li>Bump typescript from 4.9.5 to 5.5.2 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/467">softprops/action-gh-release#467</a></li>
<li>Bump <code>@​types/node</code> from 20.14.6 to 20.14.8 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/469">softprops/action-gh-release#469</a></li>
<li>Bump <code>@​types/node</code> from 20.14.8 to 20.14.9 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/473">softprops/action-gh-release#473</a></li>
<li>Bump typescript from 5.5.2 to 5.5.3 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/472">softprops/action-gh-release#472</a></li>
<li>Bump ts-jest from 29.1.5 to 29.2.2 by <a
href="https://github.com/dependabot"><code>@​dependabot</code></a> in <a

href="https://redirect.github.com/softprops/action-gh-release/pull/479">softprops/action-gh-release#479</a></li>
<li>docs: document that existing releases are updated by <a
href="https://github.com/jvanbruegge"><code>@​jvanbruegge</code></a> in
<a

href="https://redirect.github.com/softprops/action-gh-release/pull/474">softprops/action-gh-release#474</a></li>
</ul>
</blockquote>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a

href="https://github.com/softprops/action-gh-release/commit/c062e08bd532815e2082a85e87e3ef29c3e6d191"><code>c062e08</code></a>
release 2.0.8</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/380635c4add9f3686733a9aee43912f1f16604d3"><code>380635c</code></a>
chore(deps): bump <code>@​actions/github</code> from 5.1.1 to 6.0.0 (<a

href="https://redirect.github.com/softprops/action-gh-release/issues/470">#470</a>)</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/20adb4259cc911c7d3ef4d10da2f13ca8ca2834c"><code>20adb42</code></a>
refactor: write jest config in ts (<a

href="https://redirect.github.com/softprops/action-gh-release/issues/485">#485</a>)</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/f808f15ba8f7c201fa6f1f90fd6bb18127b9ddb0"><code>f808f15</code></a>
chore(deps): bump glob from 10.4.2 to 11.0.0 (<a

href="https://redirect.github.com/softprops/action-gh-release/issues/477">#477</a>)</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/61452410498f83c1b46c544ed23ed73f060138c4"><code>6145241</code></a>
chore(deps): bump <code>@​octokit/plugin-throttling</code> from 9.3.0 to
9.3.1 (<a

href="https://redirect.github.com/softprops/action-gh-release/issues/484">#484</a>)</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/4ac522d0bd78af302662418619bc832457bdd0b9"><code>4ac522d</code></a>
chore(deps): bump <code>@​types/node</code> from 20.14.9 to 20.14.11 (<a

href="https://redirect.github.com/softprops/action-gh-release/issues/483">#483</a>)</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/25849b132669d3a5d6adf884362acdb69262f262"><code>25849b1</code></a>
chore(deps): bump prettier from 2.8.0 to 3.3.3 (<a

href="https://redirect.github.com/softprops/action-gh-release/issues/480">#480</a>)</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/62060560e321d3dcfb1ae338d2512fbd98ab3f24"><code>6206056</code></a>
chore: update dependabot commit msg</li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/39aadf190d216edf1be66954a199b7c8983f1d09"><code>39aadf1</code></a>
chore: run <code>frizbee actions .github/workflows/</code></li>
<li><a

href="https://github.com/softprops/action-gh-release/commit/6f3ab653231297c6e8410125a22784df62214f4e"><code>6f3ab65</code></a>
chore: update dist file</li>
<li>Additional commits viewable in <a

href="https://github.com/softprops/action-gh-release/compare/v2.0.6...v2.0.8">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility

score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=softprops/action-gh-release&package-manager=github_actions&previous-version=2.0.6&new-version=2.0.8)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase` .

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 .github/workflows/publisher.yml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/publisher.yml b/.github/workflows/publisher.yml
index 2a39c9265b6..6c2fc56d13d 100644
--- a/.github/workflows/publisher.yml
+++ b/.github/workflows/publisher.yml
@@ -103,7 +103,7 @@ jobs:
 
       - id: release
         name: Create pre-release
-        uses: softprops/action-gh-release@v2.0.6
+        uses: softprops/action-gh-release@v2.0.8
         with:
           prerelease: true
           files: ${{ steps.release-files.outputs.result }}
@@ -120,7 +120,7 @@ jobs:
           failOnError: true
 
       - name: Push changelog
-        uses: softprops/action-gh-release@v2.0.6
+        uses: softprops/action-gh-release@v2.0.8
         with:
           tag_name: ${{ steps.release-files.outputs.version }}
           body: ${{ steps.changelog.outputs.changelog }}

From a0d524bf8a3f655082c8b27bf1d1ad56b4607f1e Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Wed, 24 Jul 2024 19:53:23 +0200
Subject: [PATCH 154/169] mir: add a dedicated IR for types (#1382)

## Summary

* implement a dedicated type IR for the MIR and back-end phase
* use the new IR in parts of the C code generator
* use a new name mangling scheme for types that doesn't rely on
  signature hashes

## Details

The idea behind introducing a dedicated type IR for the MIR and back-
end phase is to:
* have a simpler and more regular IR during lowering and code
  generation
* decouple type lowering from code generation
* make `PType` solely used by `sem` and `transf`

The key ideas for the type IR are that:
* same ID (`HeaderId`) means same type; there are no duplicates like
  with `PType`
* transformations and code generation have easy access to the various
  stages of a type's representation (including the `PType`)
* lineage to `PType`s is kept track of

The current design likely covers more ground than it ultimately needs
to, but this was a deliberate choice in order to ease the transition to
the new IR.

### Translation

The lowering and/or fixes performed by `mirtypes` during the
translation of types are intended to exactly match what was previously
implemented in `ccgtypes`.

So that the IR is well-tested, all `PType`s entering `mirgen` are
translated to the IR representation.

### Code generation

Most of the existing code is still oblivious to the new type IR; only
the type emission in the C code generator uses it. Some analysis that was
previously performed on `PType`s is ported to operate on MIR type
descriptions.

The `mangling` module implements a semi-stable, reversible name
mangling for types. It's necessary since not all MIR types have an
originating-from `PType` (such as the internal payload type for `seq`s
and `string`s), meaning that the `sighash`-based mangling cannot be
used there.

### AST

Associating fields with names in the C code generator is now done via
the new type IR, meaning that the `locId` field on `TSym` is obsolete;
it's removed.

### Tests

* multiple `ccodecheck` tests are adjusted to `int` now translating to a
  sized integer instead of `NI`
* due to usage of the to-MIR-type-translation,
  `tempty_typed_expressions_issues.nim` now also fails for JS

---------

Co-authored-by: Saem Ghani <saemghani+github@gmail.com>
---
 compiler/ast/ast.nim                          |    2 +-
 compiler/ast/ast_types.nim                    |    2 -
 compiler/ast/types.nim                        |   29 +
 compiler/backend/ccgcalls.nim                 |   17 +-
 compiler/backend/ccgexprs.nim                 |   72 +-
 compiler/backend/ccgstmts.nim                 |    9 +-
 compiler/backend/ccgthreadvars.nim            |    1 -
 compiler/backend/ccgtypes.nim                 | 1111 ++++++++---------
 compiler/backend/cgen.nim                     |   49 +-
 compiler/backend/cgendata.nim                 |   60 +-
 compiler/backend/mangling.nim                 |  199 +++
 compiler/mir/mirgen.nim                       |   12 +-
 compiler/mir/mirtypes.nim                     | 1100 +++++++++++++++-
 compiler/mir/typemaps.nim                     |    6 +-
 tests/align/talign.nim                        |    8 +-
 tests/ccgbugs/tnoalias.nim                    |    4 +-
 .../tempty_typed_expressions_issues.nim       |    4 +-
 17 files changed, 1921 insertions(+), 764 deletions(-)
 create mode 100644 compiler/backend/mangling.nim

diff --git a/compiler/ast/ast.nim b/compiler/ast/ast.nim
index f0ad4625253..6436a1f5e5d 100644
--- a/compiler/ast/ast.nim
+++ b/compiler/ast/ast.nim
@@ -498,7 +498,7 @@ template transitionSymKindCommon*(k: TSymKind) =
   s[] = TSym(kind: k, itemId: obj.itemId, magic: obj.magic, typ: obj.typ, name: obj.name,
              info: obj.info, owner: obj.owner, flags: obj.flags, ast: obj.ast,
              options: obj.options, position: obj.position, offset: obj.offset,
-             extname: obj.extname, extFlags: obj.extFlags, locId: obj.locId,
+             extname: obj.extname, extFlags: obj.extFlags,
              annex: obj.annex, constraint: obj.constraint)
   when defined(nimsuggest):
     s.allUsages = obj.allUsages
diff --git a/compiler/ast/ast_types.nim b/compiler/ast/ast_types.nim
index e73893ba4fa..e3eead924da 100644
--- a/compiler/ast/ast_types.nim
+++ b/compiler/ast/ast_types.nim
@@ -1723,8 +1723,6 @@ type
                               ## generated name is to be used
     extFlags*: ExternalFlags  ## additional flags that are relevant to code
                               ## generation
-    locId*: uint32            ## associates the symbol with a loc in the C code
-                              ## generator. 0 means unset.
     annex*: LibId             ## additional fields (seldom used, so we use a
                               ## reference to another object to save space)
     constraint*: PNode        ## additional constraints like 'lit|result'; also
diff --git a/compiler/ast/types.nim b/compiler/ast/types.nim
index e2b137e0d19..9bb6c072301 100644
--- a/compiler/ast/types.nim
+++ b/compiler/ast/types.nim
@@ -1557,3 +1557,32 @@ proc classifyBackendView*(t: PType): BackendViewKind =
      tyGenericParam, tyForward, tyBuiltInTypeClass, tyCompositeTypeClass,
      tyAnd, tyOr, tyNot, tyAnything, tyFromExpr:
     unreachable()
+
+proc isPassByRef*(conf: ConfigRef; s: PSym, retType: PType): bool =
+  var pt = skipTypes(s.typ, typedescInst)
+  assert skResult != s.kind
+
+  if tfByRef in pt.flags: return true
+  elif tfByCopy in pt.flags: return false
+  case pt.kind
+  of tyObject:
+    if s.typ.sym != nil and sfForward in s.typ.sym.flags:
+      # forwarded objects are *always* passed by pointers for consistency!
+      result = true
+    elif (optByRef in s.options) or (getSize(conf, pt) > conf.target.floatSize * 3):
+      result = true           # requested anyway
+    elif (tfFinal in pt.flags) and (pt[0] == nil):
+      result = false          # no need, because no subtyping possible
+    else:
+      result = true           # ordinary objects are always passed by reference,
+                              # otherwise casting doesn't work
+  of tyTuple:
+    result = (getSize(conf, pt) > conf.target.floatSize*3) or (optByRef in s.options)
+  else:
+    result = false
+
+  # first parameter and return type is 'lent T'? --> use pass by pointer if
+  # not already a pointer-like type
+  if s.position == 0 and retType != nil and retType.kind == tyLent:
+    result = pt.kind notin {tyVar, tyOpenArray, tyVarargs, tyRef, tyPtr,
+                            tyPointer}
diff --git a/compiler/backend/ccgcalls.nim b/compiler/backend/ccgcalls.nim
index c1a7ecba453..2c7d67bd3b4 100644
--- a/compiler/backend/ccgcalls.nim
+++ b/compiler/backend/ccgcalls.nim
@@ -44,7 +44,7 @@ proc fixupCall(p: BProc, le, ri: CgNode, d: var TLoc,
   # getUniqueType() is too expensive here:
   var typ = skipTypes(ri[0].typ, abstractInst)
   if typ[0] != nil:
-    if isInvalidReturnType(p.config, typ[0]):
+    if isInvalidReturnType(p.module, typ[0]):
       if params != "": pl.add(~", ")
       # the destination is guaranteed to be either a temporary or an lvalue
       # that can be modified in-place
@@ -53,7 +53,7 @@ proc fixupCall(p: BProc, le, ri: CgNode, d: var TLoc,
         # procedure
         if d.k == locNone:
           getTemp(p, typ[0], d)
-        pl.add(addrLoc(p.config, d))
+        pl.add(addrLoc(p.module, d))
         pl.add(~");$n")
         line(p, cpsStmts, pl)
         exitCall(p, ri)
@@ -105,6 +105,7 @@ proc genOpenArraySlice(p: BProc; q: CgNode; formalType, destType: PType): (Rope,
     result = ("($3*)($1)+($2)" % [rdLoc(a), rdLoc(b), dest],
               lengthExpr)
   of tyString, tySequence:
+    requestFullDesc(p.module, a.t)
     let atyp = skipTypes(a.t, abstractInst)
     if atyp.kind in {tyVar}:
       result = ("((*$1).p != NIM_NIL ? ($4*)(*$1)$3+$2 : NIM_NIL)" %
@@ -139,12 +140,12 @@ proc genArg(p: BProc, n: CgNode, param: PSym; call: CgNode): Rope =
       result = "$1.Field0, $1.Field1" % [rdLoc(a)]
     else:
       result = "$1, $1Len_0" % [rdLoc(a)]
-  elif ccgIntroducedPtr(p.config, param, call[0].typ[0]):
+  elif ccgIntroducedPtr(p.module, param, call[0].typ[0]):
     initLocExpr(p, n, a)
     if n.kind in cnkLiterals + {cnkNilLit}:
-      result = addrLoc(p.config, literalsNeedsTmp(p, a))
+      result = addrLoc(p.module, literalsNeedsTmp(p, a))
     else:
-      result = addrLoc(p.config, a)
+      result = addrLoc(p.module, a)
   else:
     initLocExprSingleUse(p, n, a)
     result = rdLoc(a)
@@ -206,9 +207,9 @@ proc genClosureCall(p: BProc, le, ri: CgNode, d: var TLoc) =
     else:
       lineF(p, cpsStmts, PatProc & ";$n", [rdLoc(op), pl, pl.addComma, rawProc])
 
-  let rawProc = getClosureType(p.module, typ, clHalf)
+  let rawProc = getClosureType(p.module, ri[0].typ, clHalf)
   if typ[0] != nil:
-    if isInvalidReturnType(p.config, typ[0]):
+    if isInvalidReturnType(p.module, typ[0]):
       if numArgs(ri) > 0: pl.add(~", ")
       # the destination is guaranteed to be either a temporary or an lvalue
       # that can be modified in-place
@@ -217,7 +218,7 @@ proc genClosureCall(p: BProc, le, ri: CgNode, d: var TLoc) =
         # procedure
         if d.k == locNone:
           getTemp(p, typ[0], d)
-        pl.add(addrLoc(p.config, d))
+        pl.add(addrLoc(p.module, d))
         genCallPattern()
         exitCall(p, ri)
     else:
diff --git a/compiler/backend/ccgexprs.nim b/compiler/backend/ccgexprs.nim
index 365138bb9a8..34717bd7b71 100644
--- a/compiler/backend/ccgexprs.nim
+++ b/compiler/backend/ccgexprs.nim
@@ -129,6 +129,7 @@ proc genOpenArrayConv(p: BProc; d: TLoc; a: TLoc) =
       linefmt(p, cpsStmts, "$1.Field0 = $2; $1.Field1 = $2Len_0;$n",
         [rdLoc(d), a.rdLoc])
   of tySequence, tyString:
+    requestFullDesc(p.module, a.t)
     linefmt(p, cpsStmts, "$1.Field0 = ($2.p != NIM_NIL ? $2$3 : NIM_NIL); $1.Field1 = $4;$n",
       [rdLoc(d), a.rdLoc, dataField(p), lenExpr(p, a)])
   of tyArray:
@@ -140,7 +141,7 @@ proc genOpenArrayConv(p: BProc; d: TLoc; a: TLoc) =
 proc genAssignment(p: BProc, dest, src: TLoc) =
   # This function replaces all other methods for generating
   # the assignment operation in C.
-  case mapType(p.config, dest.t)
+  case mapType(p.module, dest.t)
   of ctChar, ctBool, ctInt, ctInt8, ctInt16, ctInt32, ctInt64,
      ctFloat, ctFloat32, ctFloat64,
      ctUInt, ctUInt8, ctUInt16, ctUInt32, ctUInt64,
@@ -166,7 +167,7 @@ proc genAssignment(p: BProc, dest, src: TLoc) =
     #writeStackTrace()
     #echo p.currLineInfo, " requesting"
     linefmt(p, cpsStmts, "#memTrackerWrite((void*)$1, $2, $3, $4);$n",
-            [addrLoc(p.config, dest), getSize(p.config, dest.t),
+            [addrLoc(p.module, dest), getSize(p.config, dest.t),
             makeCString(toFullPath(p.config, p.currLineInfo)),
             p.currLineInfo.safeLineNm])
 
@@ -176,25 +177,25 @@ proc genDeepCopy(p: BProc; dest, src: TLoc) =
       var tmp: TLoc
       getTemp(p, a.t, tmp)
       genAssignment(p, tmp, a)
-      addrLoc(p.config, tmp)
+      addrLoc(p.module, tmp)
     else:
-      addrLoc(p.config, a)
+      addrLoc(p.module, a)
 
   var ty = skipTypes(dest.t, abstractVarRange + {tyStatic})
   case ty.kind
   of tyPtr, tyRef, tyProc, tyTuple, tyObject, tyArray:
     # XXX optimize this
     linefmt(p, cpsStmts, "#genericDeepCopy((void*)$1, (void*)$2, $3);$n",
-            [addrLoc(p.config, dest), addrLocOrTemp(src),
+            [addrLoc(p.module, dest), addrLocOrTemp(src),
             genTypeInfoV1(p.module, dest.t, dest.lode.info)])
   of tySequence, tyString:
     linefmt(p, cpsStmts, "#genericDeepCopy((void*)$1, (void*)$2, $3);$n",
-            [addrLoc(p.config, dest), addrLocOrTemp(src),
+            [addrLoc(p.module, dest), addrLocOrTemp(src),
             genTypeInfoV1(p.module, dest.t, dest.lode.info)])
   of tyOpenArray, tyVarargs:
     linefmt(p, cpsStmts,
          "#genericDeepCopyOpenArray((void*)$1, (void*)$2, $1Len_0, $3);$n",
-         [addrLoc(p.config, dest), addrLocOrTemp(src),
+         [addrLoc(p.module, dest), addrLocOrTemp(src),
          genTypeInfoV1(p.module, dest.t, dest.lode.info)])
   of tySet:
     if mapSetType(p.config, ty) == ctArray:
@@ -396,7 +397,7 @@ proc unaryArith(p: BProc, e, x: CgNode, d: var TLoc, op: TMagic) =
 proc genDeref(p: BProc, e: CgNode, d: var TLoc) =
   let
     src = e.operand
-    mt = mapType(p.config, src.typ)
+    mt = mapType(p.module, src.typ)
   if mt in {ctArray, ctPtrToArray} and lfEnforceDeref notin d.flags:
     # XXX the amount of hacks for C's arrays is incredible, maybe we should
     # simply wrap them in a struct? --> Losing auto vectorization then?
@@ -438,14 +439,14 @@ proc genDeref(p: BProc, e: CgNode, d: var TLoc) =
       putIntoDest(p, d, e, "(*$1)" % [rdLoc(a)], a.storage)
 
 proc genAddr(p: BProc, e: CgNode, d: var TLoc) =
-  if mapType(p.config, e.operand.typ) == ctArray:
+  if mapType(p.module, e.operand.typ) == ctArray:
     expr(p, e.operand, d)
   else:
     var a: TLoc
     initLoc(a, locNone, e.operand, OnUnknown)
     a.flags.incl lfWantLvalue
     expr(p, e.operand, a)
-    putIntoDest(p, d, e, addrLoc(p.config, a), a.storage)
+    putIntoDest(p, d, e, addrLoc(p.module, a), a.storage)
 
 template inheritLocation(d: var TLoc, a: TLoc) =
   if d.k == locNone: d.storage = a.storage
@@ -469,33 +470,22 @@ proc genTupleElem(p: BProc, e: CgNode, d: var TLoc) =
   r.addf(".Field$1", [rope(e[1].intVal)])
   putIntoDest(p, d, e, r, a.storage)
 
-proc lookupFieldAgain(p: BProc, ty: PType; field: PSym; r: var Rope;
-                      resTyp: ptr PType = nil): PSym =
-  var ty = ty
-  assert r != ""
-  while ty != nil:
-    ty = ty.skipTypes(skipPtrs)
-    assert ty.kind == tyObject
-    result = lookupInRecord(ty.n, field.name)
-    if result != nil:
-      if resTyp != nil: resTyp[] = ty
-      break
-    r.add(".Sup")
-    ty = ty[0]
-  if result == nil: internalError(p.config, field.info, "genCheckedRecordField")
+proc handleSupAccess(types: TypeEnv, ty: PType; field: PSym; r: var Rope) =
+  let depth = computeDepth(types, types.headerFor(types[ty], Canonical),
+                           field.position.int32)
+  for _ in 0..<depth:
+    r.add ".Sup"
 
 proc genRecordField(p: BProc, e: CgNode, d: var TLoc) =
   var a: TLoc
   genRecordFieldAux(p, e, d, a)
   var r = rdLoc(a)
-  var f = e[1].field
+  let f = e[1].field
   let ty = skipTypes(a.t, abstractInst + tyUserTypeClasses)
   p.config.internalAssert(ty.kind == tyObject, e[0].info)
   if true:
-    var rtyp: PType
-    let field = lookupFieldAgain(p, ty, f, r, addr rtyp)
-    ensureObjectFields(p.module, field, rtyp)
-    r.addf(".$1", [p.fieldName(field)])
+    handleSupAccess(p.module.types, ty, f, r)
+    r.addf(".$1", [p.fieldName(ty, f)])
     putIntoDest(p, d, e, r, a.storage)
 
 proc genUncheckedArrayElem(p: BProc, n, x, y: CgNode, d: var TLoc) =
@@ -574,6 +564,7 @@ proc genSeqElem(p: BProc, n, x, y: CgNode, d: var TLoc) =
   var a, b: TLoc
   initLocExpr(p, x, a)
   initLocExpr(p, y, b)
+  requestFullDesc(p.module, a.t)
   var ty = skipTypes(a.t, abstractVarRange)
   if ty.kind in {tyRef, tyPtr}:
     ty = skipTypes(ty.lastSon, abstractVarRange)
@@ -742,8 +733,7 @@ proc specializeInitObjectN(p: BProc, accessor: Rope, n: PNode, typ: PType) =
     p.config.internalAssert(n[0].kind == nkSym, n.info,
                             "specializeInitObjectN")
     let disc = n[0].sym
-    ensureObjectFields(p.module, disc, typ)
-    lineF(p, cpsStmts, "switch ($1.$2) {$n", [accessor, p.fieldName(disc)])
+    lineF(p, cpsStmts, "switch ($1.$2) {$n", [accessor, p.fieldName(typ, disc)])
     for i in 1..<n.len:
       let branch = n[i]
       assert branch.kind in {nkOfBranch, nkElse}
@@ -757,8 +747,7 @@ proc specializeInitObjectN(p: BProc, accessor: Rope, n: PNode, typ: PType) =
   of nkSym:
     let field = n.sym
     if field.typ.kind == tyVoid: return
-    ensureObjectFields(p.module, field, typ)
-    specializeInitObject(p, "$1.$2" % [accessor, p.fieldName(field)],
+    specializeInitObject(p, "$1.$2" % [accessor, p.fieldName(typ, field)],
                          field.typ, n.info)
   else: internalError(p.config, n.info, "specializeInitObjectN()")
 
@@ -854,10 +843,9 @@ proc genObjConstr(p: BProc, e: CgNode, d: var TLoc) =
   for it in e.items:
     var tmp2: TLoc
     tmp2.r = r
-    let field = lookupFieldAgain(p, ty, it[0].field, tmp2.r)
-    ensureObjectFields(p.module, field, ty)
+    handleSupAccess(p.module.types, ty, it[0].field, tmp2.r)
     tmp2.r.add(".")
-    tmp2.r.add(p.fieldName(field))
+    tmp2.r.add(p.fieldName(ty, it[0].field))
     tmp2.k = d.k
     tmp2.storage = d.storage
     tmp2.lode = it[1]
@@ -1209,7 +1197,7 @@ proc genSomeCast(p: BProc, e: CgNode, d: var TLoc) =
   let srcTyp = skipTypes(src.typ, abstractRange)
   if etyp.kind in ValueTypes and lfIndirect notin a.flags:
     putIntoDest(p, d, e, "(*($1*) ($2))" %
-        [getTypeDesc(p.module, e.typ), addrLoc(p.config, a)], a.storage)
+        [getTypeDesc(p.module, e.typ), addrLoc(p.module, a)], a.storage)
   elif etyp.kind == tyProc and etyp.callConv == ccClosure and srcTyp.callConv != ccClosure:
     putIntoDest(p, d, e, "(($1) ($2))" %
         [getClosureType(p.module, etyp, clHalfWithEnv), rdCharLoc(a)], a.storage)
@@ -1284,6 +1272,7 @@ proc genDestroy(p: BProc; n: CgNode) =
     let t = arg.typ.skipTypes(abstractInst)
     case t.kind
     of tyString:
+      requestFullDesc(p.module, arg.typ)
       var a: TLoc
       initLocExpr(p, arg, a)
       if optThreads in p.config.globalOptions:
@@ -1295,6 +1284,7 @@ proc genDestroy(p: BProc; n: CgNode) =
           " #dealloc($1.p);$n" &
           "}$n", [rdLoc(a)])
     of tySequence:
+      requestFullDesc(p.module, arg.typ)
       var a: TLoc
       initLocExpr(p, arg, a)
       linefmt(p, cpsStmts, "if ($1.p && !($1.p->cap & NIM_STRLIT_FLAG)) {$n" &
@@ -1377,7 +1367,7 @@ proc genMagicExpr(p: BProc, e: CgNode, d: var TLoc, op: TMagic) =
     let member =
       if dotExpr.kind == cnkTupleAccess:
         "Field" & rope(dotExpr[1].intVal)
-      else: p.fieldName(dotExpr[1].field)
+      else: p.fieldName(dotExpr[0].typ, dotExpr[1].field)
     putIntoDest(p,d,e, "((NI)offsetof($1, $2))" % [tname, member])
   of mChr: genSomeCast(p, e, d)
   of mOrd: genOrd(p, e, d)
@@ -1566,14 +1556,14 @@ proc downConv(p: BProc, n: CgNode, d: var TLoc) =
     if lfWantLvalue in d.flags:
       putIntoDest(p, d, n,
                 "(($1*) ($2))" % [getTypeDesc(p.module, n.typ),
-                                  addrLoc(p.config, a)], a.storage)
+                                  addrLoc(p.module, a)], a.storage)
       d.flags.incl lfIndirect
     else:
       putIntoDest(p, d, n,
                 "(($1) ($2))" % [getTypeDesc(p.module, n.typ), rdLoc(a)], a.storage)
   else:
     putIntoDest(p, d, n, "(*($1*) ($2))" %
-                        [getTypeDesc(p.module, dest), addrLoc(p.config, a)], a.storage)
+                        [getTypeDesc(p.module, dest), addrLoc(p.module, a)], a.storage)
 
 proc upConv(p: BProc, n: CgNode, d: var TLoc) =
   ## Generates and emits the code for the ``cnkObjUpConv`` (conversion to
@@ -1591,7 +1581,7 @@ proc upConv(p: BProc, n: CgNode, d: var TLoc) =
     # expression and then cast the pointer:
     putIntoDest(p, d, n,
                 "(($1*) ($2))" % [getTypeDesc(p.module, n.typ),
-                                  addrLoc(p.config, a)],
+                                  addrLoc(p.module, a)],
                 a.storage)
     # an indirection is used:
     d.flags.incl lfIndirect
diff --git a/compiler/backend/ccgstmts.nim b/compiler/backend/ccgstmts.nim
index 7e49197cea6..6e16b590c6a 100644
--- a/compiler/backend/ccgstmts.nim
+++ b/compiler/backend/ccgstmts.nim
@@ -305,7 +305,7 @@ proc genExcept(p: BProc, n: CgNode) =
   # setup the handler frame:
   var tmp: TLoc
   getTemp(p, p.module.g.graph.getCompilerProc("ExceptionFrame").typ, tmp)
-  lineCg(p, cpsStmts, "#nimCatchException($1);$n", [addrLoc(p.config, tmp)])
+  lineCg(p, cpsStmts, "#nimCatchException($1);$n", [addrLoc(p.module, tmp)])
 
 proc genAsmOrEmitStmt(p: BProc, t: CgNode, isAsmStmt=false): Rope =
   var res = ""
@@ -317,9 +317,10 @@ proc genAsmOrEmitStmt(p: BProc, t: CgNode, isAsmStmt=false): Rope =
         let sym = it.astLit.sym
         # special support for raw field symbols
         discard getTypeDesc(p.module, skipTypes(sym.typ, abstractPtrs))
-        p.config.internalAssert(sym.locId != 0, it.info):
-          "field's surrounding type not setup"
-        res.add(p.fieldName(sym))
+        # make sure the owner was generated, so that the field's mangled name
+        # is available
+        discard getTypeDesc(p.module, sym.owner.typ)
+        res.add(p.fieldName(sym.owner.typ, sym))
     of cnkLocal:
       # make sure the C type description is available:
       discard getTypeDesc(p.module, skipTypes(it.typ, abstractPtrs))
diff --git a/compiler/backend/ccgthreadvars.nim b/compiler/backend/ccgthreadvars.nim
index b3398f65d89..ad96e396e5f 100644
--- a/compiler/backend/ccgthreadvars.nim
+++ b/compiler/backend/ccgthreadvars.nim
@@ -44,7 +44,6 @@ proc declareThreadVar*(m: BModule, id: GlobalId, isExtern: bool) =
 proc generateThreadLocalStorage(m: BModule) =
   if m.g.nimtv != "" and (usesThreadVars in m.flags or sfMainModule in m.module.flags):
     for t in items(m.g.nimtvDeps): discard getTypeDesc(m, t)
-    finishTypeDescriptions(m)
     m.s[cfsSeqTypes].addf("typedef struct {$1} NimThreadVars;$n", [m.g.nimtv])
 
 proc generateThreadVarsSize(m: BModule) =
diff --git a/compiler/backend/ccgtypes.nim b/compiler/backend/ccgtypes.nim
index 69d0571f112..4d6c58c5276 100644
--- a/compiler/backend/ccgtypes.nim
+++ b/compiler/backend/ccgtypes.nim
@@ -22,6 +22,11 @@ proc isKeyword(w: PIdent): bool =
      ord(wInline): return true
   else: return false
 
+proc mangleField(m: BModule; name: string): string =
+  result = mangle(name)
+  if isKeyword(m.g.graph.cache.getIdent(name)):
+    result.add "_0"
+
 proc mangleField(m: BModule; name: PIdent): string =
   result = mangle(name.s)
   # fields are tricky to get right and thanks to generic types producing
@@ -80,28 +85,8 @@ const
                           tyDistinct, tyRange, tyStatic, tyAlias, tySink,
                           tyInferred}
 
-proc typeName(typ: PType): Rope =
-  let typ = typ.skipTypes(irrelevantForBackend)
-  result =
-    if typ.sym != nil and typ.kind in {tyObject, tyEnum}:
-      rope($typ.kind & '_' & typ.sym.name.s.mangle)
-    else:
-      rope($typ.kind)
-
-proc getTypeName(m: BModule; typ: PType; sig: SigHash): Rope =
-  var t = typ
-  while true:
-    if t.sym != nil and {sfImportc, sfExportc} * t.sym.flags != {}:
-      return t.sym.extname
-
-    if t.kind in irrelevantForBackend:
-      t = t.lastSon
-    else:
-      break
-  let typ = if typ.kind in {tyAlias, tySink}: typ.lastSon else: typ
-  result = typ.typeName & $sig
-
 proc mapSetType(conf: ConfigRef; typ: PType): TCTypeKind =
+  ## Legacy procedure.
   case int(getSize(conf, typ))
   of 1: result = ctInt8
   of 2: result = ctInt16
@@ -109,73 +94,140 @@ proc mapSetType(conf: ConfigRef; typ: PType): TCTypeKind =
   of 8: result = ctInt64
   else: result = ctArray
 
-proc mapType(conf: ConfigRef; typ: PType): TCTypeKind =
-  ## Maps a Nim type to a C type
-  case typ.kind
-  of tyNone, tyTyped: result = ctVoid
-  of tyBool: result = ctBool
-  of tyChar: result = ctChar
-  of tyNil: result = ctPtr
-  of tySet: result = mapSetType(conf, typ)
-  of tyOpenArray, tyVarargs:
-    result = ctNimOpenArray
-  of tyArray, tyUncheckedArray: result = ctArray
-  of tyObject, tyTuple: result = ctStruct
-  of tyUserTypeClasses:
-    doAssert typ.isResolvedUserTypeClass
-    return mapType(conf, typ.lastSon)
-  of tyGenericBody, tyGenericInst, tyGenericParam, tyDistinct, tyOrdinal,
-     tyTypeDesc, tyAlias, tySink, tyInferred, tyEnum:
-    result = mapType(conf, lastSon(typ))
-  of tyRange: result = mapType(conf, typ[0])
-  of tyPtr, tyVar, tyLent, tyRef:
-    var base = skipTypes(typ.lastSon, typedescInst)
-    case base.kind
-    of tyArray, tyUncheckedArray: result = ctPtrToArray
-    of tyOpenArray, tyVarargs:
-      result = ctNimOpenArray
-    of tySet:
-      if mapSetType(conf, base) == ctArray: result = ctPtrToArray
-      else: result = ctPtr
-    else: result = ctPtr
-  of tyPointer: result = ctPtr
-  of tySequence: result = ctNimSeq
-  of tyProc: result = if typ.callConv != ccClosure: ctProc else: ctStruct
-  of tyString: result = ctNimStr
-  of tyCstring: result = ctCString
-  of tyInt..tyUInt64:
-    result = TCTypeKind(ord(typ.kind) - ord(tyInt) + ord(ctInt))
-  of tyStatic:
-    if typ.n != nil: result = mapType(conf, lastSon typ)
-    else: doAssert(false, "mapType: " & $typ.kind)
-  else: doAssert(false, "mapType: " & $typ.kind)
+proc mapType(types: TypeEnv, typ: TypeId): TCTypeKind
+
+proc mapType(types: TypeEnv; desc: TypeHeader): TCTypeKind =
+  ## Maps a NimSkull type to the corresponding C type.
+  case desc.kind
+  of tkIndirect, tkImported:
+    mapType(types, desc.elem)
+  of tkVoid: ctVoid
+  of tkBool: ctBool
+  of tkChar: ctChar
+  of tkInt:
+    case desc.size(types)
+    of 1: ctInt8
+    of 2: ctInt16
+    of 4: ctInt32
+    of 8: ctInt64
+    else: unreachable()
+  of tkUInt:
+    case desc.size(types)
+    of 1: ctUInt8
+    of 2: ctUInt16
+    of 4: ctUInt32
+    of 8: ctUInt64
+    else: unreachable()
+  of tkFloat:
+    case desc.size(types)
+    of 4: ctFloat32
+    of 8: ctFloat64
+    else: unreachable()
+  of tkArray, tkUncheckedArray:
+    ctArray
+  of tkRecord, tkUnion:
+    ctStruct
+  of tkPtr, tkRef, tkLent, tkVar:
+    case mapType(types, desc.elem)
+    of ctArray:
+      ctPtrToArray
+    else:
+      ctPtr
+  of tkPointer: ctPtr
+  of tkProc: ctProc
+  of tkCstring: ctCString
+  # handling of the non-lowered types follows:
+  # XXX: this needs to eventually be removed; the whole code generator needs
+  #      to only operate on the lowered types
+  of tkSet:
+    case desc.size(types)
+    of 1: ctInt8
+    of 2: ctInt16
+    of 4: ctInt32
+    of 8: ctInt64
+    else: ctArray
+  of tkOpenArray: ctNimOpenArray
+  of tkSeq:       ctNimSeq
+  of tkString:    ctNimStr
+  of tkClosure:   ctStruct
+  else:
+    unreachable(desc.kind)
+
+proc mapType(types: TypeEnv, typ: TypeId): TCTypeKind =
+  mapType(types, types.headerFor(typ, Original))
+
+proc mapType(m: BModule; typ: PType): TCTypeKind =
+  ## Legacy procedure. Bridges the old to the new types.
+  let id = m.addLate(typ)
+  mapType(m.types, id)
 
-proc mapReturnType(conf: ConfigRef; typ: PType): TCTypeKind =
+proc mapReturnType(m: BModule; typ: PType): TCTypeKind =
   #if skipTypes(typ, typedescInst).kind == tyArray: result = ctPtr
   #else:
-  result = mapType(conf, typ)
+  result = mapType(m, typ)
+
+proc getTypeDesc(m: BModule, typ: PType): Rope
+proc useType(m: BModule, typ: TypeId, desc: TypeHeader; onlyName = false): Rope
+
+proc containsGarbageCollectedRef(env: TypeEnv, typ: TypeId): bool =
+  ## Computes whether `typ` is or contains a garbage-collected type.
+  let n = env.get(typ).desc[Canonical]
+  case env[n].kind
+  of tkRef, tkClosure:
+    result = true
+  of tkArray:
+    result = containsGarbageCollectedRef(env, env[n].elem)
+  of tkRecord:
+    var rec = typ
+    # traverse the object hierarchy:
+    while rec != VoidType:
+      for (_, f) in env.fields(env.headerFor(rec, Canonical)):
+        # is the field a garbage-collected reference?
+        if containsGarbageCollectedRef(env, f.typ):
+          return true
+
+      rec = env.headerFor(rec, Canonical).base(env)
 
-proc isImportedType(t: PType): bool =
-  result = t.sym != nil and sfImportc in t.sym.flags
-
-proc getTypeDescAux(m: BModule, origTyp: PType, check: var IntSet): Rope
+    result = false
+  else:
+    # neither an aggregate type nor a garbage-collected ref
+    result = false
 
-proc isInvalidReturnType(conf: ConfigRef; rettype: PType): bool =
-  # Arrays and sets cannot be returned by a C procedure, because C is
+proc usesRvo(types: TypeEnv, typ: TypeId): bool =
+  ## Computes for the record type `typ` whether it uses the return-value
+  ## optimization.
+  # seek to the root type in the inheritance hierarchy:
+  var base = typ
+  while (let next = types.headerFor(base, Lowered).base(types);
+         next != VoidType):
+    base = next
+
+  # does the type have a RTTI header? does the record have a garbage-collected
+  # field?
+  # XXX: these rules originate from the refc days, where they were important
+  #      for efficiency. This is no longer the case, and it'd make sense to
+  #      make usage of RVO dependent on the *size* of the type instead
+  result = types.headerFor(base, Lowered).fieldOffset(types) == -1 or
+           containsGarbageCollectedRef(types, typ)
+
+proc isInvalidReturnType(types: TypeEnv; typ: TypeId): bool =
+  # Arrays cannot be returned by a C procedure, because C is
   # such a poor programming language.
   # We exclude records with refs too. This enhances efficiency.
   # keep synchronized with ``mirpasses.eligibleForRvo``
-  if rettype == nil: result = true
+  let typ = types.canonical(typ)
+  case types.headerFor(typ, Lowered).kind
+  of tkArray:  true
+  of tkRecord: usesRvo(types, typ)
+  else:        false
+
+proc isInvalidReturnType(m: BModule; rettype: PType): bool =
+  ## Legacy procedure; only exists for bridging the old to the new code.
+  if rettype.isNil:
+    false # nil stands for void, which is a valid return type
   else:
-    case mapType(conf, rettype)
-    of ctArray:
-      result = not (skipTypes(rettype, typedescInst).kind in
-          {tyVar, tyLent, tyRef, tyPtr})
-    of ctStruct:
-      let t = skipTypes(rettype, typedescInst)
-      result = containsGarbageCollectedRef(t) or
-          (t.kind == tyObject and not isObjLackingTypeField(t))
-    else: result = false
+    let id = m.addLate(rettype)
+    isInvalidReturnType(m.types, id)
 
 const
   CallingConvToStr: array[TCallingConvention, string] = ["N_NIMCALL",
@@ -184,12 +236,6 @@ const
                  # but one can #define it to what one wants
     "N_INLINE", "N_NOINLINE", "N_FASTCALL", "N_CLOSURE", "N_NOCONV"]
 
-proc cacheGetType(tab: TypeCache; sig: SigHash): Rope =
-  # returns nil if we need to declare this type
-  # since types are now unique via the ``getUniqueType`` mechanism, this slow
-  # linear search is not necessary anymore:
-  result = tab.getOrDefault(sig)
-
 proc addAbiCheck(m: BModule, t: PType, name: Rope) =
   if isDefined(m.config, "checkAbi") and (let size = getSize(m.config, t); size != szUnknownSize):
     var msg = "backend & Nim disagree on size for: "
@@ -199,145 +245,63 @@ proc addAbiCheck(m: BModule, t: PType, name: Rope) =
     m.s[cfsTypeInfo].addf("NIM_STATIC_ASSERT(sizeof($1) == $2, $3);$n", [name, rope(size), msg2.rope])
     # see `testCodegenABICheck` for example error message it generates
 
-proc ccgIntroducedPtr(conf: ConfigRef; s: PSym, retType: PType): bool =
-  var pt = skipTypes(s.typ, typedescInst)
-  assert skResult != s.kind
-
-  if tfByRef in pt.flags: return true
-  elif tfByCopy in pt.flags: return false
-  case pt.kind
-  of tyObject:
-    if s.typ.sym != nil and sfForward in s.typ.sym.flags:
-      # forwarded objects are *always* passed by pointers for consistency!
-      result = true
-    elif (optByRef in s.options) or (getSize(conf, pt) > conf.target.floatSize * 3):
-      result = true           # requested anyway
-    elif (tfFinal in pt.flags) and (pt[0] == nil):
-      result = false          # no need, because no subtyping possible
-    else:
-      result = true           # ordinary objects are always passed by reference,
-                              # otherwise casting doesn't work
-  of tyTuple:
-    result = (getSize(conf, pt) > conf.target.floatSize*3) or (optByRef in s.options)
-  else:
-    result = false
-  # first parameter and return type is 'lent T'? --> use pass by pointer
-  if s.position == 0 and retType != nil and retType.kind == tyLent:
-    result = not (pt.kind in {tyVar, tyArray, tyOpenArray, tyVarargs, tyRef, tyPtr, tyPointer} or
-      pt.kind == tySet and mapSetType(conf, pt) == ctArray)
+proc ccgIntroducedPtr(m: BModule; s: PSym, retType: PType): bool =
+  isPassByRef(m.config, s, retType) and mapType(m, s.typ) != ctArray
 
-proc initResultParamLoc(conf: ConfigRef; param: CgNode): TLoc =
+proc initResultParamLoc(m: BModule; param: CgNode): TLoc =
   result = initLoc(locParam, param, "Result", OnStack)
   let t = param.typ
-  if mapReturnType(conf, t) != ctArray and isInvalidReturnType(conf, t):
+  if mapReturnType(m, t) != ctArray and isInvalidReturnType(m, t):
     incl(result.flags, lfIndirect)
     result.storage = OnUnknown
 
-proc typeNameOrLiteral(m: BModule; t: PType, literal: string): Rope =
-  if t.sym != nil and sfImportc in t.sym.flags and t.sym.magic == mNone:
-    useHeader(m, t.sym)
-    result = t.sym.extname
-  else:
-    result = rope(literal)
+proc useType(m: BModule, typ: TypeId; onlyName = false): Rope =
+  useType(m, typ, m.types.headerFor(typ, Lowered), onlyName)
 
 proc getSimpleTypeDesc(m: BModule, typ: PType): Rope =
-  const
-    NumericalTypeToStr: array[tyInt..tyUInt64, string] = [
-      "NI", "NI8", "NI16", "NI32", "NI64",
-      "NF", "NF32", "NF64",
-      "NU", "NU8", "NU16", "NU32", "NU64"]
-  case typ.kind
-  of tyPointer:
-    result = typeNameOrLiteral(m, typ, "void*")
-  of tyString:
-    discard cgsym(m, "NimStrPayload")
-    discard cgsym(m, "NimStringV2")
-    result = typeNameOrLiteral(m, typ, "NimStringV2")
-  of tyCstring: result = typeNameOrLiteral(m, typ, "NCSTRING")
-  of tyBool: result = typeNameOrLiteral(m, typ, "NIM_BOOL")
-  of tyChar: result = typeNameOrLiteral(m, typ, "NIM_CHAR")
-  of tyNil: result = typeNameOrLiteral(m, typ, "void*")
-  of tyInt..tyUInt64:
-    result = typeNameOrLiteral(m, typ, NumericalTypeToStr[typ.kind])
-  of tyDistinct, tyRange, tyOrdinal: result = getSimpleTypeDesc(m, typ[0])
-  of tyStatic:
-    m.config.internalAssert(typ.n != nil, "tyStatic for getSimpleTypeDesc")
-    result = getSimpleTypeDesc(m, lastSon typ)
-  of tyGenericInst, tyAlias, tySink, tyEnum:
-    result = getSimpleTypeDesc(m, lastSon typ)
-  else: result = ""
-
-  if result != "" and typ.isImportedType():
-    let sig = hashType typ
-    if cacheGetType(m.typeCache, sig) == "":
-      m.typeCache[sig] = result
-
-proc pushType(m: BModule, typ: PType) =
-  for i in 0..high(m.typeStack):
-    # pointer equality is good enough here:
-    if m.typeStack[i] == typ: return
-  m.typeStack.add(typ)
-
-proc getTypePre(m: BModule, typ: PType; sig: SigHash): Rope =
-  if typ == nil: result = rope("void")
-  else:
-    result = getSimpleTypeDesc(m, typ)
-    if result == "": result = cacheGetType(m.typeCache, sig)
+  useType(m, m.addLate(typ))
 
-proc structOrUnion(t: PType): Rope =
-  let cachedUnion = rope("union")
-  let cachedStruct = rope("struct")
-  let t = t.skipTypes({tyAlias, tySink})
-  if tfUnion in t.flags: cachedUnion
-  else: cachedStruct
+proc structOrUnion(kind: TypeKind): Rope =
+  case kind
+  of tkRecord: "struct"
+  of tkUnion:  "union"
+  else:        unreachable(kind)
 
 proc addForwardStructFormat(m: BModule, structOrUnion: Rope, typename: Rope) =
   m.s[cfsForwardTypes].addf "typedef $1 $2 $2;$n", [structOrUnion, typename]
 
-proc getTypeForward(m: BModule, typ: PType; sig: SigHash): Rope =
-  result = cacheGetType(m.forwTypeCache, sig)
+proc getTypeForward(m: BModule, typ: TypeId, desc: TypeHeader): Rope =
+  result = m.forwTypeCache.getOrDefault(typ)
   if result != "": return
-  result = getTypePre(m, typ, sig)
+  result = m.typeCache.getOrDefault(typ)
   if result != "": return
-  let concrete = typ.skipTypes(abstractInst)
-  case concrete.kind
-  of tySequence, tyTuple, tyObject:
-    result = getTypeName(m, typ, sig)
-    m.forwTypeCache[sig] = result
-    if not isImportedType(concrete):
-      addForwardStructFormat(m, structOrUnion(typ), result)
-    else:
-      pushType(m, concrete)
-    doAssert m.forwTypeCache[sig] == result
-  else: internalError(m.config, "getTypeForward(" & $typ.kind & ')')
-
-proc getTypeDescWeak(m: BModule; t: PType; check: var IntSet): Rope =
-  ## like getTypeDescAux but creates only a *weak* dependency. In other words
-  ## we know we only need a pointer to it so we only generate a struct forward
-  ## declaration:
-  let etB = t.skipTypes(abstractInst)
-  case etB.kind
-  of tyObject, tyTuple:
-    result = getTypeForward(m, t, hashType(t))
-    pushType(m, t)
+
+  case desc.kind
+  of tkRecord, tkUnion:
+    result = computeTypeName(m.g.graph, m.types, typ)
+    addForwardStructFormat(m, structOrUnion(desc.kind), result)
+    m.forwTypeCache[typ] = result
+  of tkImported:
+    result = useType(m, typ, desc)
   else:
-    result = getTypeDescAux(m, t, check)
+    unreachable(desc.kind)
 
-proc getSeqPayloadType(m: BModule; t: PType): Rope =
-  var check = initIntSet()
-  result = getTypeDescWeak(m, t, check) & "_Content"
-  #result = getTypeForward(m, t, hashType(t)) & "_Content"
+proc payloadType(m: BModule, typ: TypeId): TypeId =
+  # the second field is a pointer to the payload type
+  m.types.headerFor(m.types[lookupField(m.types, typ, 1)].typ, Lowered).elem
 
-proc seqV2ContentType(m: BModule; t: PType; check: var IntSet) =
-  let sig = hashType(t)
-  let result = cacheGetType(m.typeCache, sig)
-  if result == "":
-    # the struct definition hasn't been emitted yet
-    discard getTypeDescAux(m, t, check)
-  else:
-    # emit the payload type:
-    appcg(m, m.s[cfsTypes], "struct $2_Content { NI cap; $1 data[SEQ_DECL_SIZE];};$N",
-          [getTypeDescAux(m, t.skipTypes(abstractInst)[0], check), result])
+proc requestFullDesc(m: BModule, typ: PType) =
+  ## Requests the full type description for the seq/string type and its
+  ## payload.
+  ## This procedure is a temporary workaround; it becomes obsolete once seq
+  ## and string operations are lowered during the MIR phase.
+  let id = m.addLate(typ)
+  discard useType(m, id) # pull in the seq/string type
+  discard useType(m, payloadType(m, id)) # pull in the payload type
+
+proc getSeqPayloadType(m: BModule; t: PType): Rope =
+  let typ = m.addLate(t)
+  result = useType(m, payloadType(m, typ))
 
 proc prepareParameters(m: BModule, t: PType): seq[TLoc] =
   ## Sets up and returns the locs of the parameter symbols for procedure
@@ -358,7 +322,7 @@ proc prepareParameters(m: BModule, t: PType): seq[TLoc] =
       continue
 
     let storage =
-      if mapType(m.config, param.typ.skipTypes({tyVar, tyLent})) == ctArray:
+      if mapType(m, param.typ.skipTypes({tyVar, tyLent})) == ctArray:
         # something that's represented as a C array. Since an indirection is
         # involved, we don't know where the location resides
         OnUnknown
@@ -368,68 +332,123 @@ proc prepareParameters(m: BModule, t: PType): seq[TLoc] =
     result[i] = initLoc(locParam, newLocalRef(LocalId(i), param.info, param.typ),
                         mangleParamName(m.config, param), storage)
 
-    if ccgIntroducedPtr(m.config, param, t[0]):
+    if ccgIntroducedPtr(m, param, t[0]):
       # the parameter is passed by address; mark it as indirect
       incl(result[i].flags, lfIndirect)
       result[i].storage = OnUnknown
 
-proc genProcParams(m: BModule, t: PType, rettype, params: var Rope,
-                   check: var IntSet, locs: openArray[TLoc],
-                   declareEnvironment=true; weakDep=false) =
+proc prepareParameters(m: BModule, desc: TypeHeader): seq[TLoc] =
+  assert desc.kind == tkProc
+  result.newSeq(desc.numParams + 1)
+
+  for i, it, flags in params(m.types, desc):
+    let i = i + 1
+    if it == VoidType:
+      # ignore compile-time only parameters
+      # XXX: the parameter needs to be eliminated during to-MIR translation
+      #      already
+      continue
+
+    # the loc sequence is only used for procedure type emission, so using nil
+    # as the node is fine
+    result[i] = initLoc(locParam, nil, "_" & $i, OnUnknown)
+
+    if pfByRef in flags and mapType(m.types, it) != ctArray:
+      # the parameter is passed by address; mark it as indirect
+      incl(result[i].flags, lfIndirect)
+      result[i].storage = OnUnknown
+
+proc genParamDecl(m: BModule, id: TypeId, params: var Rope, name: string,
+                  indirect, noAlias, weakDep: bool) =
+  ## Emits the declaration for a parameter.
+  case mapType(m.types, id)
+  of ctNimOpenArray:
+    # an openArray tuple is "unpacked" into the parameter list (it takes up
+    # two parameters)
+    params.add useType(m, m.types[m.types.lookupField(id, 0)].typ)
+    params.add " "
+    if noAlias:
+      params.add("NIM_NOALIAS ")
+    params.add(name)
+    params.addf(", NI $1Len_0", [name])
+  elif indirect:
+    params.add useType(m, id, onlyName=true)
+    params.add("* ")
+    if noAlias:
+      params.add("NIM_NOALIAS ")
+    params.add(name)
+  else:
+    params.add useType(m, id, onlyName=weakDep)
+    if noAlias:
+      params.add(" NIM_NOALIAS")
+    params.add(" ")
+    params.add(name)
+
+proc finishProcType(m: BModule, ret: TypeId, withEnv, withVarargs: bool,
+                    params: var string) =
+  ## Appends the return type as a parameter, and wraps `params` in parentheses.
+  if isInvalidReturnType(m.types, ret):
+    if params != "":
+      params.add ", "
+    if mapType(m.g.env.types, ret) == ctArray:
+      params.add useType(m, ret)
+    else:
+      params.add useType(m, ret, onlyName=true)
+      params.add "*"
+    params.add " Result"
+
+  if withEnv:
+    if params != "":
+      params.add ", "
+    params.add "void* ClE_0"
+
+  if withVarargs:
+    if params != "":
+      params.add ", "
+    params.add "..."
+
+  if params == "": params.add("void)")
+  else: params.add(")")
+  params = "(" & params
+
+proc genProcParams(m: BModule, desc: TypeHeader, ret, params: var Rope,
+                   locs: openArray[TLoc], weakDep: bool) =
+  assert desc.kind == tkProc
+  params = ""
+  let rt = desc.retType(m.types)
+  if isInvalidReturnType(m.types, rt):
+    ret = ~"void"
+  else:
+    ret = useType(m, rt, weakDep)
+
+  for i, typ, flags in params(m.types, desc):
+    let i = i + 1
+    if locs[i].k == locNone: continue
+    if params != "": params.add(~", ")
+    genParamDecl(m, typ, params, locs[i].r, lfIndirect in locs[i].flags,
+                 noAlias=false, weakDep)
+
+  finishProcType(m, rt, desc.callConv(m.types) == ccClosure,
+                 desc.hasVarargs(m.types), params)
+
+proc genProcParams(m: BModule, t: PType, rettype, params: var string,
+                   locs: openArray[TLoc]) =
+  ## Legacy procedure for contexts where type IDs aren't yet used.
   params = ""
-  if t[0] == nil or isInvalidReturnType(m.config, t[0]):
+  let rty = m.addLate(t[0])
+  if isInvalidReturnType(m.g.env.types, rty):
     rettype = ~"void"
   else:
-    rettype = getTypeDescAux(m, t[0], check)
-  for i in 1..<t.n.len:
-    m.config.internalAssert(t.n[i].kind == nkSym, t.n.info, "genProcParams")
-    var param = t.n[i].sym
+    rettype = useType(m, rty)
+
+  for i in 1..<t.len:
     if locs[i].k == locNone: continue
     if params != "": params.add(~", ")
+    let ty = m.addLate(t[i])
+    genParamDecl(m, ty, params, locs[i].r, lfIndirect in locs[i].flags,
+                 sfNoalias in t.n[i].sym.flags, weakDep=false)
 
-    var arr = param.typ.skipTypes({tyGenericInst})
-    if arr.kind in {tyVar, tyLent, tySink}:
-      arr = arr.lastSon
-    let isOpenArray = arr.kind in {tyOpenArray, tyVarargs}
-
-    if isOpenArray:
-      # declare the pointer field for openArray:
-      params.add(getTypeDescWeak(m, arr.base, check))
-      params.add("*")
-    elif lfIndirect in locs[i].flags:
-      params.add(getTypeDescWeak(m, param.typ, check))
-      params.add(~"*")
-    elif weakDep:
-      params.add(getTypeDescWeak(m, param.typ, check))
-    else:
-      params.add(getTypeDescAux(m, param.typ, check))
-    params.add(~" ")
-    if sfNoalias in param.flags:
-      params.add(~"NIM_NOALIAS ")
-    params.add(locs[i].r)
-    # declare the len field for open arrays:
-    if isOpenArray:
-      # need to pass hidden parameter:
-      params.addf(", NI $1Len_$2", [locs[i].r, 0.rope])
-
-  if t[0] != nil and isInvalidReturnType(m.config, t[0]):
-    var arr = t[0]
-    if params != "": params.add(", ")
-    if mapReturnType(m.config, t[0]) != ctArray:
-      params.add(getTypeDescWeak(m, arr, check))
-      params.add("*")
-    else:
-      params.add(getTypeDescAux(m, arr, check))
-    params.addf(" Result", [])
-  if t.callConv == ccClosure and declareEnvironment:
-    if params != "": params.add(", ")
-    params.add("void* ClE_0")
-  if tfVarargs in t.flags:
-    if params != "": params.add(", ")
-    params.add("...")
-  if params == "": params.add("void)")
-  else: params.add(")")
-  params = "(" & params
+  finishProcType(m, rty, t.callConv == ccClosure, tfVarargs in t.flags, params)
 
 proc mangleRecFieldName(m: BModule; field: PSym): Rope =
   if {sfImportc, sfExportc} * field.flags != {}:
@@ -438,307 +457,253 @@ proc mangleRecFieldName(m: BModule; field: PSym): Rope =
     result = rope(mangleField(m, field.name))
   m.config.internalAssert(result != "", field.info, "mangleRecFieldName")
 
-proc genRecordFieldsAux(m: BModule, n: PNode,
-                        rectype: PType,
-                        check: var IntSet, unionPrefix = ""): Rope =
-  result = ""
-  case n.kind
-  of nkRecList:
-    for i in 0..<n.len:
-      result.add(genRecordFieldsAux(m, n[i], rectype, check, unionPrefix))
-  of nkRecCase:
-    m.config.internalAssert(n[0].kind == nkSym, n.info, "genRecordFieldsAux")
-    result.add(genRecordFieldsAux(m, n[0], rectype, check, unionPrefix))
-    # prefix mangled name with "_U" to avoid clashes with other field names,
-    # since identifiers are not allowed to start with '_'
-    var unionBody = ""
-    for i in 1..<n.len:
-      case n[i].kind
-      of nkOfBranch, nkElse:
-        let k = lastSon(n[i])
-        if k.kind != nkSym:
-          let structName = "_" & mangleRecFieldName(m, n[0].sym) & "_" & $i
-          let a = genRecordFieldsAux(m, k, rectype, check, unionPrefix & $structName & ".")
-          if a != "":
-            if tfPacked notin rectype.flags:
-              unionBody.add("struct {")
-            else:
-              if hasAttribute in CC[m.config.cCompiler].props:
-                unionBody.add("struct __attribute__((__packed__)){")
-              else:
-                unionBody.addf("#pragma pack(push, 1)$nstruct{", [])
-            unionBody.add(a)
-            unionBody.addf("} $1;$n", [structName])
-            if tfPacked in rectype.flags and hasAttribute notin CC[m.config.cCompiler].props:
-              unionBody.addf("#pragma pack(pop)$n", [])
-        else:
-          unionBody.add(genRecordFieldsAux(m, k, rectype, check, unionPrefix))
-      else: internalError(m.config, "genRecordFieldsAux(record case branch)")
-    if unionBody != "":
-      result.addf("union{$n$1};$n", [unionBody])
-  of nkSym:
-    let field = n.sym
-    if field.typ.kind == tyVoid: return
-    #assert(field.ast == nil)
-    let sname = mangleRecFieldName(m, field)
-    if field.locId == 0:
-      # XXX: the C struct definition for the type is re-generated in every C
-      #      file the type is used in, so the field might have an associated
-      #      loc. Eventually, each C type will only be generated once, and then
-      #      the guard can be removed
-      m.fields.put(field): unionPrefix & sname
-
-    if field.alignment > 0:
-      result.addf "NIM_ALIGN($1) ", [rope(field.alignment)]
-    let noAlias = if sfNoalias in field.flags: " NIM_NOALIAS" else: ""
-
-    let fieldType = field.typ.skipTypes(abstractInst)
-    if fieldType.kind == tyUncheckedArray:
-      result.addf("$1 $2[SEQ_DECL_SIZE];$n",
-          [getTypeDescAux(m, fieldType.elemType, check), sname])
-    elif field.bitsize != 0:
-      result.addf("$1$4 $2:$3;$n", [getTypeDescAux(m, field.typ, check), sname, rope($field.bitsize), noAlias])
+proc mangleDynLibProc(sym: PSym): Rope
+
+proc genDecl(m: BModule, result: var Rope, typ: TypeId, name: Rope,
+             align, bitsize: int, noAlias: bool) =
+  let desc = m.types.headerFor(typ, Lowered)
+  if align != 0 and align != desc.align:
+    result.addf("NIM_ALIGN($1) ", [$align])
+
+  case desc.kind
+  of tkVoid:
+    # XXX: void fields need to be eliminated during PType->MIR translation
+    #      instead
+    discard "drop"
+  of tkUncheckedArray:
+    result.add useType(m, desc.elem)
+    result.addf(" $1[SEQ_DECL_SIZE]", [name])
+  of tkArray:
+    result.add useType(m, desc.elem)
+    result.addf(" $1[$2]", [name, $desc.arrayLen(m.types)])
+  else:
+    result.add useType(m, typ)
+    if noAlias:
+      result.add " NIM_NOALIAS"
+    result.add " " & name
+    if bitsize != 0:
+      result.add ":" & $bitsize
+
+proc genFieldDesc(m: BModule, id: FieldId, field: RecField, pos: int,
+                  result: var Rope, accessor: string) =
+  ## Appends the C declaration of `field` (plus ";\n") to `result`. For named
+  ## fields, the accessor-qualified C name is stored in ``m.g.fields[id]``.
+  var cname: string
+  if field.isNamed:
+    cname =
+      if field.isNoMangle: m.types.name(field)
+      else:                mangleField(m, m.types.name(field))
+    # for efficiency, cache the name combined with the accessor
+    m.g.fields[id] = accessor & cname
+  else:
+    # anonymous fields use a name derived from the position. It can easily
+    # be reconstructed from anywhere, so it's not cached
+    cname = "Field" & $pos
+  genDecl(m, result, field.typ, cname, field.align, field.bitsize,
+          field.isNoAlias)
+  result.add ";\n"
+
+proc getTaggedUnionDesc(m: BModule, desc: TypeHeader, result: var Rope,
+                        accessor: string)
+
+proc genRecordDesc(m: BModule, desc: TypeHeader, result: var Rope,
+                   accessor: string) =
+  if desc.isPacked(m.types) and hasAttribute in CC[m.config.cCompiler].props:
+    # if only push/pop are supported, the outer struct is already wrapped in a
+    # pair of those
+    result.add "struct __attribute__((__packed__)) {\n"
+  else:
+    result.add "struct {\n"
+
+  var pos = 0
+  for (id, it) in m.types.fields(desc):
+    if m.types.isEmbedded(it.typ):
+      # embedded tagged union
+      getTaggedUnionDesc(m, m.types.headerFor(it.typ, Lowered), result,
+                         accessor)
     else:
-      # TODO: C++ remove
-      # don't use fieldType here because we need the
-      # tyGenericInst for C++ template support
-      result.addf("$1$3 $2;$n", [getTypeDescAux(m, field.typ, check), sname, noAlias])
-  else: internalError(m.config, n.info, "genRecordFieldsAux()")
-
-proc getRecordFields(m: BModule, typ: PType, check: var IntSet): Rope =
-  result = genRecordFieldsAux(m, typ.n, typ, check)
-
-proc ensureObjectFields*(m: BModule; field: PSym, typ: PType) =
-  ## Two different object types can produce the same signature hash in
-  ## certain cases (the hidden parameter type of a generic's inner procedure,
-  ## for example), in which case ``getTypeDescAux`` never calls
-  ## ``genRecordDesc``. This procedures makes sure that the field has a valid
-  ## loc.
-  if field.locId == 0:
-    var check = initIntSet()
-    discard getRecordFields(m, typ, check)
+      genFieldDesc(m, id, it, pos, result, accessor)
+    inc pos
+
+  result.add "}"
+
+proc getTaggedUnionDesc(m: BModule, desc: TypeHeader, result: var Rope,
+                        accessor: string) =
+  # the discriminator is directly embedded into the surrounding struct
+  let
+    id    = desc.discr(m.types)
+    discr = m.types[id]
+  genFieldDesc(m, id, discr, 0, result, accessor)
+
+  let
+    name = m.types.name(discr)
+    # all ``struct`` union fields use the mangled discriminator field name
+    # as the prefix
+    unionPrefix =
+      if discr.isNoMangle:
+        "_" & name & "_"
+      else:
+        "_" & mangleField(m, name) & "_"
+
+  result.add "union {\n"
+  var i = 1
+  for (id, it) in m.types.fields(desc, 1):
+    if m.types.isEmbedded(it.typ):
+      # embedded record description. The accessor combined with the union
+      # field name is passed along
+      genRecordDesc(m, m.types.headerFor(it.typ, Lowered), result,
+                    accessor & unionPrefix & $i & ".")
+      result.addf(" $1$2;$n", [unionPrefix, $i])
+    else:
+      # ``genFieldDesc`` already terminates the declaration with ";\n"
+      genFieldDesc(m, id, it, i, result, accessor)
 
-proc mangleDynLibProc(sym: PSym): Rope
+    inc i
 
-proc getRecordDesc(m: BModule, typ: PType, name: Rope,
-                   check: var IntSet): Rope =
-  # declare the record:
-  var hasField = false
+  result.add "};\n"
 
-  if tfPacked in typ.flags:
+proc genUnionDesc(m: BModule, desc: TypeHeader, name: Rope, result: var Rope) =
+  result.add "union "
+  result.add name
+  result.add " {\n"
+  for (id, it) in m.types.fields(desc):
+    genFieldDesc(m, id, it, 0, result, "")
+  result.add "}"
+
+proc genRecordDesc(m: BModule, desc: TypeHeader, name: Rope, result: var Rope) =
+  let isPacked = desc.isPacked(m.types)
+
+  if isPacked:
     if hasAttribute in CC[m.config.cCompiler].props:
-      result = structOrUnion(typ) & " __attribute__((__packed__))"
+      result.add "struct __attribute__((__packed__)) "
     else:
-      result = "#pragma pack(push, 1)\L" & structOrUnion(typ)
+      result.add "#pragma pack(push, 1)\nstruct "
   else:
-    result = structOrUnion(typ)
-
-  result.add " "
+    result.add "struct "
   result.add name
 
-  if typ.kind == tyObject:
-    if typ[0] == nil:
-      if lacksMTypeField(typ):
-        appcg(m, result, " {$n", [])
-      else:
-        appcg(m, result, " {$n#TNimTypeV2* m_type;$n", [])
-        hasField = true
+  result.add " {\n"
+  # the base type (if any) is added as the first field:
+  if desc.base(m.types) != VoidType:
+    result.add useType(m, desc.base(m.types))
+    result.add " Sup;\n"
+
+  var pos = 0
+  for (id, it) in m.g.env.types.fields(desc):
+    if m.types.isEmbedded(it.typ):
+      # embedded tagged union
+      getTaggedUnionDesc(m, m.types.headerFor(it.typ, Lowered), result, "")
     else:
-      appcg(m, result, " {$n  $1 Sup;$n",
-                      [getTypeDescAux(m, typ[0].skipTypes(skipPtrs), check)])
-      hasField = true
-  else:
-    result.addf(" {$n", [name])
+      genFieldDesc(m, id, it, pos, result, "")
+    inc pos
 
-  let desc = getRecordFields(m, typ, check)
-  if desc == "" and not hasField:
-    result.addf("char dummy;$n", [])
-  else:
-    result.add(desc)
-  result.add("};\L")
-  if tfPacked in typ.flags and hasAttribute notin CC[m.config.cCompiler].props:
-    result.add "#pragma pack(pop)\L"
-
-proc getTupleDesc(m: BModule, typ: PType, name: Rope,
-                  check: var IntSet): Rope =
-  result = "$1 $2 {$n" % [structOrUnion(typ), name]
-  var desc = ""
-  for i in 0..<typ.len:
-    desc.addf("$1 Field$2;$n",
-         [getTypeDescAux(m, typ[i], check), rope(i)])
-  if desc == "": result.add("char dummy;\L")
-  else: result.add(desc)
-  result.add("};\L")
-
-proc getOpenArrayDesc(m: BModule, t: PType, check: var IntSet): Rope =
-  let sig = hashType(t)
-  if true:
-    result = cacheGetType(m.typeCache, sig)
-    if result == "":
-      result = getTypeName(m, t, sig)
-      m.typeCache[sig] = result
-      let elemType = getTypeDescWeak(m, t[0], check)
-      m.s[cfsTypes].addf("typedef struct {$n$2* Field0;$nNI Field1;$n} $1;$n",
-                         [result, elemType])
-
-proc getTypeDescAux(m: BModule, origTyp: PType, check: var IntSet): Rope =
-  # returns only the type's name
-
-  var t = origTyp.skipTypes(irrelevantForBackend)
-  m.config.internalAssert(not containsOrIncl(check, t.id),
-                          "cannot generate C type for: " & typeToString(origTyp))
-  # XXX: this BUG is hard to fix -> we need to introduce helper structs,
-  # but determining when this needs to be done is hard. We should split
-  # C type generation into an analysis and a code generation phase somehow.
-  if t.sym != nil: useHeader(m, t.sym)
-  if t != origTyp and origTyp.sym != nil: useHeader(m, origTyp.sym)
-  let sig = hashType(origTyp)
-
-  defer: # defer is the simplest in this case
-    if isImportedType(t) and not m.typeABICache.containsOrIncl(sig):
-      addAbiCheck(m, t, result)
-
-  result = getTypePre(m, t, sig)
-  if result != "":
-    excl(check, t.id)
+  result.add "}"
+  # pop the packed pragma again. A directive must start on its own line, so
+  # the declaration is terminated first (the caller's ';' is then redundant):
+  if isPacked and hasAttribute notin CC[m.config.cCompiler].props:
+    result.add ";\n#pragma pack(pop)\n"
+
+proc isImportedType(t: PType): bool =
+  t.sym != nil and sfImportc in t.sym.flags
+
+proc emitTypeDef(m: BModule, id: TypeId, desc: TypeHeader) =
+  ## Emits the full definition for the type.
+  if id in m.typeCache:
     return
-  case t.kind
-  of tyRef, tyPtr, tyVar, tyLent:
-    let star = "*"
-    var et = origTyp.skipTypes(abstractInst).lastSon
-    var etB = et.skipTypes(abstractInst)
-    if mapType(m.config, t) == ctPtrToArray:
-      if etB.kind == tySet:
-        et = getSysType(m.g.graph, unknownLineInfo, tyUInt8)
-      else:
-        et = elemType(etB)
-      etB = et.skipTypes(abstractInst)
-    case etB.kind
-    of tyObject, tyTuple, tySequence:
-      # no restriction! We have a forward declaration for structs
-      let name = getTypeForward(m, et, hashType et)
-      result = name & star
-    of tyOpenArray:
-      result = getTypeDescAux(m, etB, check)
+
+  let name = computeTypeName(m.g.graph, m.types, id)
+  assert name != ""
+  # remember that the type was emitted. Doing it before producing the type
+  # body ensures that cyclic types don't result in infinite recursion:
+  m.typeCache[id] = name
+
+  case desc.kind
+  of tkArray:
+    let elem = useType(m, desc.elem)
+    m.s[cfsTypes].addf("typedef $1 $2[$3];$n",
+                       [elem, name, $desc.arrayLen(m.types)])
+  of tkUncheckedArray:
+    let elem = useType(m, desc.elem)
+    m.s[cfsTypes].addf("typedef $1 $2[1];$n",
+                       [elem, name])
+  of tkProc:
+    let locs = prepareParameters(m, desc)
+    var rettype, params: string
+    genProcParams(m, desc, rettype, params, locs, weakDep=true)
+    m.s[cfsTypes].addf("typedef $1_PTR($2, $3)$4;$n",
+                       [rope(CallingConvToStr[desc.callConv(m.types)]),
+                        rettype, name, params])
+  of tkRecord, tkUnion:
+    if id notin m.forwTypeCache:
+      m.forwTypeCache[id] = name
+      addForwardStructFormat(m, structOrUnion(desc.kind), name)
+
+    var recdesc: Rope
+    if desc.kind == tkRecord:
+      genRecordDesc(m, desc, name, recdesc)
     else:
-      # else we have a strong dependency  :-(
-      result = getTypeDescAux(m, et, check) & star
-
-    m.typeCache[sig] = result
-  of tyOpenArray, tyVarargs:
-    result = getOpenArrayDesc(m, t, check)
-  of tyEnum:
-    result = cacheGetType(m.typeCache, sig)
-    if result == "":
-      result = getTypeName(m, origTyp, sig)
-      if not (sfImportc in t.sym.flags and t.sym.magic == mNone):
-        m.typeCache[sig] = result
-        m.s[cfsTypes].addf("typedef $1 $2;$n",
-          [getTypeDescAux(m, t.lastSon, check), result])
-        when false:
-          let owner = hashOwner(t.sym)
-          if not gDebugInfo.hasEnum(t.sym.name.s, t.sym.info.line, owner):
-            var vals: seq[(string, int)] = @[]
-            for i in 0..<t.n.len:
-              assert(t.n[i].kind == nkSym)
-              let field = t.n[i].sym
-              vals.add((field.name.s, field.position.int))
-            gDebugInfo.registerEnum(EnumDesc(size: size, owner: owner, id: t.sym.id,
-              name: t.sym.name.s, values: vals))
-  of tyProc:
-    result = getTypeName(m, origTyp, sig)
-    m.typeCache[sig] = result
-    var rettype, desc: Rope
-    let params = prepareParameters(m, t)
-    genProcParams(m, t, rettype, desc, check, params, true, true)
-    if not isImportedType(t):
-      if t.callConv != ccClosure: # procedure vars may need a closure!
-        m.s[cfsTypes].addf("typedef $1_PTR($2, $3) $4;$n",
-             [rope(CallingConvToStr[t.callConv]), rettype, result, desc])
-      else:
-        m.s[cfsTypes].addf("typedef struct {$n" &
-            "N_NIMCALL_PTR($2, ClP_0) $3;$n" &
-            "void* ClE_0;$n} $1;$n",
-             [result, rettype, desc])
-  of tySequence:
-    # a sequence type is two structs underneath: one for the seq itself, and
-    # one for its payload
-    m.config.internalAssert(skipTypes(t[0], typedescInst).kind != tyEmpty,
-                            "cannot map the empty seq type to a C type")
-
-    result = cacheGetType(m.forwTypeCache, sig)
-    if result == "":
-      result = getTypeName(m, origTyp, sig)
-      if not isImportedType(t):
-        m.forwTypeCache[sig] = result
-        addForwardStructFormat(m, structOrUnion(t), result)
-
-    # it's possible that the element type cannot be emitted yet because it
-    # depends on the sequence type (a cyclic type). For this reason, the
-    # payload type is only forward-declared here, and the actual definition
-    # is emitted later
-    addForwardStructFormat(m, structOrUnion(t), result & "_Content")
-    # note: force push the type (by not using ``pushType``)
-    m.typeStack.add origTyp
-
-    m.typeCache[sig] = result
-    appcg(m, m.s[cfsTypes],
-      "struct $1 {$N" &
-      "  NI len; $1_Content* p;$N" &
-      "};$N", [result])
-  of tyUncheckedArray:
-    result = getTypeName(m, origTyp, sig)
-    m.typeCache[sig] = result
-    if not isImportedType(t):
-      let foo = getTypeDescAux(m, t[0], check)
-      m.s[cfsTypes].addf("typedef $1 $2[1];$n", [foo, result])
-  of tyArray:
-    var n: BiggestInt = toInt64(lengthOrd(m.config, t))
-    if n <= 0: n = 1   # make an array of at least one element
-    result = getTypeName(m, origTyp, sig)
-    m.typeCache[sig] = result
-    if not isImportedType(t):
-      let foo = getTypeDescAux(m, t[1], check)
-      m.s[cfsTypes].addf("typedef $1 $2[$3];$n",
-           [foo, result, rope(n)])
-  of tyObject, tyTuple:
-    result = cacheGetType(m.forwTypeCache, sig)
-    if result == "":
-      result = getTypeName(m, origTyp, sig)
-      m.forwTypeCache[sig] = result
-      if not isImportedType(t):
-        addForwardStructFormat(m, structOrUnion(t), result)
-      assert m.forwTypeCache[sig] == result
-    m.typeCache[sig] = result # always call for sideeffects:
-    if not incompleteType(t):
-      let recdesc = if t.kind != tyTuple: getRecordDesc(m, t, result, check)
-                    else: getTupleDesc(m, t, result, check)
-      if not isImportedType(t):
-        m.s[cfsTypes].add(recdesc)
-      elif tfIncompleteStruct notin t.flags:
-        discard # addAbiCheck(m, t, result) # already handled elsewhere
-  of tySet:
-    # Don't use the imported name as it may be scoped: 'Foo::SomeKind'
-    result = $t.kind & '_' & t.lastSon.typeName & $t.lastSon.hashType
-    m.typeCache[sig] = result
-    if not isImportedType(t):
-      let s = int(getSize(m.config, t))
-      case s
-      of 1, 2, 4, 8: m.s[cfsTypes].addf("typedef NU$2 $1;$n", [result, rope(s*8)])
-      else: m.s[cfsTypes].addf("typedef NU8 $1[$2];$n",
-             [result, rope(getSize(m.config, t))])
-  of tyGenericInst, tyDistinct, tyOrdinal, tyTypeDesc, tyAlias, tySink,
-     tyUserTypeClass, tyUserTypeClassInst, tyInferred:
-    result = getTypeDescAux(m, lastSon(t), check)
+      genUnionDesc(m, desc, name, recdesc)
+    m.s[cfsTypes].addf("$1;$n", [recdesc])
+  of tkImported:
+    let t = m.types[id]
+    useHeader(m, t.sym)
+    addAbiCheck(m, t, name)
+
+    # fill in the field names for records:
+    let h = m.types.headerFor(desc.elem, Lowered)
+    case h.kind
+    of tkRecord:
+      var tmp: Rope; genRecordDesc(m, h, "", tmp)
+    of tkUnion:
+      var tmp: Rope; genUnionDesc(m, h, "", tmp)
+    else:
+      discard "nothing to do"
   else:
-    internalError(m.config, "getTypeDescAux(" & $t.kind & ')')
-    result = ""
-  # fixes bug #145:
-  excl(check, t.id)
+    unreachable("doesn't need a full definition")
+
+proc useType(m: BModule, typ: TypeId, desc: TypeHeader; onlyName = false): Rope =
+  case desc.kind
+  of tkVoid:
+    result = "void"
+  of tkPointer:
+    result = "void*"
+  of tkCstring:
+    result = "NCSTRING"
+  of tkBool:
+    result = "NIM_BOOL"
+  of tkChar:
+    result = "NIM_CHAR"
+  of tkInt:
+    result = "NI" & $(desc.size(m.types) * 8)
+  of tkUInt:
+    result = "NU" & $(desc.size(m.types) * 8)
+  of tkFloat:
+    result = "NF" & $(desc.size(m.types) * 8)
+  of tkRef, tkPtr, tkVar, tkLent:
+    if mapType(m.types, desc) == ctPtrToArray:
+      # use ``T*``, where `T` is the array's element type
+      result = useType(m, m.types.headerFor(desc.elem, Lowered).elem,
+                       onlyName=true)
+    else:
+      # only the pointee's name is required, not its full definition
+      result = useType(m, desc.elem, onlyName=true)
+    result.add "*"
+  of tkImported, tkProc, tkArray, tkUncheckedArray:
+    # definition is the same as only a forward declaration
+    emitTypeDef(m, typ, desc)
+    result = m.typeCache[typ]
+  of tkRecord, tkUnion:
+    if onlyName:
+      # a forward declaration suffices
+      result = getTypeForward(m, typ, desc)
+    else:
+      emitTypeDef(m, typ, desc)
+      result = m.typeCache[typ]
+  else:
+    unreachable(desc.kind)
 
 proc getTypeDesc(m: BModule, typ: PType): Rope =
-  var check = initIntSet()
-  result = getTypeDescAux(m, typ, check)
+  result = useType(m, m.addLate(typ))
 
 type
   TClosureTypeKind = enum ## In C closures are mapped to 3 different things.
@@ -747,33 +712,23 @@ type
     clFull            ## struct {fn(args, void* env), env}
 
 proc getClosureType(m: BModule, t: PType, kind: TClosureTypeKind): Rope =
-  assert t.kind == tyProc
-  var check = initIntSet()
-  result = getTempName(m)
-  let params = prepareParameters(m, t)
-  var rettype, desc: Rope
-  genProcParams(m, t, rettype, desc, check, params, declareEnvironment=kind != clHalf)
-  if not isImportedType(t):
-    if t.callConv != ccClosure or kind != clFull:
-      m.s[cfsTypes].addf("typedef $1_PTR($2, $3) $4;$n",
-           [rope(CallingConvToStr[t.callConv]), rettype, result, desc])
-    else:
-      m.s[cfsTypes].addf("typedef struct {$n" &
-          "N_NIMCALL_PTR($2, ClP_0) $3;$n" &
-          "void* ClE_0;$n} $1;$n",
-           [result, rettype, desc])
-
-proc finishTypeDescriptions(m: BModule) =
-  var i = 0
-  var check = initIntSet()
-  while i < m.typeStack.len:
-    let t = m.typeStack[i]
-    if t.skipTypes(abstractInst).kind == tySequence:
-      seqV2ContentType(m, t, check)
-    else:
-      discard getTypeDescAux(m, t, check)
-    inc(i)
-  m.typeStack.setLen 0
+  case kind
+  of clHalf:
+    # create a proc type with all of `t`'s parameters, except for the
+    # environment pointer
+    let canon {.cursor.} =
+      m.types.headerFor(m.types.canonical(m.types[t]), Canonical)
+
+    let pt = m.types.buildProc(tkProc, ccNimCall, canon.retType(m.types), bu):
+      for (_, typ, flags) in params(m.types, canon):
+        bu.addParam(flags, typ)
+
+    result = useType(m, pt)
+  of clHalfWithEnv:
+    let c = m.types.canonical(m.types[t])
+    result = useType(m, m.types[m.types.lookupField(c, 0)].typ)
+  of clFull:
+    result = getTypeDesc(m, t)
 
 proc genProcHeader(m: BModule, prc: PSym, locs: openArray[TLoc]): Rope =
   ## Generates the C function header for `prc`, with `locs` being the locs
@@ -790,8 +745,7 @@ proc genProcHeader(m: BModule, prc: PSym, locs: openArray[TLoc]): Rope =
     result.add "static "
   elif sfImportc notin prc.flags:
     result.add "N_LIB_PRIVATE "
-  var check = initIntSet()
-  genProcParams(m, prc.typ, rettype, params, check, locs)
+  genProcParams(m, prc.typ, rettype, params, locs)
 
   # careful here! don't access ``prc.ast`` as that could reload large parts of
   # the object graph!
@@ -872,6 +826,10 @@ proc rope(arg: Int128): Rope = rope($arg)
 proc genTNimNodeArray(m: BModule, name: Rope, size: Rope) =
   m.s[cfsTypeInit1].addf("static TNimNode* $1[$2];$n", [name, size])
 
+proc lookupField(m: BModule, typ: PType, field: PSym): string =
+  result = m.fields[lookupField(m.types, m.types[typ],
+                                field.position.int32)]
+
 proc genObjectFields(m: BModule, typ, origType: PType, n: PNode, expr: Rope;
                      info: TLineInfo) =
   case n.kind
@@ -895,12 +853,11 @@ proc genObjectFields(m: BModule, typ, origType: PType, n: PNode, expr: Rope;
     var tmp = discriminatorTableName(m, typ, field)
     var L = lengthOrd(m.config, field.typ)
     assert L > 0
-    ensureObjectFields(m, field, typ)
     m.s[cfsTypeInit3].addf("$1.kind = 3;$n" &
         "$1.offset = offsetof($2, $3);$n" & "$1.typ = $4;$n" &
         "$1.name = $5;$n" & "$1.sons = &$6[0];$n" &
         "$1.len = $7;$n", [expr, getTypeDesc(m, origType),
-                           m.fields[field],
+                           lookupField(m, origType, field),
                            genTypeInfoV1(m, field.typ, info),
                            makeCString(field.name.s),
                            tmp, rope(L)])
@@ -931,11 +888,11 @@ proc genObjectFields(m: BModule, typ, origType: PType, n: PNode, expr: Rope;
     # Do not produce code for void types
     if isEmptyType(field.typ): return
     if field.bitsize == 0:
-      ensureObjectFields(m, field, typ)
       m.s[cfsTypeInit3].addf("$1.kind = 1;$n" &
           "$1.offset = offsetof($2, $3);$n" & "$1.typ = $4;$n" &
           "$1.name = $5;$n", [expr, getTypeDesc(m, origType),
-          m.fields[field], genTypeInfoV1(m, field.typ, info),
+          lookupField(m, origType, field),
+          genTypeInfoV1(m, field.typ, info),
           makeCString(field.name.s)])
   else: internalError(m.config, n.info, "genObjectFields")
 
diff --git a/compiler/backend/cgen.nim b/compiler/backend/cgen.nim
index 1b3f39a32fd..9abc5db0b9e 100644
--- a/compiler/backend/cgen.nim
+++ b/compiler/backend/cgen.nim
@@ -38,7 +38,8 @@ import
   ],
   compiler/mir/[
     mirenv,
-    mirtrees
+    mirtrees,
+    mirtypes
   ],
   compiler/front/[
     options,
@@ -64,7 +65,8 @@ import
     ccgutils,
     ccgflow,
     cgendata,
-    cgir
+    cgir,
+    mangling
   ],
   compiler/plugins/[
   ]
@@ -101,6 +103,9 @@ const
     ## the procedure contains top-level code, which currently affects how
     ## emit, asm, and error handling works
 
+template types(m: BModule): TypeEnv =
+  m.g.env.types
+
 template getString(p: BProc, n: CgNode): string =
   p.env[n.strVal]
 
@@ -108,6 +113,13 @@ proc findPendingModule(m: BModule, s: PSym): BModule =
   let ms = s.itemId.module  #getModule(s)
   result = m.g.modules[ms]
 
+proc fieldName(p: BProc, typ: PType, field: PSym): string =
+  ## Returns the C name for the given `field`.
+  # the type the field is part of must have been emitted into the module
+  # already
+  p.module.fields[lookupField(p.module.types, p.module.types[typ],
+                              field.position.int32)]
+
 proc initLoc(result: var TLoc, k: TLocKind, lode: CgNode, s: TStorageLoc) =
   result.k = k
   result.storage = s
@@ -338,6 +350,16 @@ proc registerLateProc(m: BModule, s: PSym): ProcedureId =
   # inline procedure handling needs to know about the dependency...
   m.extra.add(result)
 
+proc addLate(m: BModule, t: PType): TypeId =
+  ## Temporary workaround for not all types being registered with the type
+  ## environment. Ultimately, a code generator should not modify the type
+  ## environment.
+  if t.isNil:
+    result = VoidType
+  else:
+    result = m.types.add(t)
+    result = m.types.canonical(result)
+
 proc accessThreadLocalVar(p: BProc)
 proc emulatedThreadVars*(conf: ConfigRef): bool {.inline.}
 proc useProc(m: BModule, id: ProcedureId)
@@ -363,14 +385,14 @@ include ccgtypes
 
 # ------------------------------ Manager of temporaries ------------------
 
-proc addrLoc(conf: ConfigRef; a: TLoc): Rope =
+proc addrLoc(m: BModule; a: TLoc): Rope =
   result = a.r
-  if lfIndirect notin a.flags and mapType(conf, a.t) != ctArray:
+  if lfIndirect notin a.flags and mapType(m, a.t) != ctArray:
     result = "(&" & result & ")"
 
 proc byRefLoc(p: BProc; a: TLoc): Rope =
   result = a.r
-  if lfIndirect notin a.flags and mapType(p.config, a.t) != ctArray:
+  if lfIndirect notin a.flags and mapType(p.module, a.t) != ctArray:
     result = "(&" & result & ")"
 
 proc rdCharLoc(a: TLoc): Rope =
@@ -436,7 +458,7 @@ proc genObjectInit(p: BProc, section: TCProcSection, t: PType, a: TLoc,
         genAssignment(p, a, tmp)
 
 proc constructLoc(p: BProc, loc: var TLoc; doInitObj = true) =
-  case mapType(p.config, loc.t)
+  case mapType(p.module, loc.t)
   of ctChar, ctBool, ctInt, ctInt8, ctInt16, ctInt32, ctInt64,
      ctFloat, ctFloat32, ctFloat64,
      ctUInt, ctUInt8, ctUInt16, ctUInt32, ctUInt64:
@@ -449,7 +471,7 @@ proc constructLoc(p: BProc, loc: var TLoc; doInitObj = true) =
     linefmt(p, cpsStmts, "$1.len = 0; $1.p = NIM_NIL;$n", [rdLoc(loc)])
   of ctArray, ctStruct, ctNimOpenArray:
     linefmt(p, cpsStmts, "#nimZeroMem((void*)$1, sizeof($2));$n",
-            [addrLoc(p.config, loc), getTypeDesc(p.module, loc.t)])
+            [addrLoc(p.module, loc), getTypeDesc(p.module, loc.t)])
 
     if doInitObj:
       genObjectInit(p, cpsStmts, loc.t, loc, constructObj)
@@ -712,11 +734,11 @@ proc startProc*(m: BModule, id: ProcedureId; procBody: sink Body): BProc =
     let
       res = resultId
       resNode = newLocalRef(res, prc.info, prc.typ[0])
-    if not isInvalidReturnType(m.config, prc.typ[0]):
+    if not isInvalidReturnType(m, prc.typ[0]):
       # declare the result symbol:
       assignLocalVar(p, resNode)
     else:
-      p.locals[res] = initResultParamLoc(p.config, resNode)
+      p.locals[res] = initResultParamLoc(p.module, resNode)
       scopeMangledParam(p, p.body[res].name)
       if skipTypes(resNode.typ, abstractInst).kind == tyArray:
         #incl(res.locFlags, lfIndirect)
@@ -764,7 +786,7 @@ proc finishProc*(p: BProc, id: ProcedureId): string =
     header = genProcHeader(p.module, prc, p.params)
     returnStmt = ""
 
-  if sfPure notin prc.flags and not isInvalidReturnType(p.config, prc.typ[0]):
+  if sfPure notin prc.flags and not isInvalidReturnType(p.module, prc.typ[0]):
     returnStmt = ropecg(p.module, "\treturn $1;$n",
                         [rdLoc(p.locals[resultId])])
 
@@ -1105,12 +1127,11 @@ proc rawNewModule*(g: BModuleList; module: PSym, filename: AbsoluteFile): BModul
   result.declaredProtos = initIntSet()
   result.cfilename = filename
   result.filename = filename
-  result.typeCache = initTable[SigHash, Rope]()
-  result.forwTypeCache = initTable[SigHash, Rope]()
+  result.typeCache = initTable[TypeId, Rope]()
+  result.forwTypeCache = initTable[TypeId, Rope]()
   result.module = module
   result.typeInfoMarker = initTable[SigHash, Rope]()
   result.sigConflicts = initCountTable[SigHash]()
-  result.typeStack = @[]
   result.typeNodesName = getTempName(result)
   # no line tracing for the init sections of the system module so that we
   # don't generate a TFrame which can confuse the stack bottom initialization:
@@ -1180,7 +1201,7 @@ proc shouldRecompile(m: BModule; code: Rope, cfile: Cfile): bool =
     result = true
 
 proc finalizeModule*(m: BModule) =
-  finishTypeDescriptions(m)
+  discard
 
 proc finalizeMainModule*(m: BModule) =
   generateThreadVarsSize(m) # TODO: not the job of the code generator
diff --git a/compiler/backend/cgendata.nim b/compiler/backend/cgendata.nim
index 7cb19ded484..66ff0f67898 100644
--- a/compiler/backend/cgendata.nim
+++ b/compiler/backend/cgendata.nim
@@ -25,7 +25,8 @@ import
   ],
   compiler/mir/[
     mirenv,
-    mirtrees
+    mirtrees,
+    mirtypes
   ],
   compiler/modules/[
     modulegraphs
@@ -35,7 +36,6 @@ import
   ],
   compiler/utils/[
     containers,
-    idioms,
     ropes,
     pathutils
   ]
@@ -43,17 +43,6 @@ import
 import std/options as std_options
 
 type
-  SymbolMap*[T] = object
-    ## Associates extra location-related data with symbols. This is
-    ## temporary scaffolding until each entity (type, local, procedure,
-    ## etc.) is consistently represented as an index-like handle in the
-    ## code generator, at which point a ``Store`` (or ``SeqMap``) can be
-    ## used directly.
-    ##
-    ## Mapping from a symbol to the associated data currently happens via
-    ## ``TSym.locId``.
-    store: Store[range[0'u32..high(uint32)-1], T]
-
   TLocKind* = enum
     locNone,                  ## no location
     locTemp,                  ## temporary location
@@ -207,7 +196,7 @@ type
       ## the locs for all alive constants of the program
     procs*: SeqMap[ProcedureId, ProcLoc]
       ## the locs for all alive procedure of the program
-    fields*: SymbolMap[string]
+    fields*: Table[FieldId, string]
       ## stores the C name for each field
 
     hooks*: seq[(BModule, ProcedureId)]
@@ -230,18 +219,13 @@ type
     cfilename*: AbsoluteFile  ## filename of the module (including path,
                               ## without extension)
     tmpBase*: Rope            ## base for temp identifier generation
-    typeCache*: TypeCache     ## cache the generated types
-    typeABICache*: HashSet[SigHash] ## cache for ABI checks; reusing typeCache
-                              ## would be ideal but for some reason enums
-                              ## don't seem to get cached so it'd generate
-                              ## 1 ABI check per occurence in code
-    forwTypeCache*: TypeCache ## cache for forward declarations of types
+    typeCache*: Table[TypeId, Rope] ## cache the generated types
+    forwTypeCache*: Table[TypeId, Rope] ## cache for forward declarations of types
     declaredThings*: IntSet   ## things we have declared in this .c file
     declaredProtos*: IntSet   ## prototypes we have declared in this .c file
     headerFiles*: seq[string] ## needed headers to include
     typeInfoMarker*: TypeCache ## needed for generating type information
     typeInfoMarkerV2*: TypeCache
-    typeStack*: TTypeSeq      ## used for type generation
     defaultCache*: Table[SigHash, int]
       ## maps a type hash to the name of a C constant storing the type's
       ## default value
@@ -277,10 +261,6 @@ template consts*(m: BModule): untyped  = m.g.consts
 
 template env*(p: BProc): untyped = p.module.g.env
 
-template fieldName*(p: BProc, field: PSym): string =
-  ## Returns the C name for the given `field`.
-  p.module.fields[field]
-
 template params*(p: BProc): seq[TLoc] =
   ## Returns the mutable list with the locs of `p`'s
   ## parameters.
@@ -317,36 +297,6 @@ iterator cgenModules*(g: BModuleList): BModule =
     # iterate modules in the order they were closed
     yield m
 
-proc put*[T](m: var SymbolMap[T], sym: PSym, it: sink T) {.inline.}  =
-  ## Adds `it` to `m` and registers a mapping between the item and
-  ## `sym`. `sym` must have no mapping registered yet.
-  assert sym.locId == 0, "symbol already registered"
-  sym.locId = uint32(m.store.add(it)) + 1
-
-proc forcePut*[T](m: var SymbolMap[T], sym: PSym, it: sink T) {.inline.} =
-  ## Adds `it` to `m` and register a mapping between the item and
-  ## `sym`, overwriting any existing mappings of `sym`.
-  sym.locId = uint32(m.store.add(it)) + 1
-
-func assign*[T](m: var SymbolMap[T], sym: PSym, it: sink T) {.inline.}  =
-  ## Sets the value of the item in `m` with which `sym` is associated. This is
-  ## only meant as a workaround.
-  assert sym.locId > 0
-  m.store[sym.locId - 1] = it
-
-func `[]`*[T](m: SymbolMap[T], sym: PSym): lent T {.inline.} =
-  m.store[sym.locId - 1]
-
-func `[]`*[T](m: var SymbolMap[T], sym: PSym): var T {.inline.} =
-  m.store[sym.locId - 1]
-
-func contains*[T](m: SymbolMap[T], sym: PSym): bool {.inline.} =
-  sym.locId > 0 and m.store.nextId().uint32 > sym.locId - 1
-
-iterator items*[T](m: SymbolMap[T]): lent T =
-  for it in m.store.items:
-    yield it
-
 func isFilled*(x: TLoc): bool {.inline.} =
   x.k != locNone
 
diff --git a/compiler/backend/mangling.nim b/compiler/backend/mangling.nim
new file mode 100644
index 00000000000..96e4a9494fe
--- /dev/null
+++ b/compiler/backend/mangling.nim
@@ -0,0 +1,199 @@
+## Implements the "name mangling" used by the code generators. Name mangling
+## needs to make sure that:
+## * the resulting identifier is valid according to the target's rules
+## * different entities get different names
+
+import
+  compiler/ast/[
+    ast_types,
+    ast_query
+  ],
+  compiler/mir/[
+    mirtypes,
+    mirtrees
+  ],
+  compiler/modules/[
+    modulegraphs
+  ],
+  compiler/utils/[
+    idioms
+  ]
+
+from compiler/backend/ccgutils import mangle
+
+const
+  CallConvToShort: array[TCallingConvention, string] = [
+    "ni", "st", "cd", "sa", "sy", "in", "no", "fa", "cl", "nc"
+  ] ## every name must be unique and composed out of the same number of
+    ## letters
+
+proc mangle(g: ModuleGraph, env: TypeEnv, desc: TypeHeader): string
+proc mangle(g: ModuleGraph, env: TypeEnv, id: TypeId): string
+
+proc mangle(g: ModuleGraph, typ: PType): string =
+  ## For object types, returns a unique name based on the original symbol.
+  ## An empty string otherwise.
+  if typ.isNil:
+    return ""
+
+  proc withLen(s: string): string {.inline.} =
+    result = $s.len
+    result.add s
+
+  template mangleWithLen(s: string): string =
+    withLen(mangle(s))
+
+  if typ.kind == tyObject and typ.typeInst != nil:
+    # XXX: not very stable, but guaranteed to be unique and it also works
+    #      with the current IC mechanism
+    result = "I" & mangleWithLen(typ.typeInst[0].sym.name.s) & "_" & $typ.id
+  elif typ.kind == tyObject or (typ.sym != nil and sfImportc in typ.sym.flags):
+    # imported types are nominal types from the perspective of name mangling
+    let
+      s = typ.sym
+      m {.cursor.} = g.ifaces[typ.itemId.module].uniqueName
+
+    # the underscores are not strictly necessary; they're only added for
+    # better readability
+    if sfExported in s.flags:
+      # exported object types have unique name within their defining module.
+      # "G" stands for "global"
+      result = "G" & mangleWithLen(s.name.s) & "_M" & withLen(m)
+    elif sfAnon in s.flags:
+      # use the local ID as the name. "H" stands for "hidden"
+      result = "H" & $s.itemId.item & "_M" & withLen(m)
+    else:
+      # non-exported object types don't necessarily have unique names within a
+      # module; the ID is included to produce a unique name
+      result = "L" & mangleWithLen(s.name.s) & "_" & $s.itemId.item & "_M" &
+               withLen(m)
+  else:
+    result = "" # needs a structure-derived name
+
+proc mangleStruct(g: ModuleGraph, env: TypeEnv, prefix: string,
+                  desc: TypeHeader): string =
+  result = prefix
+  result.addInt desc.numFields
+  # bitsize, offset, custom alignment, etc. can only be used in records that
+  # don't use structure-based mangling, and can thus be ignored here
+  for (_, f) in fields(env, desc):
+    result.add mangle(g, env, f.typ)
+
+proc mangleProc(result: var string, g: ModuleGraph, env: TypeEnv,
+                desc: TypeHeader) =
+  ## (return type)(parameter count)(parameters)*(E)?
+  let hasVarargs = desc.hasVarargs(env)
+  result.add mangle(g, env, desc.retType(env))
+  result.addInt desc.numParams + ord(hasVarargs)
+  for _, it, flags in env.params(desc):
+    result.add mangle(g, env, it)
+    # the flags are also part of the procedural type
+    if pfByRef in flags:
+      result.add "_R"
+
+  if hasVarargs:
+    result.add "E" # E for ellipsis
+
+proc mangle(g: ModuleGraph, env: TypeEnv, desc: TypeHeader): string =
+  ## Produces a mangled name from the *content* of the type `desc`.
+  template recurse(id: TypeId): string =
+    mangle(g, env, id)
+
+  case desc.kind
+  of tkRecord:
+    # no name specified, derive one from the structure
+    result = mangleStruct(g, env, "T", desc)
+  of tkUnion:
+    # no name specified, derive one from the structure
+    result = mangleStruct(g, env, "U", desc)
+  of tkImported, tkTaggedUnion:
+    # requires the original type name
+    unreachable()
+  of tkInt:
+    result = "i"
+    result.addInt desc.size(env) * 8
+  of tkUInt:
+    result = "u"
+    result.addInt desc.size(env) * 8
+  of tkFloat:
+    result = "f"
+    result.addInt desc.size(env) * 8
+  of tkChar:
+    result = "c"
+  of tkBool:
+    result = "b"
+  of tkArray:
+    result = "A"
+    result.addInt desc.arrayLen(env)
+    result.add mangle(g, env, desc.elem)
+  of tkProc:
+    result = "P"
+    result.add CallConvToShort[desc.callConv(env)]
+    mangleProc(result, g, env, desc)
+  of tkClosure:
+    result = "C"
+    mangleProc(result, g, env, desc)
+  of tkUncheckedArray:
+    result = "a"
+    result.add recurse(desc.elem)
+  of tkSeq:
+    result = "s"
+    result.add recurse(desc.elem)
+  of tkCstring:
+    result = "x"
+  of tkOpenArray:
+    result = "o"
+    result.add recurse(desc.elem)
+  of tkRef:
+    result = "r"
+    result.add recurse(desc.elem)
+  of tkPtr:
+    result = "p"
+    result.add recurse(desc.elem)
+  of tkPointer:
+    result = "pV" # mangle as ``ptr void``
+  of tkVar:
+    result = "v"
+    result.add recurse(desc.elem)
+  of tkLent:
+    result = "l"
+    result.add recurse(desc.elem)
+  of tkVoid:
+    result = "V"
+  of tkString:
+    result = "S"
+  of tkSet:
+    result = "e"
+    result.addInt desc.count
+  of tkIndirect:
+    unreachable("cannot mangle")
+
+proc mangle(g: ModuleGraph, env: TypeEnv, id: TypeId): string =
+  result = mangle(g, env[id])
+  if result.len == 0:
+    # derive the mangled name from the canonical representation
+    result = mangle(g, env, env.headerFor(id, Canonical))
+
+  assert result.len > 0
+
+proc computeTypeName*(g: ModuleGraph, env: TypeEnv, typ: TypeId): string =
+  ## Computes the name to address the type with in the generated code. Mangled
+  ## names are always prefixed with an underscore.
+  let n = env.get(env.canonical(typ)).desc[Canonical]
+
+  case env[n].kind
+  of tkRecord, tkUnion:
+    let inst = env.get(typ).inst
+    if inst != nil and inst.sym != nil and sfExportc in inst.sym.flags:
+      # the type has an external name, use that verbatim
+      inst.sym.extname
+    else:
+      # use the mangled/decorated name
+      "_" & mangle(g, env, typ)
+  of tkImported:
+    # use the specified external name as-is
+    env.get(typ).inst.sym.extname
+  of tkString:
+    "NimStringV2"
+  else:
+    "_" & mangle(g, env, env[n])
diff --git a/compiler/mir/mirgen.nim b/compiler/mir/mirgen.nim
index 8b6651ae0fc..3fe295a0de4 100644
--- a/compiler/mir/mirgen.nim
+++ b/compiler/mir/mirgen.nim
@@ -234,7 +234,7 @@ template useSource(bu: var MirBuilder, sp: var SourceProvider,
 
 # -------------- Symbol translation --------------
 
-func localToMir(c: var TCtx, s: PSym): Local =
+proc localToMir(c: var TCtx, s: PSym): Local =
   Local(typ: c.env.types.add(s.typ),
         flags: s.flags,
         isImmutable: s.kind in {skLet, skForVar},
@@ -290,7 +290,7 @@ template emitByName(c: var TCtx, eff: EffectKind, body: untyped) =
 template addLocal(c: var TCtx, local: Local): LocalId =
   c.builder.addLocal(local)
 
-func addLocal(c: var TCtx, s: PSym): LocalId =
+proc addLocal(c: var TCtx, s: PSym): LocalId =
   ## Translates `s` to its MIR representation, registers it with body, and
   ## establishes a mapping.
   assert s.id notin c.localsMap
@@ -309,7 +309,7 @@ func uintLiteral(env: var MirEnv, val: BiggestUInt, typ: TypeId): Value =
 func floatLiteral(env: var MirEnv, val: BiggestFloat, typ: TypeId): Value =
   literal(mnkFloatLit, env.getOrIncl(val), typ)
 
-func astLiteral(env: var MirEnv, val: PNode, typ: PType): Value =
+proc astLiteral(env: var MirEnv, val: PNode, typ: PType): Value =
   literal(env.asts.add(val), env.types.add(typ))
 
 proc toIntLiteral(env: var MirEnv, val: Int128, typ: PType): Value =
@@ -359,7 +359,7 @@ template labelNode(lbl: LabelId): MirNode =
 template newLabelNode(c: var TCtx): MirNode =
   labelNode(c.builder.allocLabel())
 
-func nameNode(c: var TCtx, s: PSym): MirNode =
+proc nameNode(c: var TCtx, s: PSym): MirNode =
   let t = c.typeToMir(s.typ)
   case s.kind
   of skTemp:
@@ -380,7 +380,7 @@ func nameNode(c: var TCtx, s: PSym): MirNode =
   else:
     unreachable(s.kind)
 
-func genLocation(c: var TCtx, n: PNode): Value =
+proc genLocation(c: var TCtx, n: PNode): Value =
   let f = c.builder.push: c.builder.add(nameNode(c, n.sym))
   c.builder.popSingle(f)
 
@@ -1824,7 +1824,7 @@ proc genAsmOrEmitStmt(c: var TCtx, kind: range[mnkAsm..mnkEmit], n: PNode) =
       # both asm and emit statements support arbitrary expressions
       # (including type expressions) ...
       if it.typ != nil and it.typ.kind == tyTypeDesc:
-        c.use genTypeExpr(c, it)
+        c.use typeLit(c.typeToMir(it.typ.base))
       elif it.kind == nkSym and it.sym.kind == skField:
         # emit and asm support using raw field symbols. For pushing them
         # through to the code generators, they're quoted (i.e., boxed into
diff --git a/compiler/mir/mirtypes.nim b/compiler/mir/mirtypes.nim
index 92748c662d3..460718d1dd1 100644
--- a/compiler/mir/mirtypes.nim
+++ b/compiler/mir/mirtypes.nim
@@ -2,7 +2,16 @@
 ## `TypeEnv <#TypeEnv>`_, which stores the data for all types.
 ##
 ## All types are addressed via ``TypeId``, with the built-in types using
-## static IDs.
+## static IDs. Every ``TypeId`` is associated with a `TypeSym <#TypeSym>`_,
+## linking together the type's various representations. If multiple equal
+## structural types are added to the environment, the one added first is
+## designated as the "canonical" one.
+##
+## At the MIR level, a type representation has three different levels
+## (`Level <#Level>`_). On the `Original` level, all type references are
+## exactly as they appear in the ``PType`` form, the `Canonical` level only
+## uses references to canonical types, and the `Lowered` level is the type as
+## the code generator sees it.
 
 import
   std/[
@@ -10,8 +19,11 @@ import
     tables
   ],
   compiler/ast/[
+    ast,
     ast_types,
-    lineinfos
+    lineinfos,
+    idents,
+    types
   ],
   compiler/front/[
     options
@@ -24,26 +36,128 @@ import
     mirtrees,
     typemaps
   ],
+  compiler/ic/[
+    bitabs
+  ],
   compiler/utils/[
     containers,
     idioms
   ]
 
 type
-  TypeEnv* {.requiresInit.} = object
+  TypeKind* = enum
+    tkVoid
+    tkBool, tkChar
+    tkInt, tkUInt, tkFloat
+
+    tkPointer
+    tkPtr, tkRef, tkVar, tkLent
+
+    tkProc
+    tkClosure ## proc + environment
+
+    tkArray
+    tkUncheckedArray
+    tkOpenArray
+    tkSet
+    tkSeq
+    tkString
+    tkCstring
+
+    tkImported
+    tkIndirect # not a real type
+
+    # record-like types:
+    tkRecord
+    tkUnion
+    tkTaggedUnion
+
+  ParamFlag* = enum
+    pfByRef
+
+  IntVal = distinct uint32
+    ## If the MSB is not set, the lower 31 bits represent an unsigned integer
+    ## value. Otherwise, they represent a ``LitId``.
+
+  FieldId* = distinct uint32
+  HeaderId* = uint32
+
+  RecField* = object
+    ## Record field description.
+    ident: LitId
+    offset: IntVal
+    align*: int16
+    extra: uint16
+    typ*: TypeId
+
+  TypeHeader* = object
+    ## Type description header.
+    kind*: TypeKind
+    align*: int16   ## required alignment
+    size: IntVal    ## size in bytes
+    a: uint32       ## meaning depends on the type
+    b: uint32       ## meaning depends on the type
+
+  Level* = enum
+    Original  ## contains the original type symbols
+    Canonical ## same as `Original`, but with only canonical type symbols
+    Lowered   ## fully lowered version of the type
+
+  TypeSym* = object
+    ## A *type symbol* links together the various representations of a type.
+    inst*: PType
+      ## the original type instance
+    canon*: TypeId
+      ## if a type symbol is the canonical one, canon points to itself
+    desc*: array[Level, HeaderId]
+
+  TypeEnv* = object
     ## Stores the data associated with types. Has no valid default value, and
     ## must be explicitly initialized first.
     map: TypeTable[TypeId]
-      ## maps the hash of a type. Since the hash is not guaranteed to be
-      ## unique, hash collisions are possible!
-      # XXX: ^^ the collision needs to be addressed at some point. A proper,
-      #      non-sighash-based comparision needs to be used
-    types: Store[TypeId, PType]
+    symbols {.requiresInit.}: Store[TypeId, TypeSym]
+
+    headers: Store[HeaderId, TypeHeader]
+      ## all type headers
+    fields: seq[RecField]
+      ## all record fields referenced from `headers`
+    params: seq[tuple[x: uint32, typ: TypeId]]
+      ## all parameters referenced from `headers`
+
+    structs: seq[uint32]
+      ## an open-addressing hash table. Indexed by ``hash(desc)``. The
+      ## items are indices (biased by 1) into the `headers` sequence
+    numStructs: int
+      ## the number of occupied slots in `structs`
+
+    canon: Table[HeaderId, TypeId]
+      ## maps headers of canonical type descriptions to their type symbol
+
+    instances: Table[(int, HeaderId), TypeId]
+      ## associates a generic type ID + instance body with a type symbol. This
+      ## is used for eliminating same-shaped instantiations of a generic
+      ## object type
+
+    idents: BiTable[string]
+    numbers: BiTable[BiggestInt]
+
+    config: ConfigRef
+    graph: ModuleGraph
+
     sizeType: TypeId
       ## the target-dependent integer type to use for size values
     usizeType: TypeId
       ## the target-dependent unsigned integer type to use for size values
 
+  RecordBuilder = object
+    header: TypeHeader
+    start: int
+    fields: seq[RecField]
+
+  ProcBuilder* = object
+    header: TypeHeader
+    params: seq[tuple[x: uint32, typ: TypeId]]
+
 const
   VoidType*    = TypeId 0
   BoolType*    = TypeId 1
@@ -62,42 +176,744 @@ const
   CstringType* = TypeId 14
   PointerType* = TypeId 15
 
+  Skip = {tyAlias, tyDistinct, tySink, tyGenericInst, tyEnum, tyOrdinal,
+          tyRange} + tyUserTypeClasses
+    ## types not relevant to the MIR type description
+
+  MangleFlag = 0x4000'u16
+  NoAliasFlag = 0x8000'u16
+
+func `==`*(a, b: FieldId): bool {.borrow, inline.}
+func `==`(a, b: IntVal): bool {.borrow, inline.}
+
+func hash(env: TypeEnv, t: TypeHeader): Hash =
+  ## Computes the structural hash for the type `t`.
+  result = hash(t.kind)
+  case t.kind
+  of tkVoid, tkBool, tkChar, tkPointer, tkString, tkCstring:
+    discard "no additional content to hash"
+  of tkInt, tkUInt, tkFloat, tkPtr, tkRef, tkVar, tkLent, tkSeq,
+     tkUncheckedArray, tkOpenArray, tkSet, tkIndirect, tkImported:
+    result = result !& hash(t.a)
+  of tkArray:
+    result = result !& hash(t.a) !& hash(t.b)
+  of tkRecord, tkUnion, tkTaggedUnion:
+    # size and alignment doesn't need to be part of the hash. Two structural
+    # types with the same content cannot have different size or alignment,
+    # and two nominal types are always distinct
+    for it in t.a..<t.b:
+      result = result !& hash(env.fields[it])
+  of tkProc, tkClosure:
+    for it in t.a..<t.b:
+      result = result !& hash(env.params[it])
+
+  result = !$(result)
+
+func isEqual(env: TypeEnv, a, b: TypeHeader): bool =
+  ## Compares `a` and `b` for structural equality.
+  if a.kind != b.kind:
+    return false
+
+  func isEqual(s: seq, a, b, len: uint32): bool {.nimcall.} =
+    for i in 0..<len:
+      if s[a + i] != s[b + i]:
+        return false
+    result = true
+
+  template fieldCount(t: TypeHeader): uint32 =
+    t.b - t.a # also valid for procedure types
+
+  case a.kind
+  of tkVoid, tkBool, tkChar, tkPointer, tkString, tkCstring:
+    true
+  of tkInt, tkUInt, tkFloat, tkPtr, tkRef, tkVar, tkLent, tkSeq,
+     tkUncheckedArray, tkOpenArray, tkSet, tkIndirect, tkImported:
+    a.a == b.a
+  of tkArray:
+    a.a == b.a and a.b == b.b
+  of tkRecord, tkUnion, tkTaggedUnion:
+    if fieldCount(a) == fieldCount(b): # same number of fields?
+      isEqual(env.fields, a.a, b.a, fieldCount(a))
+    else:
+      false
+  of tkProc, tkClosure:
+    if fieldCount(a) == fieldCount(b): # same number of params?
+      isEqual(env.params, a.a, b.a, fieldCount(a))
+    else:
+      false
+
+# -------------------------
+# Hash-table implementation
+
+template maxHash(t: seq): int =
+  t.high
+
+template isFilled(m: uint32): bool =
+  m != 0
+
+template nextTry(i, max: int): int =
+  (i + 1) and max
+
+func enlarge(env: var TypeEnv) =
+  ## Grows and re-hashes the `env.structs` hash-table.
+  template tbl: untyped = env.structs
+  var n = newSeq[uint32](tbl.len * 2)
+  swap(n, tbl)
+  for old in n.items:
+    if old.isFilled:
+      var j = hash(env, env.headers[old-1]) and maxHash(tbl)
+      while tbl[j].isFilled:
+        j = nextTry(j, maxHash(tbl))
+      tbl[j] = old
+
+func deduplicate(env: var TypeEnv, header: TypeHeader): (bool, HeaderId) =
+  ## Adds `header` to env, but only if the type wasn't added already. Only
+  ## types previously passed to `deduplicate` are considered. Returns the
+  ## ID to address the added header with and whether it existed already.
+  let hash = hash(env, header) ## hash of the tree
+  var i = hash and maxHash(env.structs)
+  # note: the items in the table are offset by 1, so that '0' means
+  # "empty slot"
+  if env.structs.len > 0:
+    while (let slot = env.structs[i]; slot.isFilled):
+      let h = uint32(slot - 1) # header index
+      if isEqual(env, header, env.headers[h]): # same types?
+        return (true, h) # already exists
+      i = nextTry(i, maxHash(env.structs))
+
+    # not a duplicate. Before adding a new entry, first enlarge the table, if
+    # necessary
+    template mustRehash(len, counter: int): bool =
+      (len * 2 < counter * 3) or (len - counter < 4)
+
+    if mustRehash(env.structs.len, env.numStructs):
+      enlarge(env)
+      i = hash and maxHash(env.structs)
+      # find the first empty slot:
+      while isFilled(env.structs[i]):
+        i = nextTry(i, maxHash(env.structs))
+
+  else:
+    # the table is empty, initialize it
+    env.structs.setLen(16) # must be a power of two
+    i = hash and maxHash(env.structs)
+
+  let id = env.headers.add header
+  # remember the description in the list:
+  env.structs[i] = id + 1
+  inc env.numStructs
+
+  result = (false, id)
+
+proc toIntVal(env: var TypeEnv, val: BiggestInt): IntVal =
+  ## Turns `val` into an ``IntVal``.
+  if val in 0..0x7FFF_FFFF:
+    IntVal(val)
+  else:
+    IntVal(uint32(env.numbers.getOrIncl(val)) or 0x8000_0000'u32)
+
+proc getInt(env: TypeEnv, val: IntVal): BiggestInt =
+  ## Turns `val` back into an integer value.
+  if (val.uint32 and 0x8000_0000'u32) == 0:
+    BiggestInt(val.uint32 and 0x7FFF_FFFF'u32)
+  else:
+    env.numbers[LitId(val.uint32 and 0x7FFF_FFFF'u32)]
+
+# Type inspection/query routines
+# ------------------------------
+
+# the query routines are simple enough to warrant inlining
+{.push inline.}
+
+func headerFor*(env: TypeEnv, id: TypeId, phase: Level): lent TypeHeader =
+  env.headers[env.symbols[id].desc[phase]]
+
+func `[]`*(env: TypeEnv, id: HeaderId): lent TypeHeader {.inline.} =
+  env.headers[id]
+
+func size*(desc: TypeHeader, env: TypeEnv): BiggestInt {.inline.} =
+  ## Returns the size-in-bytes for the given type.
+  env.getInt(desc.size)
+
+proc elem*(desc: TypeHeader): TypeId {.inline.} =
+  ## Returns the element type for `desc`.
+  assert desc.kind in {tkArray, tkSeq, tkUncheckedArray, tkIndirect,
+                       tkImported, tkOpenArray, tkLent, tkVar, tkPtr, tkRef}
+  desc.a.TypeId
+
+proc count*(desc: TypeHeader): uint32 {.inline.} =
+  ## Returns the number of elements the ``set`` type can contain.
+  assert desc.kind == tkSet
+  desc.a
+
+proc arrayLen*(desc: TypeHeader, env: TypeEnv): BiggestInt {.inline.} =
+  assert desc.kind == tkArray
+  env.getInt(IntVal desc.b)
+
+func discr*(desc: TypeHeader, env: TypeEnv): FieldId =
+  ## Returns the discriminator field for the given tagged union.
+  assert desc.kind == tkTaggedUnion
+  FieldId desc.a
+
+func numParams*(desc: TypeHeader): int =
+  int(desc.b - desc.a) - 1
+
+func callConv*(desc: TypeHeader, env: TypeEnv): TCallingConvention =
+  TCallingConvention(env.params[desc.a].x and 0x7FFF_FFFF'u32) # w/o varargs bit
+
+func hasVarargs*(desc: TypeHeader, env: TypeEnv): bool =
+  (env.params[desc.a].x and 0x8000_0000'u32) != 0
+
+func retType*(desc: TypeHeader, env: TypeEnv): TypeId =
+  assert desc.kind in {tkProc, tkClosure}
+  env.params[desc.a].typ
+
+iterator params*(env: TypeEnv, desc: TypeHeader
+                ): tuple[i: int, typ: TypeId, flags: set[ParamFlag]] =
+  ## Returns the type and flags for all parameters of `desc`.
+  for i in (desc.a + 1)..<desc.b:
+    yield (int(i - desc.a - 1), env.params[i].typ,
+           cast[set[ParamFlag]](env.params[i].x))
+
+func base*(desc: TypeHeader, env: TypeEnv): TypeId =
+  ## Returns the node storing the base type (i.e., the parent type) for a
+  ## record type.
+  assert desc.kind == tkRecord
+  env.fields[desc.a].typ
+
+func fieldOffset*(desc: TypeHeader, env: TypeEnv): int32 =
+  ## Returns the first field's position in the object.
+  assert desc.kind == tkRecord
+  env.fields[desc.a].align.int32
+
+func isPacked*(desc: TypeHeader, env: TypeEnv): bool =
+  ## Whether the record type is packed.
+  assert desc.kind == tkRecord
+  env.fields[desc.a].extra == 1
+
+func numFields*(desc: TypeHeader): int =
+  ## Returns the number of fields in the record-like type, ignoring parent
+  ## types.
+  int(desc.b - desc.a) - ord(desc.kind == tkRecord)
+
+func isNamed*(f: RecField): bool =
+  f.ident != LitId(0)
+
+func name*(env: TypeEnv, f: RecField): lent string =
+  assert f.ident != LitId(0)
+  result = env.idents[f.ident]
+
+func isNoMangle*(f: RecField): bool =
+  ## Whether the field's name must not be mangled.
+  (f.extra and MangleFlag) == 0
+
+func isNoAlias*(f: RecField): bool =
+  (f.extra and NoAliasFlag) != 0
+
+func bitsize*(f: RecField): int =
+  int(f.extra and 0x00FF)
+
+{.pop.} # inline
+
+iterator fields*(env: TypeEnv, desc: TypeHeader;
+                 offset = 0): (FieldId, RecField) =
+  ## Returns all fields directly part of `desc`. Super types are not
+  ## considered.
+  assert desc.kind in {tkRecord, tkUnion, tkTaggedUnion}
+  # note: the field storing the super type is not included
+  let offset = ord(desc.kind == tkRecord) + offset
+  for it in (desc.a + uint32(offset))..<desc.b:
+    yield (FieldId(it), env.fields[it])
+
+proc computeDepth*(env: TypeEnv, desc: TypeHeader, pos: int32): int =
+  ## Computes the depth at which the field with position `pos` is located.
+  ## 0 means it's part of `desc`, 1 means it's part of the first parent type,
+  ## etc.
+  case desc.kind
+  of tkRecord:
+    result = 0
+    var h {.cursor.} = desc
+    while h.fieldOffset(env) > pos:
+      h = env.headerFor(h.base(env), Lowered)
+      inc result
+  of tkUnion:
+    result = 0
+  of tkImported, tkIndirect:
+    result = computeDepth(env, env.headerFor(desc.elem, Lowered), pos)
+  else:
+    unreachable(desc.kind)
+
+proc canonical*(env: TypeEnv, typ: TypeId): TypeId =
+  ## Returns the canonical symbol for `typ`. All indirections are skipped.
+  result = env.symbols[typ].canon
+  # skip indirections:
+  while env.headerFor(result, Canonical).kind == tkIndirect:
+    result = env.headerFor(result, Canonical).elem
+
+proc isEmbedded*(env: TypeEnv, typ: TypeId): bool =
+  ## Whether the `typ` is a record that's directly embedded where it's used.
+  env.symbols[typ].inst.isNil and
+    env.headerFor(typ, Lowered).kind in {tkRecord, tkTaggedUnion}
+
+proc lookupField*(env: TypeEnv, typ: TypeId, pos: int32): FieldId =
+  ## Returns the ID of the field with position `pos`. Said field *must* exist
+  ## in record-like type `typ`. Imported types and indirection are skipped.
+
+  # skip indirections and imported types:
+  var typ = env.symbols[typ].canon
+  while env.headerFor(typ, Canonical).kind in {tkIndirect, tkImported}:
+    typ = env.headerFor(typ, Canonical).elem
+
+  var curr = 0'i32
+  # seek to the type in the inheritance hierarchy that contains the field
+  if env.headerFor(typ, Lowered).kind == tkRecord:
+    curr = env.headerFor(typ, Lowered).fieldOffset(env)
+    while curr > pos: # part of the current record?
+      # it's not, try the parent type
+      typ = env.headerFor(typ, Lowered).base(env)
+      curr = env.headerFor(typ, Lowered).fieldOffset(env)
+
+    assert typ != VoidType, "field not in record"
+
+  proc searchRecord(env: TypeEnv, desc: TypeHeader, pos: int32,
+                    curr: var int32): (bool, FieldId) =
+    # look for the field whose position matches `pos`. Anonymous record-like
+    # types are always embedded at the moment, so they are transparently
+    # recursed into
+    for (id, it) in fields(env, desc):
+      if isEmbedded(env, it.typ):
+        result = searchRecord(env, env.headerFor(it.typ, Lowered), pos, curr)
+        if result[0]:
+          return
+      elif curr == pos:
+        return (true, id)
+      else:
+        inc curr
+
+    result = (false, default(FieldId))
+
+  let r = searchRecord(env, env.headerFor(typ, Lowered), pos, curr)
+  assert r[0], "field not in type"
+  result = r[1]
+
+# Record/proc builder API
+# -----------------------
+
+proc newType*(env: var TypeEnv, desc: HeaderId): TypeId =
+  ## If none exists already, creates a new type symbol for `desc`.
+  result = env.canon.mgetOrPut(desc, env.symbols.nextId())
+  if result == env.symbols.nextId():
+    # no type symbol exists yet
+    result = env.symbols.add(TypeSym(canon: result, desc: [desc, desc, desc]))
+
+proc openRecord(size: IntVal, align: int16; offset = 0;
+                base = VoidType): RecordBuilder =
+  result.header = TypeHeader(kind: tkRecord, size: size, align: align, b: 1)
+  result.fields.add RecField(typ: base, align: offset.int16)
+
+proc open(kind: TypeKind; size: IntVal, align: int16): RecordBuilder =
+  assert kind in {tkUnion, tkTaggedUnion}
+  result.header = TypeHeader(kind: kind, size: size, align: align)
+
+proc openProc(env: TypeEnv, kind: TypeKind, conv: TCallingConvention,
+              ret: TypeId, isVarargs: bool): ProcBuilder =
+  ## Opens a builder for a procedure-like type.
+  assert kind in {tkProc, tkClosure}
+  result.header = TypeHeader(kind: kind, b: 1,
+                             align: env.config.target.ptrSize.int16)
+  if kind == tkProc:
+    result.header.size = IntVal(env.config.target.ptrSize)
+  else:
+    # a closure is two pointers
+    result.header.size = IntVal(env.config.target.ptrSize * 2)
+  result.params.add (uint32(conv) or (uint32(ord(isVarargs)) shl 31), ret)
+
+proc openRecord(b: var RecordBuilder): RecordBuilder =
+  result = RecordBuilder(start: b.fields.len)
+  swap(result.fields, b.fields) # temporarily take over the buffer
+  result.header = TypeHeader(kind: tkRecord, b: 1)
+  result.fields.add RecField(typ: VoidType, align: 0)
+
+proc open(b: var RecordBuilder, kind: TypeKind): RecordBuilder =
+  assert kind in {tkUnion, tkTaggedUnion}
+  result = RecordBuilder(start: b.fields.len)
+  swap(result.fields, b.fields) # temporarily take over the buffer
+  result.header = TypeHeader(kind: kind)
+
+proc addField(b: var RecordBuilder, env: var TypeEnv, offset: IntVal,
+              typ: TypeId; name = ""; mangle = true) =
+  ## Adds a field declaration. `typ` is the type, `name` the name, and `mangle`
+  ## indicates whether the name should be mangled.
+  inc b.header.b
+  if name.len > 0:
+    b.fields.add RecField(typ: typ, offset: offset,
+                          ident: env.idents.getOrIncl(name),
+                          extra: (if mangle: MangleFlag else: 0))
+  else:
+    b.fields.add RecField(typ: typ, offset: offset)
+
+proc addField(b: var RecordBuilder, offset: IntVal, typ: TypeId) =
+  inc b.header.b
+  b.fields.add RecField(typ: typ, offset: offset)
+
+proc addField(b: var RecordBuilder, env: var TypeEnv, s: PSym, typ: TypeId) =
+  var field = RecField(typ: typ, offset: env.toIntVal(s.offset),
+                       align: s.alignment.int16)
+  if {sfImportc, sfExportc} * s.flags == {}:
+    field.ident = env.idents.getOrIncl(s.name.s)
+    field.extra = MangleFlag
+  else:
+    # use the external name and disable mangling
+    field.ident = env.idents.getOrIncl(s.extname)
+
+  if sfNoalias in s.flags:
+    field.extra = field.extra or NoAliasFlag
+
+  # the bitsize value can only be in the range 0..64, so it fits well into the
+  # lower 8 bits of `extra`
+  field.extra = field.extra or uint16(s.bitsize)
+
+  inc b.header.b
+  b.fields.add field
+
+proc addParam*(b: var ProcBuilder, s: set[ParamFlag], typ: TypeId) =
+  ## Adds a parameter to the proc type.
+  inc b.header.b
+  b.params.add (cast[uint32](s), typ)
+
+proc close(prev: var RecordBuilder, env: var TypeEnv,
+           other: sink RecordBuilder): HeaderId =
+  ## Closes `other`, committing the type description to `env`. `prev` must be
+  ## the builder `other` was previously spawned from.
+  var header = other.header
+  header.a += env.fields.len.uint32
+  header.b += env.fields.len.uint32
+  # move the fields to the environment:
+  env.fields.add other.fields.toOpenArray(other.start, other.fields.high)
+  other.fields.setLen(other.start)
+  # hand the buffer back to the parent builder:
+  swap(prev.fields, other.fields)
+
+  # nested records are currently always anonymous and never de-duplicated:
+  result = env.headers.add header
+
+proc close(b: sink RecordBuilder, env: var TypeEnv; unique = false): HeaderId =
+  ## Finalizes the record description and commits it to `env`. De-duplication
+  ## is only performed if `unique` is false.
+  var header = b.header
+  header.a += env.fields.len.uint32
+  header.b += env.fields.len.uint32
+  var start = env.fields.len
+  env.fields.add b.fields
+
+  if unique:
+    result = env.headers.add(header)
+  else:
+    # register the type description in the deduplication table
+    var existed: bool
+    (existed, result) = deduplicate(env, header)
+    if existed:
+      env.fields.setLen(start)
+
+proc close(env: var TypeEnv, b: sink ProcBuilder): uint32 =
+  ## Finishes the type description, and returns its root node. If the type
+  ## description already existed previously, no new one is added.
+  var header = b.header
+  header.a += env.params.len.uint32
+  header.b += env.params.len.uint32
+  var start = env.params.len
+  env.params.add b.params
+
+  # register the type description in the deduplication table
+  var existed: bool
+  (existed, result) = deduplicate(env, header)
+  if existed:
+    env.params.setLen(start)
+
+# Type translation/lowering
+# -------------------------
+
+proc add*(env: var TypeEnv, t: PType): TypeId
+
+proc recordToMir(env: var TypeEnv, rec: var RecordBuilder, n: PNode,
+                 packed, canon: bool) =
+  ## Translates record node/AST `n` to the corresponding MIR type description.
+  template recurse(rec: var RecordBuilder, n: PNode) =
+    recordToMir(env, rec, n, packed, canon)
+
+  case n.kind
+  of nkSym:
+    var t = env.add(n.sym.typ)
+    if canon:
+      t = canonical(env, t)
+
+    rec.addField(env, n.sym, t)
+  of nkRecList:
+    for it in n.items:
+      recurse(rec, it)
+  of nkRecCase:
+    # at the moment, tagged union descriptions are directly embedded into
+    # their parent record
+    var tu = rec.open(tkTaggedUnion)
+    recurse(tu, n[0]) # discriminator
+    for i in 1..<n.len:
+      let child = n[i][^1]
+      if child.kind == nkSym:
+        recurse(tu, child)
+      else:
+        # start a new record
+        var sub = tu.openRecord()
+        if packed:
+          sub.fields[^1].extra = 1 # mark as packed
+        recurse(sub, child)
+        let x = tu.close(env, sub)
+        # add as field to the tagged union:
+        tu.addField(IntVal(0), env.newType(x))
+
+    let x = rec.close(env, tu)
+    rec.addField(env.toIntVal(n[0].sym.offset), env.newType(x))
+  else:
+    unreachable(n.kind)
+
+proc nextFieldPosition(t: PType): int =
+  ## Computes the position of the would-be next field added to object-type `t`.
+  let t = t.skipTypes(skipPtrs)
+  if t.n.len > 0:
+    var n = t.n
+    # seek to the record's very last field:
+    while n.kind != nkSym:
+      n = n[^1]
+    result = n.sym.position + 1
+  elif t[0].isNil:
+    # no super type and no body
+    result = 0
+  else:
+    # no body, but there's a super type to inspect
+    result = nextFieldPosition(t[0])
+
+proc skipIrrelevant(t: sink PType): PType =
+  ## Skips all types that don't contribute to the MIR type description.
+  while t.kind in Skip and (t.sym.isNil or sfImportc notin t.sym.flags):
+    t = t.lastSon
+  result = t
+
+proc add(env: var TypeEnv, desc: sink TypeHeader): HeaderId =
+  ## Adds `desc` to `env`, but only if it doesn't exist there already.
+  var existed: bool
+  (existed, result) = deduplicate(env, desc)
+
+proc objectBase(t: PType): PType =
+  # skip ref/ptr types, but make sure to not skip instance types
+  # wrapping the immediate object type
+  result = t.base
+  while result.kind notin {tyRef, tyPtr, tyObject}:
+    result = result.lastSon
+
+  case result.kind
+  of tyRef, tyPtr:
+    result = result.lastSon
+  else:
+    result = t.base # use the original base type
+
+proc makeDesc(kind: TypeKind, size: IntVal, align: int16,
+              typ: TypeId; other = 0'u32): TypeHeader {.inline.} =
+  TypeHeader(kind: kind, size: size, align: align, a: typ.uint32, b: other)
+
+proc typeToMir(env: var TypeEnv, t: PType; canon = false, unique=true): HeaderId =
+  ## Translates `t` to its MIR representation. All structural types are
+  ## deduplicated, meaning that two structural types with the same structure
+  ## will result in the same ``HeaderId``. For ``tyObject`` types,
+  ## deduplication only happens if `unique` is false.
+  template typeref(typ: PType): TypeId =
+    let t = env.add(typ)
+    if canon: canonical(env, t)
+    else:     t
+
+  template single(k: TypeKind, elem: PType): HeaderId =
+    env.add makeDesc(k, env.toIntVal(t.size), t.align, typeref elem)
+
+  template simple(id: TypeId): HeaderId = env.symbols[id].desc[Original]
+
+  case t.kind
+  of tyVoid:    simple(VoidType)
+  of tyBool:    simple(BoolType)
+  of tyChar:    simple(CharType)
+  of tyInt8:    simple(Int8Type)
+  of tyInt16:   simple(Int16Type)
+  of tyInt32:   simple(Int32Type)
+  of tyInt64:   simple(Int64Type)
+  of tyInt:     simple(env.sizeType)
+  of tyUInt8:   simple(UInt8Type)
+  of tyUInt16:  simple(UInt16Type)
+  of tyUInt32:  simple(UInt32Type)
+  of tyUInt64:  simple(UInt64Type)
+  of tyUInt:    simple(env.usizeType)
+  of tyFloat32: simple(Float32Type)
+  of tyFloat:   simple(Float64Type)
+  of tyFloat64: simple(Float64Type)
+  of tyString:  simple(StringType)
+  of tyCstring: simple(CstringType)
+  of tyPointer, tyNil: simple(PointerType)
+  of tyTuple:
+    var tup = openRecord(env.toIntVal(t.size), t.align)
+    if t.len == 0:
+      tup.addField(IntVal 0, CharType)
+    elif t.size < 0:
+      # the tuple contains some incomplete imported types; no offsets can be
+      # computed
+      for i in 0..<t.len:
+        tup.addField(env, IntVal 0, typeref t[i])
+    else:
+      var offset: BiggestInt = 0
+      for i in 0..<t.len:
+        let mask = t[i].align - 1
+        offset = (offset + mask) and not(mask) # align the offset
+        tup.addField(env, env.toIntVal(offset), typeref t[i])
+        offset += t[i].size
+
+    tup.close(env)
+  of tyObject:
+    let
+      size = env.toIntVal(t.size)
+    var
+      rec: RecordBuilder
+      isEmpty = false
+
+    if tfUnion in t.flags:
+      rec = open(tkUnion, size, t.align)
+      isEmpty = t.n.len == 0
+    elif t[0] != nil:
+      # object has a super type
+      let b = objectBase(t)
+      rec = openRecord(size, t.align, b.nextFieldPosition, typeref(b))
+    elif lacksMTypeField(t):
+      # no super type and no type header
+      rec = openRecord(size, t.align)
+      isEmpty = t.n.len == 0
+    elif (let rtti = env.graph.getCompilerProc("TNimTypeV2"); rtti != nil):
+      # the object has a field for the RTTI
+      let ptrTyp = env.newType(single(tkPtr, rtti.typ))
+      # the type field is at position -1
+      rec = openRecord(size, t.align, -1)
+      rec.addField(env, IntVal 0, ptrTyp, "m_type")
+    else:
+      # legacy support for backends not yet using RTTI fields
+      rec = openRecord(size, t.align)
+
+    if rec.header.kind == tkRecord and tfPacked in t.flags:
+      rec.fields[0].extra = 1 # mark as packed
+
+    recordToMir(env, rec, t.n, tfPacked in t.flags, canon)
+
+    if isEmpty:
+      # record-like types must always have at least *one* field
+      rec.addField(IntVal 0, CharType)
+
+    # object/union types are only de-duplicated if `unique` is false
+    rec.close(env, unique)
+  of tyProc:
+    var prc: ProcBuilder
+    let ret = if t[0].isNil: VoidType else: typeref(t[0])
+    if t.callConv == ccClosure:
+      prc = env.openProc(tkClosure, t.callConv, ret, tfVarargs in t.flags)
+    else:
+      prc = env.openProc(tkProc, t.callConv, ret, tfVarargs in t.flags)
+
+    # future direction: static parameters need to be filtered out here.
+    # Typedesc parameters only need to be removed in non-compile-time
+    # execution contexts
+    for i in 1..<t.len:
+      var s: set[ParamFlag]
+      if isPassByRef(env.config, t.n[i].sym, t[0]):
+        s.incl pfByRef
+
+      prc.addParam(s, typeref t[i])
+
+    env.close(prc)
+  of tyVar:
+    # a ``var openArray`` is just an ``openArray``
+    if classifyBackendView(t) == bvcSequence:
+      typeToMir(env, t[0], canon)
+    else:
+      single(tkVar, t[0])
+  of tyLent:
+    if classifyBackendView(t) == bvcSequence:
+      typeToMir(env, t[0], canon)
+    else:
+      single(tkLent, t[0])
+  of tyRef:
+    single(tkRef, t[^1])
+  of tyPtr:
+    single(tkPtr, t[^1])
+  of tyOpenArray, tyVarargs:
+    single(tkOpenArray, t[0])
+  of tyArray:
+    # in terms of in-memory representation, arrays always have a length of at
+    # least 1
+    let len = max(lengthOrd(env.config, t), One)
+    env.add makeDesc(tkArray, env.toIntVal(t.size), t.align,
+                     typeref elemType(t), uint32 env.toIntVal(toInt len))
+  of tySequence:
+    single(tkSeq, t[0])
+  of tySet:
+    # sets always have a length <= 2^16
+    let len = toUInt32 lengthOrd(env.config, t)
+    env.add TypeHeader(kind: tkSet, size: env.toIntVal(t.size), align: t.align,
+                       a: len)
+  of tyUncheckedArray:
+    single(tkUncheckedArray, t[0])
+  of tyTypeDesc, tyStatic, tyUntyped, tyTyped:
+    # have no relevance in the MIR's type system, beyond taking up slots
+    # XXX: untyped/typed shouldn't reach here, but currently they do
+    simple(VoidType)
+  of tyEnum, tyOrdinal, tyRange:
+    # the underlying type is usually a simple, single-node type, so
+    # translate it directly
+    typeToMir(env, t.lastSon, canon)
+  of tyUserTypeClasses, tyGenericInst, tyInferred, tySink, tyAlias, tyDistinct:
+    # use a type-reference instead of in-place translation. This prevents
+    # unnecessary de-duplication work for, e.g., object types
+    single(tkIndirect, t.lastSon)
+  else:
+    unreachable(t.kind)
+
 proc initTypeEnv*(graph: ModuleGraph): TypeEnv =
   ## Returns a fully initialized type environment instance.
-  result = TypeEnv(map: default(TypeTable[TypeId]),
-                   types: default(Store[TypeId, PType]),
-                   sizeType: VoidType,
-                   usizeType: VoidType)
+  result = TypeEnv(symbols: default(Store[TypeId, TypeSym]))
+  result.graph = graph
+  result.config = graph.config
 
-  template add(kind: TTypeKind, expect: TypeId) =
-    let
-      typ = graph.getSysType(unknownLineInfo, kind)
-      id  = result.types.add(typ)
-    assert id == expect
-    # the type needs to be mapped too
-    result.map[typ] = id
-
-  add(tyVoid, VoidType)
-  add(tyBool, BoolType)
-  add(tyChar, CharType)
-  add(tyInt8, Int8Type)
-  add(tyInt16, Int16Type)
-  add(tyInt32, Int32Type)
-  add(tyInt64, Int64Type)
-  add(tyUInt8, UInt8Type)
-  add(tyUInt16, UInt16Type)
-  add(tyUInt32, UInt32Type)
-  add(tyUInt64, UInt64Type)
-  add(tyFloat32, Float32Type)
-  add(tyFloat64, Float64Type)
-  add(tyString, StringType)
-  add(tyCstring, CstringType)
-  add(tyPointer, PointerType)
+  template add(ttk: TTypeKind, expect: TypeId, tk: TypeKind) =
+    block:
+      let
+        typ = graph.getSysType(unknownLineInfo, ttk)
+        desc = result.headers.add:
+          TypeHeader(kind: tk, size: IntVal(typ.size), align: typ.align)
+        id  = result.symbols.add:
+          TypeSym(inst: typ, canon: expect, desc: [desc, desc, desc])
 
-  # also register the built-in unspecified-width types. This prevents int/float
-  # literal types from being added to the environment
-  add(tyInt,   TypeId(ord(PointerType) + 1))
-  add(tyFloat, TypeId(ord(PointerType) + 2))
+      assert id == expect
+      # register a mapping:
+      result.map[typ] = id
+      result.canon[desc] = id
+
+  # setup the built-in types:
+  add tyVoid,    VoidType,    tkVoid
+  add tyBool,    BoolType,    tkBool
+  add tyChar,    CharType,    tkChar
+  add tyInt8,    Int8Type,    tkInt
+  add tyInt16,   Int16Type,   tkInt
+  add tyInt32,   Int32Type,   tkInt
+  add tyInt64,   Int64Type,   tkInt
+  add tyUInt8,   UInt8Type,   tkUInt
+  add tyUInt16,  UInt16Type,  tkUInt
+  add tyUInt32,  UInt32Type,  tkUInt
+  add tyUInt64,  UInt64Type,  tkUInt
+  add tyFloat32, Float32Type, tkFloat
+  add tyFloat64, Float64Type, tkFloat
+  add tyString,  StringType,  tkString
+  add tyCstring, CstringType, tkCstring
+  add tyPointer, PointerType, tkPointer
 
   (result.sizeType, result.usizeType) =
     case graph.config.target.intSize
@@ -105,15 +921,209 @@ proc initTypeEnv*(graph: ModuleGraph): TypeEnv =
     of 8:       (Int64Type, UInt64Type)
     else:       unreachable()
 
+  # also register the built-in unspecified-width types. This prevents int/float
+  # literal types from being added to the environment
+  discard result.add(graph.getSysType(unknownLineInfo, tyInt))
+  discard result.add(graph.getSysType(unknownLineInfo, tyFloat))
+
+  # setup the lowered representation of the string type
+  let str = graph.getCompilerProc("NimStringV2")
+  if str != nil: # not all code generators use the lowered type yet
+    let base = result.add(str.typ)
+    # redirect NimStringV2 in a way such that the code generators will
+    # treat it as being the same as ``string``
+    # XXX: this is an interim solution. Ultimately, the definition of
+    #      ``string`` in the system module should express this directly
+    result.symbols[StringType].desc[Lowered] =
+      result.symbols[base].desc[Lowered]
+    result.symbols[base].canon = StringType
+
+proc newPtrTy(env: var TypeEnv, elem: TypeId): TypeId =
+  # inherit size and alignment information from the base pointer type
+  var h = env.headerFor(PointerType, Original)
+  h.kind = tkPtr
+  h.a = elem.uint32
+  env.newType(env.add h)
+
+proc newUncheckedArrayTy(env: var TypeEnv, elem: TypeId): TypeId =
+  let desc = makeDesc(tkUncheckedArray, IntVal(0),
+                      env.headerFor(elem, Original).align, elem)
+  env.newType(env.add desc)
+
+template buildProc*(env: var TypeEnv, kind: TypeKind, conv: TCallingConvention,
+                    ret: TypeId, builder, body: untyped): TypeId =
+  ## Convenience template for a structured way of producing type descriptions.
+  block:
+    var builder = openProc(env, kind, conv, ret, false)
+    body
+    env.newType(env.close(builder))
+
+template buildRecord(env: var TypeEnv, size: IntVal, align: int16,
+                     builder, body: untyped): HeaderId =
+  block:
+    var builder = openRecord(size, align)
+    body
+    builder.close(env)
+
+proc lowerType(env: var TypeEnv, graph: ModuleGraph, id: HeaderId): HeaderId =
+  let h = env.headers[id]
+  case h.kind
+  of tkSet:
+    # either an array or integer, depending on the number of elements
+    case env.getInt(h.size)
+    of 1: env.symbols[UInt8Type].desc[Lowered]
+    of 2: env.symbols[UInt16Type].desc[Lowered]
+    of 4: env.symbols[UInt32Type].desc[Lowered]
+    of 8: env.symbols[UInt64Type].desc[Lowered]
+    else:
+      # -> array[size, uint8]
+      env.add makeDesc(tkArray, h.size, h.align, UInt8Type, h.size.uint32)
+  of tkClosure:
+    # -> (ClP_0: proc, ClE_0: pointer)
+    # the proc pointer uses the nimcall calling convention
+    let prc = env.buildProc(tkProc, ccNimCall, h.retType(env), bu):
+      for _, typ, flags in params(env, h):
+        bu.addParam(flags, typ)
+
+      # add the environment parameter:
+      bu.addParam({}, PointerType)
+
+    env.buildRecord(h.size, h.align, bu):
+      bu.addField(env, IntVal 0, prc, "ClP_0", mangle=false)
+      # XXX: the type of the environment pointer should be a ``RootRef``
+      bu.addField(env, IntVal graph.config.target.ptrSize,
+                  PointerType, "ClE_0", mangle=false)
+  of tkOpenArray:
+    # -> (ptr UncheckedArray[T], int)
+    let ptrTyp = env.newPtrTy(env.newUncheckedArrayTy(h.elem))
+
+    env.buildRecord(h.size, h.align, bu):
+      bu.addField(env, IntVal 0, ptrTyp)
+      bu.addField(env, IntVal graph.config.target.ptrSize, env.sizeType)
+  of tkSeq:
+    # -> (len: int, p: ptr (cap: int, data: UncheckedArray[T]))
+    let
+      dataType = env.newUncheckedArrayTy(h.elem)
+      # the payload type's name is inferred from the body
+      payload = env.buildRecord(h.size, h.align, bu):
+        bu.addField(env, IntVal 0, env.sizeType, "cap")
+        bu.addField(env, IntVal graph.config.target.intSize, dataType, "data")
+      ppTyp = env.newPtrTy(env.newType(payload))
+
+    env.buildRecord(h.size, h.align, bu):
+      bu.addField(env, IntVal 0, env.sizeType, "len")
+      bu.addField(env, IntVal graph.config.target.intSize, ppTyp, "p")
+  else:
+    id
+
+proc typeSymToMir(env: var TypeEnv, t: PType): TypeId =
+  discard getSize(env.config, t) # compute size, alignment, and field offsets
+
+  if t.kind == tyObject:
+    if sfCompilerProc in t.sym.flags:
+      # compilerproc types can be defined in multiple modules (see
+      # ``TNimType``). Only create a type symbol for the instance that's
+      # registered in the compilerproc table
+      # XXX: this is a workaround. Compilerproc types should only be defined
+      #      a single time within a project
+      let real = env.graph.getCompilerProc(t.sym.name.s).typ
+      if t != real:
+        result = env.add(real)
+        env.map[t] = result
+        return
+
+    # register the type symbol *first*. This prevents infinite recursion for
+    # cyclic types
+    result = env.symbols.add TypeSym(inst: t, canon: env.symbols.nextId())
+    env.map[t] = result
+
+    let
+      orig  = typeToMir(env, t, canon=false)
+      canon = typeToMir(env, t, canon=true, unique=(tfFromGeneric notin t.flags))
+
+    # there's nothing to lower for object types
+    env.symbols[result].desc = [orig, canon, canon]
+
+    # generic types support covariance for tuples. Pick an instance as the
+    # "canonical" one, so that - for example - ``Generic[(int,)]`` and
+    # ``Generic[tuple[x: int]]`` map to the same MIR type in the end
+    if tfFromGeneric in t.flags and
+       (let c = env.instances.mgetOrPut((t.sym.owner.typ.id, canon), result);
+        c != result):
+      env.symbols[result].canon = c
+  else:
+    # create the type description preserving the original type symbols:
+    let
+      orig  = typeToMir(env, t, canon=false)
+      canon = typeToMir(env, t, canon=true)
+    var lowered: HeaderId
+
+    var prev = env.canon.getOrDefault(canon, env.symbols.nextId())
+    if prev == env.symbols.nextId():
+      # the new type symbol is the *canonical* one. Create the lowered
+      # representation
+      lowered = lowerType(env, env.graph, canon)
+      # lowering could have added new type symbols
+      prev = env.symbols.nextId()
+      env.canon[canon] = prev
+    else:
+      # a canonical type symbol already exists. Inherit its lowered
+      # representation
+      lowered = env.symbols[prev].desc[Lowered]
+
+    # now add the symbol and mapping:
+    result = env.symbols.add TypeSym(inst: t, canon: prev,
+                                     desc: [orig, canon, lowered])
+    env.map[t] = result
+
+proc handleImported(env: var TypeEnv, t: PType): TypeId =
+  if t.sym != nil and sfImportc in t.sym.flags:
+    # an imported type. It's wrapped in a ``tkImported``, referencing the
+    # underlying type
+    let base = typeSymToMir(env):
+      if t.kind in Skip:
+        t.lastSon.skipIrrelevant()
+      else:
+        t
+
+    discard getSize(env.config, t) # compute the sizes, alignments, and offsets
+
+    let
+      size  = env.toIntVal(t.size)
+      orig  = env.add makeDesc(tkImported, size, t.align, base)
+      canon = env.add makeDesc(tkImported, size, t.align,
+                               env.canonical(base))
+    result = env.symbols.add TypeSym(inst: t, canon: env.symbols.nextId(),
+                                     desc: [orig, canon, canon])
+
+    # doesn't matter if a symbol mapping already exists (happens when
+    # `base` == `t`); override it
+    env.map[t] = result
+  else:
+    result = typeSymToMir(env, t)
+
 proc add*(env: var TypeEnv, t: PType): TypeId =
   ## If not registered yet, adds `t` to `env` and returns the ID to later
-  ## look it up with. Basic structural type unification is performed.
-  result = env.map.mgetOrPut(t, env.types.nextId())
-  if result == env.types.nextId():
-    result = env.types.add(t)
+  ## look it up with.
+  result = env.map.getOrDefault(t, env.symbols.nextId())
+  if result == env.symbols.nextId(): # not seen yet?
+    result = handleImported(env, t)
+    # translation of the type registered the mapping for us
+
+func get*(env: TypeEnv, id: TypeId): lent TypeSym =
+  ## Returns the symbol for `id`.
+  env.symbols[id]
+
+template `[]`*(env: TypeEnv, id: FieldId): RecField =
+  env.fields[ord(id)]
+
+template `[]`*(env: TypeEnv, t: PType): TypeId =
+  env.map[t]
 
 func `[]`*(env: TypeEnv, id: TypeId): lent PType {.inline.} =
-  env.types[id]
+  # XXX: this procedure needs to eventually start returning the ``TypeSym``
+  #      instead
+  env.symbols[id].inst
 
 func sizeType*(env: TypeEnv): TypeId {.inline.} =
   ## Returns the type to use for values representing some size. This is a
diff --git a/compiler/mir/typemaps.nim b/compiler/mir/typemaps.nim
index ce57f670f5d..f1e0cebc1a8 100644
--- a/compiler/mir/typemaps.nim
+++ b/compiler/mir/typemaps.nim
@@ -175,7 +175,7 @@ func hash*(x: Type): Hash {.inline.} =
   ## Leaked implementation detail -- do not use.
   hash(PType x)
 
-proc `[]`*[T](t: TypeTable[T], key: PType): lent T {.inline.} =
+proc `[]`*[T](t: TypeTable[T], key: PType): T {.inline.} =
   ## Looks up the item for `key`.
   t.inner[Type key]
 
@@ -186,3 +186,7 @@ proc `[]=`*[T](t: var TypeTable[T], key: PType, val: sink T) {.inline.} =
 proc mgetOrPut*[T](t: var TypeTable, key: PType, val: T): var T =
   ## If `key` has no mapping in `t`, adds one with `val` as the value first.
   t.inner.mgetOrPut(Type(key), val)
+
+proc getOrDefault*[T](t: TypeTable[T], key: PType, def: T): T =
+  ## If there's a value for `key` in `t`, returns it, `def` otherwise.
+  t.inner.getOrDefault(Type(key), def)
diff --git a/tests/align/talign.nim b/tests/align/talign.nim
index fbc4b674c47..711748a3daa 100644
--- a/tests/align/talign.nim
+++ b/tests/align/talign.nim
@@ -1,5 +1,5 @@
 discard """
-ccodeCheck: "\\i @'NIM_ALIGN(128) NI mylocal1' .*"
+ccodeCheck: "\\i @'NIM_ALIGN(128) NI64 mylocal1' .*"
 labels: "pragma alignment generic"
 description: '''
   . First one is is for Azure. The keyword ``alignof`` only exists in ``c++11``
@@ -36,9 +36,9 @@ proc foobar() =
   doAssert (cast[uint](addr(toplevel3)) and 31) == 0
 
   # test multiple align expressions
-  var mylocal1 {.align(128), align(32).}: int = 123
-  var mylocal2 {.align(128), align(32).}: int = 123
-  var mylocal3 {.align(32), align(128).}: int = 123
+  var mylocal1 {.align(128), align(32).}: int64 = 123
+  var mylocal2 {.align(128), align(32).}: int64 = 123
+  var mylocal3 {.align(32), align(128).}: int64 = 123
 
   doAssert (cast[uint](addr(mylocal1)) and 127) == 0
   doAssert (cast[uint](addr(mylocal2)) and 127) == 0
diff --git a/tests/ccgbugs/tnoalias.nim b/tests/ccgbugs/tnoalias.nim
index f200992d752..42d6238c877 100644
--- a/tests/ccgbugs/tnoalias.nim
+++ b/tests/ccgbugs/tnoalias.nim
@@ -1,10 +1,10 @@
 discard """
-  ccodecheck: "\\i@'NI* NIM_NOALIAS field;' @'NIM_CHAR* NIM_NOALIAS x,' @'void* NIM_NOALIAS q'"
+  ccodecheck: "\\i@'NI64* NIM_NOALIAS field;' @'NIM_CHAR* NIM_NOALIAS x,' @'void* NIM_NOALIAS q'"
 """
 
 type
   BigNum = object
-    field {.noalias.}: ptr UncheckedArray[int]
+    field {.noalias.}: ptr UncheckedArray[int64]
 
 proc p(x {.noalias.}: openArray[char]) =
   var q {.noalias.}: pointer = addr(x[0])
diff --git a/tests/lang_exprs/tempty_typed_expressions_issues.nim b/tests/lang_exprs/tempty_typed_expressions_issues.nim
index ed8ae20dde7..635d546368c 100644
--- a/tests/lang_exprs/tempty_typed_expressions_issues.nim
+++ b/tests/lang_exprs/tempty_typed_expressions_issues.nim
@@ -1,6 +1,6 @@
 discard """
   targets: "c js vm"
-  knownIssue.c vm: '''
+  knownIssue.c js vm: '''
     `typeRel` treats an empty array matching against a concrete type as a
     generic match, resulting in no implicit conversion being injected (the
     conversion is required for the proper typing of statement-list
@@ -9,8 +9,6 @@ discard """
 """
 
 # XXX: merge into ``tempty_typed_expressions.nim`` once the issue is fixed
-# XXX: doesn't fail for the JS backend due to the code generator being more
-#      lenient
 
 proc get(x: array[0, int]): array[0, int] = x
 

From d36b9a3525e28b2cc065812c8b87a030764d7699 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Wed, 24 Jul 2024 22:50:16 +0200
Subject: [PATCH 155/169] fix wrong cursor inference in the context of loops
 (#1388)

## Summary

* fix cursor inference bug where variables were erroneously inferred as
  cursors, leading to use-after-free issues
* improve cursor inference. `var`/`let` bindings are now inferred to be
  cursors more reliably

Fixes https://github.com/nim-works/nimskull/issues/1385

## Details

For `var`/`let` bindings defined in loops, the `aliveEnd` is now only
updated during the first analysis of the loop. This ensures that
variables defined outside the loop, but only assigned to within the
loop, always have longer alive times than variables defined within
loops, thus preventing outer variables borrowing from inner variables
(cursorfication cannot happen when a variable outlives its assignment
source).

This fix also renders obsolete the `isConditionallyReassigned`
heuristic, which was used to fix a more specific case of the same bug.
The heuristic disabled cursorfication for every variable whose
re-assignment is enclosed by both a loop and an `if`/`elif`/`else`/`of`
branch, which also applied to, e.g.:

```nim
while cond:
  if cond:
    var a = newString(...)
    var b = newString(...)
    var x: string
    x = a
    x = b # this assignment disabled `x` being turned into a cursor
    discard a
```

With the heuristic removed, in the above example, `x` is now turned
into a cursor, matching what would happen when there is no enclosing
loop or `if`.
---
 compiler/sem/varpartitions.nim    | 30 +++++++++-------
 tests/arc/topt_no_loop_cursor.nim | 58 +++++++++++++++++++++++++++++++
 tests/arc/topt_refcursors.nim     | 24 +++++++++----
 3 files changed, 93 insertions(+), 19 deletions(-)
 create mode 100644 tests/arc/topt_no_loop_cursor.nim

diff --git a/compiler/sem/varpartitions.nim b/compiler/sem/varpartitions.nim
index cb2662057a3..fce7ad41249 100644
--- a/compiler/sem/varpartitions.nim
+++ b/compiler/sem/varpartitions.nim
@@ -81,7 +81,6 @@ type
     ownsData,
     preventCursor,
     isReassigned,
-    isConditionallyReassigned,
     viewDoesMutate,
     viewBorrowsFromConst
 
@@ -118,12 +117,13 @@ type
 
   Partitions* = object
     abstractTime: AbstractTime
+    loopStart: AbstractTime
     s: seq[VarIndex]
     graphs: seq[MutationInfo]
     goals: set[Goal]
     unanalysableMutation: bool
     inAsgnSource, inConstructor, inNoSideEffectSection: int
-    inConditional, inLoop: int
+    inLoop: int
     owner: PSym
     g: ModuleGraph
 
@@ -791,10 +791,6 @@ proc traverse(c: var Partitions; n: PNode) =
 
 proc markAsReassigned(c: var Partitions; vid: int) {.inline.} =
   c.s[vid].flags.incl isReassigned
-  if c.inConditional > 0 and c.inLoop > 0:
-    # bug #17033: live ranges with loops and conditionals are too
-    # complex for our current analysis, so we prevent the cursorfication.
-    c.s[vid].flags.incl isConditionallyReassigned
 
 proc computeLiveRanges(c: var Partitions; n: PNode) =
   # first pass: Compute live ranges for locals.
@@ -831,7 +827,11 @@ proc computeLiveRanges(c: var Partitions; n: PNode) =
     dec c.abstractTime
     if n.sym.kind in {skVar, skResult, skTemp, skLet, skForVar, skParam}:
       let id = variableId(c, n.sym)
-      if id >= 0:
+      # during the second iteration of loop analysis, only update the live
+      # ranges for variables that are not defined within the loop. The
+      # intention is to prevent outer variables from having the same (or
+      # shorter) alive ranges than inner variables
+      if id >= 0 and c.s[id].aliveStart < c.loopStart:
         c.s[id].aliveEnd = max(c.s[id].aliveEnd, c.abstractTime)
         if n.sym.kind == skResult:
           c.s[id].aliveStart = min(c.s[id].aliveStart, c.abstractTime)
@@ -864,19 +864,22 @@ proc computeLiveRanges(c: var Partitions; n: PNode) =
   of nkPragmaBlock:
     computeLiveRanges(c, n.lastSon)
   of nkWhileStmt, nkForStmt:
+    let start = c.abstractTime
     for child in n: computeLiveRanges(c, child)
     # analyse loops twice so that 'abstractTime' suffices to detect cases
     # like:
     #   while cond:
     #     mutate(graph)
     #     connect(graph, cursorVar)
+    if c.inLoop == 0:
+      # live ranges in nested loops are only computed once, during the first
+      # iteration of the outermost loop
+      c.loopStart = start
     inc c.inLoop
     for child in n: computeLiveRanges(c, child)
-    inc c.inLoop
-  of nkElifBranch, nkElifExpr, nkElse, nkOfBranch:
-    inc c.inConditional
-    for child in n: computeLiveRanges(c, child)
-    dec c.inConditional
+    dec c.inLoop
+    if c.inLoop == 0:
+      c.loopStart = MaxTime
   else:
     for child in n: computeLiveRanges(c, child)
 
@@ -889,6 +892,7 @@ proc computeGraphPartitions*(s: PSym; n: PNode; g: ModuleGraph; goals: set[Goal]
     if resultPos < s.ast.safeLen:
       registerResult(result, s.ast[resultPos])
 
+  result.loopStart = MaxTime
   computeLiveRanges(result, n)
   # restart the timer for the second pass:
   result.abstractTime = AbstractTime 0
@@ -949,7 +953,7 @@ proc computeCursors*(s: PSym; n: PNode; g: ModuleGraph) =
   var par = computeGraphPartitions(s, n, g, {cursorInference})
   for i in 0 ..< par.s.len:
     let v = addr(par.s[i])
-    if v.flags * {ownsData, preventCursor, isConditionallyReassigned} == {} and
+    if v.flags * {ownsData, preventCursor} == {} and
         v.sym.kind notin {skParam, skResult} and
         v.sym.flags * {sfThread, sfGlobal} == {} and hasDestructor(v.sym.typ):
       let rid = root(par, i)
diff --git a/tests/arc/topt_no_loop_cursor.nim b/tests/arc/topt_no_loop_cursor.nim
new file mode 100644
index 00000000000..8f5de25f8ea
--- /dev/null
+++ b/tests/arc/topt_no_loop_cursor.nim
@@ -0,0 +1,58 @@
+discard """
+  description: '''
+    Ensure that outer variables don't borrow from locals within loops, when not
+    safe
+  '''
+  matrix: "--showir:mir_in:test --hints:off"
+  action: compile
+  nimoutFull: true
+  nimout: '''-- MIR: test
+scope:
+  def x: Object
+  scope:
+    while true:
+      scope:
+        scope:
+          def _3: bool = not(arg cond)
+          if _3:
+            scope:
+              goto [L2]
+        def y: Object = ()
+        def_cursor _5: Object = x
+        use(arg _5) -> [L3, L4, Resume]
+        x = sink y
+        goto [L3, L5]
+        finally (L3):
+          destroy y
+          continue {L4, L5}
+        L5:
+  L2:
+  goto [L4, L6]
+  finally (L4):
+    destroy x
+    continue {L6}
+  L6:
+
+-- end
+'''
+"""
+
+type Object = object
+
+# make Object a type that's eligible for cursor inference
+proc `=destroy`(x: var Object) =
+  discard
+
+proc use(x: Object) =
+  discard
+
+proc test(cond: bool) =
+  var x: Object
+  while cond:
+    var y = Object()
+    use x
+    # if `x` were a cursor, the above usage would observe a stale value,
+    # as the value assigned below went out of scope already
+    x = y
+
+test(false)
diff --git a/tests/arc/topt_refcursors.nim b/tests/arc/topt_refcursors.nim
index 4ad516800f4..7db1110c098 100644
--- a/tests/arc/topt_refcursors.nim
+++ b/tests/arc/topt_refcursors.nim
@@ -23,7 +23,8 @@ scope:
         def_cursor _10: Node = it
         it = _10[].ri
   L2:
-  def_cursor jt: Node = root
+  def jt: Node
+  =copy(name jt, arg root)
   scope:
     while true:
       scope:
@@ -37,12 +38,25 @@ scope:
             scope:
               goto [L5]
         def_cursor _18: Node = jt
-        def_cursor ri: Node = _18[].ri
+        def ri: Node
+        =copy(name ri, arg _18[].ri)
         def_cursor _19: Node = jt
         def_cursor _20: string = _19[].s
-        echo(arg type(array[0..0, string]), arg _20) -> [Resume]
-        jt = ri
+        echo(arg type(array[0..0, string]), arg _20) -> [L6, L7, Resume]
+        =sink(name jt, arg ri)
+        wasMoved(name ri)
+        goto [L6, L8]
+        finally (L6):
+          =destroy(name ri)
+          continue {L7, L8}
+        L8:
   L5:
+  goto [L7, L9]
+  finally (L7):
+    =destroy(name jt)
+    continue {L9}
+  L9:
+
 -- end of expandArc ------------------------'''
 """
 
@@ -64,5 +78,3 @@ proc traverse(root: Node) =
     jt = ri
 
 traverse(nil)
-
-# XXX: This optimization is not sound

From f0c722a88c526e2d7de57189ed80c03690e05ffb Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sat, 27 Jul 2024 19:01:28 +0200
Subject: [PATCH 156/169] fix fields with names containing backticks being
 inaccessible (#1389)

## Summary

Fix a regression where field names with backticks in them couldn't be
accessed with a field access.

Fixes https://github.com/nim-works/nimskull/issues/1379.

## Details

* identifier nodes resulting from gensyms are now tagged with a new
  node flag (`nfWasGensym`)
* `originalName` only strips the `gensym` suffix from identifiers
  marked with the flag
* the node flag is persistent, so that it stays on the node across tree
  copies

Looking for the full "`gensym" suffix wouldn't work, because it would
also trigger the stripping for user-created names containing the
suffix.
---
 compiler/ast/ast_query.nim                    |  3 ++-
 compiler/ast/ast_types.nim                    |  2 ++
 compiler/sem/evaltempl.nim                    |  1 +
 compiler/sem/semexprs.nim                     | 19 ++++++++++---------
 tests/lang_callable/macros/tmacros_issues.nim | 18 +++++++++++++++++-
 5 files changed, 32 insertions(+), 11 deletions(-)

diff --git a/compiler/ast/ast_query.nim b/compiler/ast/ast_query.nim
index 5c4ac058d35..7a5bed931c7 100644
--- a/compiler/ast/ast_query.nim
+++ b/compiler/ast/ast_query.nim
@@ -63,7 +63,8 @@ const
   PtrLikeKinds*: TTypeKinds = {tyPointer, tyPtr} # for VM
   
   PersistentNodeFlags*: TNodeFlags = {nfDotSetter, nfDotField, nfLL,
-                                      nfFromTemplate, nfDefaultRefsParam}
+                                      nfFromTemplate, nfDefaultRefsParam,
+                                      nfWasGensym}
   
   namePos*          = 0 ## Name of the type/proc-like node
   patternPos*       = 1 ## empty except for term rewriting macros
diff --git a/compiler/ast/ast_types.nim b/compiler/ast/ast_types.nim
index e3eead924da..9269889125e 100644
--- a/compiler/ast/ast_types.nim
+++ b/compiler/ast/ast_types.nim
@@ -612,6 +612,8 @@ type
     nfDefaultRefsParam ## a default param value references another parameter
                        ## the flag is applied to proc default values and to calls
     nfHasComment ## node has a comment
+    nfWasGensym  ## the identifier node was a gensym prior to template
+                 ## evaluation
 
   TNodeFlags* = set[TNodeFlag]
   TTypeFlag* = enum   ## keep below 32 for efficiency reasons (now: 43)
diff --git a/compiler/sem/evaltempl.nim b/compiler/sem/evaltempl.nim
index 0411400f3a8..321081e73a1 100644
--- a/compiler/sem/evaltempl.nim
+++ b/compiler/sem/evaltempl.nim
@@ -88,6 +88,7 @@ proc evalTemplateAux(templ, actual: PNode, c: var TemplCtx, result: PNode) =
         if sfGenSym in s.flags:
           result.add newIdentNode(getIdent(c.ic, x.name.s & "`gensym" & $c.instID),
             if c.instLines: actual.info else: templ.info)
+          result.flags.incl nfWasGensym
         else:
           result.add newSymNode(x, if c.instLines: actual.info else: templ.info)
     else:
diff --git a/compiler/sem/semexprs.nim b/compiler/sem/semexprs.nim
index 62e53f41943..f476c717149 100644
--- a/compiler/sem/semexprs.nim
+++ b/compiler/sem/semexprs.nim
@@ -1711,13 +1711,14 @@ proc tryReadingTypeField(c: PContext, n: PNode, i: PIdent, ty: PType): PNode =
   else:
     result = tryReadingGenericParam(c, n, i, ty)
 
-proc originalName(cache: IdentCache, ident: PIdent): PIdent =
-  ## Returns the identifier stripped off of the '`gensym' suffix, if any.
-  let i = find(ident.s, '`')
-  if i != -1:
-    # if there's a backtick in the name, the name must come from a gensym'ed
-    # symbol. Strip the '`gensym' suffix
-    cache.getIdent(ident.s.cstring, i, hashIgnoreStyle(ident.s, 0, i - 1))
+proc originalName(c: PContext, n, orig: PNode): PIdent =
+  ## Returns the identifier stripped off of the '`gensym' suffix, if
+  ## it originated from a processed gensym symbol node.
+  let ident = legacyConsiderQuotedIdent(c, n, orig)
+  if nfWasGensym in n.flags:
+    let i = rfind(ident.s, '`')
+    # strip the suffix
+    c.cache.getIdent(ident.s.cstring, i, hashIgnoreStyle(ident.s, 0, i - 1))
   else:
     ident
 
@@ -1747,7 +1748,7 @@ proc builtinFieldAccess(c: PContext, n: PNode, flags: TExprFlags): PNode =
 
   n[0] = semExprWithType(c, n[0], flags)
   var
-    i = originalName(c.cache, legacyConsiderQuotedIdent(c, n[1], n))
+    i = originalName(c, n[1], n)
     ty = n[0].typ
     f: PSym = nil
 
@@ -2072,7 +2073,7 @@ proc semArrayAccess(c: PContext, n: PNode, flags: TExprFlags): PNode =
     result = semExpr(c, result, flags)
 
 proc propertyWriteAccess(c: PContext, n, a: PNode): PNode =
-  var id = originalName(c.cache, legacyConsiderQuotedIdent(c, a[1],a))
+  var id = originalName(c, a[1], a)
   var setterId = newIdentNode(getIdent(c.cache, id.s & '='), a[1].info)
   # a[0] is already checked for semantics, that does ``builtinFieldAccess``
   # this is ugly. XXX Semantic checking should use the ``nfSem`` flag for
diff --git a/tests/lang_callable/macros/tmacros_issues.nim b/tests/lang_callable/macros/tmacros_issues.nim
index d572d0968e2..6977782c9d0 100644
--- a/tests/lang_callable/macros/tmacros_issues.nim
+++ b/tests/lang_callable/macros/tmacros_issues.nim
@@ -538,4 +538,20 @@ block orginal_parameter_types:
     doAssert x.intVal == 1
     doAssert y.intVal == 2
 
-  m(1, 2)
\ No newline at end of file
+  m(1, 2)
+
+block field_names_with_backticks:
+  # field names containing backticks (only possible with macro-generated
+  # code) couldn't be accessed with dot expressions
+  macro test() =
+    let name = ident"a`b"
+
+    result = quote do:
+      type Object = object
+        `name`: int
+
+      # test accessing the field with both constructors and a dot expression
+      let o = Object(`name`: 1)
+      doAssert o.`name` == 1
+
+  test()

From 5aa938784fa420b3c7e4685bfaa43a4d862f0f3d Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Tue, 30 Jul 2024 00:36:55 +0000
Subject: [PATCH 157/169] build(deps): Bump
 mikepenz/release-changelog-builder-action from 5.0.0.pre.a04 to 5 (#1390)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Bumps

[mikepenz/release-changelog-builder-action](https://github.com/mikepenz/release-changelog-builder-action)
from 5.0.0.pre.a04 to 5.
<details>
<summary>Release notes</summary>
<p><em>Sourced from <a

href="https://github.com/mikepenz/release-changelog-builder-action/releases">mikepenz/release-changelog-builder-action's
releases</a>.</em></p>
<blockquote>
<h2>v5</h2>
<ul>
<li>no changes</li>
</ul>
<h2>v5.0.0-rc01</h2>
<h2>🚀 Features</h2>
<ul>
<li>Enhance CONTRIBUTORS template
<ul>
<li>PR: <a

href="https://redirect.github.com/mikepenz/release-changelog-builder-action/issues/1343">#1343</a></li>
</ul>
</li>
</ul>
<h2>🐛 Fixes</h2>
<ul>
<li>Fix to match categories case insensitive for gitea
<ul>
<li>PR: <a

href="https://redirect.github.com/mikepenz/release-changelog-builder-action/issues/1346">#1346</a></li>
<li>Thanks <a

href="https://github.com/MoonLiightz"><code>@​MoonLiightz</code></a></li>
</ul>
</li>
</ul>
<h2>📦 Dependencies</h2>
<ul>
<li>Dependency upgrades | <code>semver 7.6.3</code>
<ul>
<li>PR: <a

href="https://redirect.github.com/mikepenz/release-changelog-builder-action/issues/1347">#1347</a></li>
</ul>
</li>
</ul>
</blockquote>
</details>
<details>
<summary>Commits</summary>
<ul>
<li><a

href="https://github.com/mikepenz/release-changelog-builder-action/commit/c7b3b6d92924cca3c990f7891d83d0fd56ae3944"><code>c7b3b6d</code></a>
Merge pull request <a

href="https://redirect.github.com/mikepenz/release-changelog-builder-action/issues/1348">#1348</a>
from mikepenz/develop</li>
<li><a

href="https://github.com/mikepenz/release-changelog-builder-action/commit/ef820d296c56675e58f7edbc7d5a43adde3d972a"><code>ef820d2</code></a>
Merge pull request <a

href="https://redirect.github.com/mikepenz/release-changelog-builder-action/issues/1347">#1347</a>
from mikepenz/feature/depency_upgrades_20240726</li>
<li><a

href="https://github.com/mikepenz/release-changelog-builder-action/commit/542703f95eabfdcc22919fcd983746e8386a1fdc"><code>542703f</code></a>
- recompile dist</li>
<li><a

href="https://github.com/mikepenz/release-changelog-builder-action/commit/166c6cd397596ffc308be0a40c0ac420b853ccf7"><code>166c6cd</code></a>
- revert octokit rest as its now an ESM package</li>
<li><a

href="https://github.com/mikepenz/release-changelog-builder-action/commit/488cb35032ee550ebf78f51f3765022d7ad70280"><code>488cb35</code></a>
Dependency upgrades</li>
<li><a

href="https://github.com/mikepenz/release-changelog-builder-action/commit/4d5a5160cbe596a1d466ffbfbacaf005c9450d08"><code>4d5a516</code></a>
Merge pull request <a

href="https://redirect.github.com/mikepenz/release-changelog-builder-action/issues/1346">#1346</a>
from mikepenz/fix/1345</li>
<li><a

href="https://github.com/mikepenz/release-changelog-builder-action/commit/3ff44d5e84d76d53e9fbf3942f536eeef429ffc9"><code>3ff44d5</code></a>
- recompile dist</li>
<li><a

href="https://github.com/mikepenz/release-changelog-builder-action/commit/76ceff7ddbed08cd9ec6e7e7a3a87f10b6016c1c"><code>76ceff7</code></a>
- make gitea labels lowercase so categories are matched case
insensitive</li>
<li><a

href="https://github.com/mikepenz/release-changelog-builder-action/commit/bbbdb7a6e6b42a99b1fdfe678ac6c77a7909d149"><code>bbbdb7a</code></a>
Merge pull request <a

href="https://redirect.github.com/mikepenz/release-changelog-builder-action/issues/1343">#1343</a>
from mikepenz/feature/contributors</li>
<li><a

href="https://github.com/mikepenz/release-changelog-builder-action/commit/09758f3887d667e5dd44c66c2e781ae54805e9fc"><code>09758f3</code></a>
- ensure contributors are not listed multiple times</li>
<li>See full diff in <a

href="https://github.com/mikepenz/release-changelog-builder-action/compare/v5.0.0-a04...v5">compare
view</a></li>
</ul>
</details>
<br />


[![Dependabot compatibility

score](https://dependabot-badges.githubapp.com/badges/compatibility_score?dependency-name=mikepenz/release-changelog-builder-action&package-manager=github_actions&previous-version=5.0.0.pre.a04&new-version=5)](https://docs.github.com/en/github/managing-security-vulnerabilities/about-dependabot-security-updates#about-compatibility-scores)

Dependabot will resolve any conflicts with this PR as long as you don't
alter it yourself. You can also trigger a rebase manually by commenting
`@dependabot rebase` .

[//]: # (dependabot-automerge-start)
[//]: # (dependabot-automerge-end)

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 .github/workflows/publisher.yml                        | 2 +-
 .github/workflows/slash-command-generate-changelog.yml | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/publisher.yml b/.github/workflows/publisher.yml
index 6c2fc56d13d..9c4eeb50225 100644
--- a/.github/workflows/publisher.yml
+++ b/.github/workflows/publisher.yml
@@ -113,7 +113,7 @@ jobs:
 
       - id: changelog
         name: Create release changelog
-        uses: mikepenz/release-changelog-builder-action@v5.0.0-a04
+        uses: mikepenz/release-changelog-builder-action@v5
         with:
           configuration: ".github/changelog.json"
           toTag: ${{ steps.release-files.outputs.version }}
diff --git a/.github/workflows/slash-command-generate-changelog.yml b/.github/workflows/slash-command-generate-changelog.yml
index ce93cd85d3e..9a717bd644f 100644
--- a/.github/workflows/slash-command-generate-changelog.yml
+++ b/.github/workflows/slash-command-generate-changelog.yml
@@ -44,7 +44,7 @@ jobs:
 
       - id: changelog
         name: Create changelog
-        uses: mikepenz/release-changelog-builder-action@v5.0.0-a04
+        uses: mikepenz/release-changelog-builder-action@v5
         with:
           configuration: ".github/changelog.json"
           fromTag: ${{ github.event.client_payload.slash_command.args.named.from || '' }}

From 4fed1a68b03ccc72e7871746b61e497a5da6b21d Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Wed, 31 Jul 2024 03:00:50 +0200
Subject: [PATCH 158/169] fix C codegen regression with closures (#1392)

## Summary

Fix explicit or implicit creation of a closure leading to C
compiler errors when using strict(er) C compilers.

## Details

* when lowering closure types, use a `tkProc` type with `ccClosure`
  calling convention
* using a `ccNimCall` type with an additional `void` parameter meant
  that `cgen` placed the result type (in case of RVO) *after* the
  environment type, which is incorrect and doesn't match the signature
  of closure procedures
* C compilers that require compatible types when implicitly casting
  rightfully reported an error in this case
---
 compiler/mir/mirtypes.nim | 6 +-----
 1 file changed, 1 insertion(+), 5 deletions(-)

diff --git a/compiler/mir/mirtypes.nim b/compiler/mir/mirtypes.nim
index 460718d1dd1..bccc5ce4547 100644
--- a/compiler/mir/mirtypes.nim
+++ b/compiler/mir/mirtypes.nim
@@ -980,14 +980,10 @@ proc lowerType(env: var TypeEnv, graph: ModuleGraph, id: HeaderId): HeaderId =
       env.add makeDesc(tkArray, h.size, h.align, UInt8Type, h.size.uint32)
   of tkClosure:
     # -> (ClP_0: proc, ClE_0: pointer)
-    # the proc pointer uses the nimcall calling convention
-    let prc = env.buildProc(tkProc, ccNimCall, h.retType(env), bu):
+    let prc = env.buildProc(tkProc, ccClosure, h.retType(env), bu):
       for _, typ, flags in params(env, h):
         bu.addParam(flags, typ)
 
-      # add the environment parameter:
-      bu.addParam({}, PointerType)
-
     env.buildRecord(h.size, h.align, bu):
       bu.addField(env, IntVal 0, prc, "ClP_0", mangle=false)
       # XXX: the type of the environment pointer should be a ``RootRef``

From f84f175c1f7cf018ddf4542f48dcbb568906099a Mon Sep 17 00:00:00 2001
From: "P. Starsider" <132208486+starsiderfox@users.noreply.github.com>
Date: Wed, 31 Jul 2024 03:08:12 +0200
Subject: [PATCH 159/169] Fix `sysrand` for Android (and some other POSIX
 platforms) (#1391)

## Summary
Fixes a bug that caused the compiler to fail to compile anything with
e.g. `--os:android` (and some uncommon POSIX platforms) when it uses
`sysrand` in any way, such as when importing `random`. `koch` was
affected, so one couldn't bootstrap nimskull with Android as the host
platform.

## Details
There are two POSIX constants used in `sysrand.nim` that are not
actually constants for some platforms like Android. `EINTR` and
`EAGAIN` are required to be constants at compile time because they're
used in a `case of`, but the condition is so simple that we can replace
it by an `if` statement.

They're technically constants on all platforms, but on the C side (taken
from `errno.h`), not in nimskull, and the latter is oblivious to the
content of those header files.
---
 lib/std/sysrand.nim | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/lib/std/sysrand.nim b/lib/std/sysrand.nim
index c92d1ab5d8f..d8c8a94bd15 100644
--- a/lib/std/sysrand.nim
+++ b/lib/std/sysrand.nim
@@ -189,8 +189,8 @@ elif defined(linux) and not defined(emscripten):
       elif readBytes > 0:
         inc(result, readBytes)
       else:
-        case osLastError().int
-        of EINTR, EAGAIN:
+        let err = osLastError().int
+        if err == EINTR or err == EAGAIN:
           discard
         else:
           result = -1

From ec9b4aca0ad78d769e7538d727c13dbe95ad2b6a Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Thu, 1 Aug 2024 23:48:52 +0200
Subject: [PATCH 160/169] macros: make `quote` a proper quasi-quoting operator
 (#1393)

## Summary

`quote` now keeps the quoted block as is, which means that:
* no symbols are bound or mixed in automatically from the enclosing
  scopes
* identifiers in definition positions aren't turned into gensyms; they
  stay as is
* `.gensym` and `.inject` pragmas within the quoted block don't affect
  the AST

Symbols thus need to be bound or created explicitly, via `bindSym` and
`genSym`, respectively. **This is a breaking change.**

## Details

### Motivation For The Change

* symbols from the `quote`'s scope being bound is error-prone, leading
  to confusing compilation errors
* the documentation of `quote` already stated that it does
  quasi-quoting (even though it didn't)
* the implementation relied on the intricacies of templates and
  template evaluation

### New Behaviour

* quoted AST is not modified. No symbols are bound and no identifiers
  are turned into gensyms

### Implementation

* `semQuoteAst` transforms the `quote` call into a call to the internal
  `quoteImpl` procedure
* the pre-processed quoted AST is passed as the first argument; the
  extracted unquoted expressions are passed as the remaining arguments
* the internal-only `evalToAst` magic procedure is used for evaluating
  the unquoted expressions. `newLit` cannot be used here, as the trees
  it produces for `object` values are only valid when all the type's
  fields are exported
* placing the AST of the evaluated unquoted expressions is handled
  in-VM, by `quoteImpl`

### Standard Library And Test Changes

* multiple modules from the standard library relied on the previous
  symbol binding and gensym behaviour; they're changed to use `bindSym`
  or `genSym`. Outside-visible behaviour doesn't change
* the `t7875.nim` test relied on the gensym behaviour. The definition
  outside the macro is not relevant to the issue the test guards
  against, so it can just be removed
* the quoted ASTs in `tsizeof.nim` are wrapped in blocks in order to
  prevent the identifiers from colliding
---
 compiler/ast/ast_types.nim                    |  2 +
 compiler/sem/semexprs.nim                     | 99 ++++++++-----------
 compiler/sem/sempass2.nim                     |  2 +
 compiler/sem/varpartitions.nim                |  2 +-
 compiler/vm/vmgen.nim                         |  9 +-
 lib/core/macros.nim                           | 27 ++++-
 lib/experimental/ast_pattern_matching.nim     |  2 +-
 lib/js/asyncjs.nim                            |  3 +-
 lib/js/jsffi.nim                              | 49 ++++-----
 lib/std/jsonutils.nim                         |  4 +-
 lib/std/tasks.nim                             |  3 +-
 lib/std/wrapnils.nim                          |  6 +-
 tests/lang_callable/macros/t7875.nim          |  5 +-
 tests/lang_callable/macros/tmacro6.nim        |  2 +-
 .../defer/tdefer_malformed_many_children.nim  |  2 +-
 tests/misc/tsizeof.nim                        | 21 ++--
 16 files changed, 135 insertions(+), 103 deletions(-)

diff --git a/compiler/ast/ast_types.nim b/compiler/ast/ast_types.nim
index 9269889125e..ff49afbb6a1 100644
--- a/compiler/ast/ast_types.nim
+++ b/compiler/ast/ast_types.nim
@@ -817,6 +817,8 @@ type
     mException, mBuiltinType, mSymOwner, mUncheckedArray, mGetImplTransf,
     mSymIsInstantiationOf, mNodeId, mPrivateAccess
 
+    mEvalToAst
+
     # magics only used internally:
     mStrToCStr
       ## the backend-dependent string-to-cstring conversion
diff --git a/compiler/sem/semexprs.nim b/compiler/sem/semexprs.nim
index f476c717149..e98531714e9 100644
--- a/compiler/sem/semexprs.nim
+++ b/compiler/sem/semexprs.nim
@@ -2552,9 +2552,6 @@ proc expectString(c: PContext, n: PNode): string =
   else:
     localReport(c.config, n, reportSem rsemStringLiteralExpected)
 
-proc newAnonSym(c: PContext; kind: TSymKind, info: TLineInfo): PSym =
-  result = newSym(kind, c.cache.idAnon, nextSymId c.idgen, getCurrOwner(c), info)
-
 proc semExpandToAst(c: PContext, n: PNode): PNode =
   let macroCall = n[1]
 
@@ -2606,14 +2603,11 @@ proc semExpandToAst(c: PContext, n: PNode, magicSym: PSym,
   else:
     result = semDirectOp(c, n, flags)
 
-proc processQuotations(c: PContext; n: var PNode, op: string,
-                       quotes: var seq[PNode],
-                       ids: var seq[PNode]) =
+proc processQuotations(c: PContext; n: PNode, op: string, call: PNode): PNode =
   template returnQuote(q) =
-    quotes.add q
-    n = newIdentNode(getIdent(c.cache, $quotes.len), n.info)
-    ids.add n
-    return
+    call.add q
+    # return a placeholder node. The integer represents the parameter index
+    return newTreeI(nkAccQuoted, n.info, newIntNode(nkIntLit, call.len - 3))
 
   template handlePrefixOp(prefixed) =
     if prefixed[0].kind == nkIdent:
@@ -2639,14 +2633,22 @@ proc processQuotations(c: PContext; n: var PNode, op: string,
         tempNode[0] = n[0]
         tempNode[1] = n[1]
         handlePrefixOp(tempNode)
-  of nkIdent:
-    if n.ident.s == "result":
-      n = ids[0]
   else:
     discard # xxx: raise an error
 
+  result = n
   for i in 0..<n.safeLen:
-    processQuotations(c, n[i], op, quotes, ids)
+    let x = processQuotations(c, n[i], op, call)
+    if x != n[i]:
+      # copy on write
+      if result == n:
+        result = copyNodeWithKids(n)
+      result[i] = x
+
+  if result.kind == nkAccQuoted:
+    # escape the accquote node by wrapping it in another accquote. This signals
+    # that the node is not a placeholder
+    result = newTree(nkAccQuoted, result)
 
 proc semQuoteAst(c: PContext, n: PNode): PNode =
   if n.len != 2 and n.len != 3:
@@ -2657,57 +2659,38 @@ proc semQuoteAst(c: PContext, n: PNode): PNode =
     #      got = result.len - 1
     return
 
-  # We transform the do block into a template with a param for
-  # each interpolation. We'll pass this template to getAst.
   var
     quotedBlock = n[^1]
     op = if n.len == 3: expectString(c, n[1]) else: "``"
-    quotes = newSeq[PNode](2)
-      # the quotes will be added to a nkCall statement
-      # leave some room for the callee symbol and the result symbol
-    ids = newSeq[PNode](1)
-      # this will store the generated param names
-      # leave some room for the result symbol
 
   if quotedBlock.kind != nkStmtList:
     semReportIllformedAst(c.config, n, {nkStmtList})
 
-  # This adds a default first field to pass the result symbol
-  ids[0] = newAnonSym(c, skParam, n.info).newSymNode
-  processQuotations(c, quotedBlock, op, quotes, ids)
-
-  var dummyTemplate = newProcNode(
-    nkTemplateDef, quotedBlock.info, body = quotedBlock,
-    params = c.graph.emptyNode,
-    name = newAnonSym(c, skTemplate, n.info).newSymNode,
-              pattern = c.graph.emptyNode, genericParams = c.graph.emptyNode,
-              pragmas = c.graph.emptyNode, exceptions = c.graph.emptyNode)
-
-  if ids.len > 0:
-    dummyTemplate[paramsPos] = newNodeI(nkFormalParams, n.info)
-    dummyTemplate[paramsPos].add:
-      getSysSym(c.graph, n.info, "untyped").newSymNode # return type
-    ids.add getSysSym(c.graph, n.info, "untyped").newSymNode # params type
-    ids.add c.graph.emptyNode # no default value
-    dummyTemplate[paramsPos].add newTreeI(nkIdentDefs, n.info, ids)
-
-  var tmpl = semTemplateDef(c, dummyTemplate)
-  quotes[0] = tmpl[namePos]
-  # This adds a call to newIdentNode("result") as the first argument to the
-  # template call
-  let identNodeSym = getCompilerProc(c.graph, "newIdentNode")
-  # so that new Nim compilers can compile old macros.nim versions, we check for
-  # 'nil' here and provide the old fallback solution:
-  let identNode = if identNodeSym == nil:
-                    newIdentNode(getIdent(c.cache, "newIdentNode"), n.info)
-                  else:
-                    identNodeSym.newSymNode
-  quotes[1] = newTreeI(nkCall, n.info, identNode, newStrNode(nkStrLit, "result"))
-  result =
-    c.semExpandToAst:
-      newTreeI(nkCall, n.info,
-        createMagic(c.graph, c.idgen, "getAst", mExpandToAst).newSymNode,
-        newTreeI(nkCall, n.info, quotes))
+  # turn the quasi-quoted block into a call to the internal ``quoteImpl``
+  # procedure
+  # future direction: implement this transformation in user code. The compiler
+  # only needs to provide an AST quoting facility (without quasi-quoting)
+
+  let call = newNodeI(nkCall, n.info, 2)
+  call[0] = newSymNode(c.graph.getCompilerProc("quoteImpl"))
+  # extract the unquoted parts and append them to `call`:
+  let quoted = processQuotations(c, quotedBlock, op, call)
+  # the pre-processed AST of the quoted block is passed as the first argument:
+  call[1] = newTreeI(nkNimNodeLit, n.info, quoted)
+  call[1].typ = sysTypeFromName(c.graph, n.info, "NimNode")
+
+  template ident(name: string): PNode =
+    newIdentNode(c.cache.getIdent(name), unknownLineInfo)
+
+  # the unquoted expressions are wrapped in evalToAst calls. Use a qualified
+  # identifier in order to prevent user-defined evalToAst calls to be picked
+  let callee = newTree(nkDotExpr, ident("macros"), ident("evalToAst"))
+  for i in 2..<call.len:
+    call[i] = newTreeI(nkCall, call[i].info, [callee, call[i]])
+
+  # type the call. The actual work of substituting the placeholders is
+  # done in-VM, by the ``quoteImpl`` procedure
+  result = semDirectOp(c, call, {})
 
 proc tryExpr(c: PContext, n: PNode, flags: TExprFlags = {}): PNode =
   # watch out, hacks ahead:
diff --git a/compiler/sem/sempass2.nim b/compiler/sem/sempass2.nim
index d60c2146345..306bb52febd 100644
--- a/compiler/sem/sempass2.nim
+++ b/compiler/sem/sempass2.nim
@@ -1448,6 +1448,8 @@ proc track(tracked: PEffects, n: PNode) =
     reportErrors(tracked.config, n)
   of nkError:
     localReport(tracked.config, n)
+  of nkNimNodeLit:
+    discard "don't analyse literal AST"
   else:
     for i in 0 ..< n.safeLen:
       track(tracked, n[i])
diff --git a/compiler/sem/varpartitions.nim b/compiler/sem/varpartitions.nim
index fce7ad41249..e5ec8aa31e0 100644
--- a/compiler/sem/varpartitions.nim
+++ b/compiler/sem/varpartitions.nim
@@ -670,7 +670,7 @@ const
     nkMethodDef, nkIteratorDef, nkMacroDef, nkTemplateDef, nkLambda, nkDo,
     nkFuncDef, nkConstSection, nkConstDef, nkIncludeStmt, nkImportStmt,
     nkExportStmt, nkPragma, nkTypeOfExpr, nkMixinStmt,
-    nkBindStmt}
+    nkBindStmt, nkNimNodeLit}
 
 proc potentialMutationViaArg(c: var Partitions; n: PNode; callee: PType) =
   if constParameters in c.goals and tfNoSideEffect in callee.flags:
diff --git a/compiler/vm/vmgen.nim b/compiler/vm/vmgen.nim
index d7ac4e017dd..805e3e9e524 100644
--- a/compiler/vm/vmgen.nim
+++ b/compiler/vm/vmgen.nim
@@ -207,7 +207,7 @@ const
                      cnkObjDownConv, cnkDeref, cnkDerefView, cnkLvalueConv}
 
   MagicsToKeep* = {mIsolate, mNHint, mNWarning, mNError, mMinI, mMaxI,
-                   mAbsI, mDotDot, mNGetType, mNSizeOf, mNLineInfo}
+                   mAbsI, mDotDot, mNGetType, mNSizeOf, mNLineInfo, mEvalToAst}
     ## the set of magics that are kept as normal procedure calls and thus need
     ## an entry in the function table.
     # XXX: mNGetType, mNGetSize, and mNLineInfo *are* real magics, but their
@@ -2171,6 +2171,13 @@ proc genMagic(c: var TCtx; n: CgNode; dest: var TDest; m: TMagic) =
 
     c.gABC(n, opcExpandToAst, dest, x, numArgs)
     c.freeTempRange(x, numArgs)
+  of mEvalToAst:
+    if n[1].typ.isNimNode():
+      # don't use ``DataToAst` if the argument is already a NimNode, only copy
+      # the tree
+      c.genUnaryABC(n, dest, opcNCopyNimTree)
+    else:
+      c.genDataToAst(n[1], dest)
   of mSizeOf, mAlignOf, mOffsetOf:
     fail(n.info, vmGenDiagMissingImportcCompleteStruct, m)
 
diff --git a/lib/core/macros.nim b/lib/core/macros.nim
index 9cbbba59394..2038e7da222 100644
--- a/lib/core/macros.nim
+++ b/lib/core/macros.nim
@@ -522,7 +522,8 @@ proc quote*(bl: typed, op = "``"): NimNode {.magic: "QuoteAst", noSideEffect.} =
   ## A custom operator interpolation needs accent quoted (``) whenever it resolves
   ## to a symbol.
   ##
-  ## See also `genasts <genasts.html>`_ which avoids some issues with `quote`.
+  ## See also:
+  ## * `genasts <genasts.html>`_
   runnableExamples:
     macro check(ex: untyped) =
       # this is a simplified version of the check macro from the
@@ -591,6 +592,30 @@ proc quote*(bl: typed, op = "``"): NimNode {.magic: "QuoteAst", noSideEffect.} =
         doAssert y == 3
     bar2()
 
+proc quoteImpl(n: NimNode, args: varargs[NimNode]): NimNode {.compilerproc,
+    compileTime.} =
+  ## Substitutes the placeholders in `n` with the corresponding AST from
+  ## `args`. Invoked by the compiler for implementating ``quote``.
+  proc aux(n: NimNode, args: openArray[NimNode]): NimNode =
+    case n.kind
+    of nnkAccQuoted:
+      if n[0].kind == nnkAccQuoted:
+        result = n[0] # an escaped accquoted tree
+      else:
+        result = args[n[0].intVal] # a placeholder
+    else:
+      result = n
+      for i in 0..<n.len:
+        result[i] = aux(n[i], args)
+
+  result = aux(n, args)
+  # unwrap single-element statement lists:
+  if n.kind == nnkStmtList and n.len == 1:
+    result = n[0]
+
+proc evalToAst*[T](x: T): NimNode {.magic: "EvalToAst".} =
+  ## Leaked implementation detail. **Do not use**.
+
 proc expectKind*(n: NimNode, k: NimNodeKind) =
   ## Checks that `n` is of kind `k`. If this is not the case,
   ## compilation aborts with an error message. This is useful for writing
diff --git a/lib/experimental/ast_pattern_matching.nim b/lib/experimental/ast_pattern_matching.nim
index 53f11f04176..ced2b76f627 100644
--- a/lib/experimental/ast_pattern_matching.nim
+++ b/lib/experimental/ast_pattern_matching.nim
@@ -38,7 +38,7 @@ type
     WrongIdent
     WrongCustomCondition
 
-  MatchingError = object
+  MatchingError* = object
     node*: NimNode
     expectedKind*: set[NimNodeKind]
     case kind*: MatchingErrorKind
diff --git a/lib/js/asyncjs.nim b/lib/js/asyncjs.nim
index ac61c1a34c1..b66708cc3e3 100644
--- a/lib/js/asyncjs.nim
+++ b/lib/js/asyncjs.nim
@@ -141,12 +141,13 @@ proc generateJsasync(arg: NimNode): NimNode =
   if len(code) > 0:
     # turn |NimSkull| outgoing exceptions into JavaScript errors
     let body = result.body
+    let reraise = bindSym("reraise")
     result.body = quote:
       try:
         `body`
       except CatchableError as e:
         # use .noreturn call to make sure `body` being an expression works
-        reraise(e)
+        `reraise`(e)
 
   let asyncPragma = quote:
     {.codegenDecl: "async function $2($3)".}
diff --git a/lib/js/jsffi.nim b/lib/js/jsffi.nim
index bd70c0277e9..d5360e6bff1 100644
--- a/lib/js/jsffi.nim
+++ b/lib/js/jsffi.nim
@@ -225,38 +225,36 @@ macro `.`*(obj: JsObject, field: untyped): JsObject =
     let obj = newJsObject()
     obj.a = 20
     assert obj.a.to(int) == 20
+  let helper = genSym(nskProc, "helper")
   if validJsName($field):
     let importString = "#." & $field
     result = quote do:
-      proc helper(o: JsObject): JsObject
-        {.importjs: `importString`, gensym.}
-      helper(`obj`)
+      proc `helper`(o: JsObject): JsObject {.importjs: `importString`.}
+      `helper`(`obj`)
   else:
     if not mangledNames.hasKey($field):
       mangledNames[$field] = $mangleJsName($field)
     let importString = "#." & mangledNames[$field]
     result = quote do:
-      proc helper(o: JsObject): JsObject
-        {.importjs: `importString`, gensym.}
-      helper(`obj`)
+      proc `helper`(o: JsObject): JsObject {.importjs: `importString`.}
+      `helper`(`obj`)
 
 macro `.=`*(obj: JsObject, field, value: untyped): untyped =
   ## Experimental dot accessor (set) for type JsObject.
   ## Sets the value of a property of name `field` in a JsObject `x` to `value`.
+  let helper = genSym(nskProc, "helper")
   if validJsName($field):
     let importString = "#." & $field & " = #"
     result = quote do:
-      proc helper(o: JsObject, v: auto)
-        {.importjs: `importString`, gensym.}
-      helper(`obj`, `value`)
+      proc `helper`(o: JsObject, v: auto) {.importjs: `importString`.}
+      `helper`(`obj`, `value`)
   else:
     if not mangledNames.hasKey($field):
       mangledNames[$field] = $mangleJsName($field)
     let importString = "#." & mangledNames[$field] & " = #"
     result = quote do:
-      proc helper(o: JsObject, v: auto)
-        {.importjs: `importString`, gensym.}
-      helper(`obj`, `value`)
+      proc `helper`(o: JsObject, v: auto) {.importjs: `importString`.}
+      `helper`(`obj`, `value`)
 
 macro `.()`*(obj: JsObject,
              field: untyped,
@@ -284,10 +282,12 @@ macro `.()`*(obj: JsObject,
     if not mangledNames.hasKey($field):
       mangledNames[$field] = $mangleJsName($field)
     importString = "#." & mangledNames[$field] & "(@)"
+
+  let helper = genSym(nskProc, "helper")
   result = quote:
-    proc helper(o: JsObject): JsObject
-      {.importjs: `importString`, gensym, discardable.}
-    helper(`obj`)
+    proc `helper`(o: JsObject): JsObject
+      {.importjs: `importString`, discardable.}
+    `helper`(`obj`)
   for idx in 0 ..< args.len:
     let paramName = newIdentNode("param" & $idx)
     result[0][3].add newIdentDefs(paramName, newIdentNode("JsObject"))
@@ -304,10 +304,11 @@ macro `.`*[K: cstring, V](obj: JsAssoc[K, V],
     if not mangledNames.hasKey($field):
       mangledNames[$field] = $mangleJsName($field)
     importString = "#." & mangledNames[$field]
+
+  let helper = genSym(nskProc, "helper")
   result = quote do:
-    proc helper(o: type(`obj`)): `obj`.V
-      {.importjs: `importString`, gensym.}
-    helper(`obj`)
+    proc `helper`(o: type(`obj`)): `obj`.V {.importjs: `importString`.}
+    `helper`(`obj`)
 
 macro `.=`*[K: cstring, V](obj: JsAssoc[K, V],
                                     field: untyped,
@@ -321,10 +322,11 @@ macro `.=`*[K: cstring, V](obj: JsAssoc[K, V],
     if not mangledNames.hasKey($field):
       mangledNames[$field] = $mangleJsName($field)
     importString = "#." & mangledNames[$field] & " = #"
+
+  let helper = genSym(nskProc, "helper")
   result = quote do:
-    proc helper(o: type(`obj`), v: `obj`.V)
-      {.importjs: `importString`, gensym.}
-    helper(`obj`, `value`)
+    proc `helper`(o: type(`obj`), v: `obj`.V) {.importjs: `importString`.}
+    `helper`(`obj`, `value`)
 
 macro `.()`*[K: cstring, V: proc](obj: JsAssoc[K, V],
                                            field: untyped,
@@ -447,10 +449,11 @@ macro `{}`*(typ: typedesc, xs: varargs[untyped]): auto =
   body.add quote do:
     return `a`
 
+  let inner = genSym(nskProc, "inner")
   result = quote do:
-    proc inner(): `typ` {.gensym.} =
+    proc `inner`(): `typ` =
       `body`
-    inner()
+    `inner`()
 
 # Macro to build a lambda using JavaScript's `this`
 # from a proc, `this` being the first argument.
diff --git a/lib/std/jsonutils.nim b/lib/std/jsonutils.nim
index 9fea21cc5c7..2aac6df8120 100644
--- a/lib/std/jsonutils.nim
+++ b/lib/std/jsonutils.nim
@@ -186,11 +186,11 @@ proc discKeyMatch[T](obj: T, json: JsonNode, key: static string): bool =
 macro discKeysMatchBodyGen(obj: typed, json: JsonNode,
                            keys: static seq[string]): untyped =
   result = newStmtList()
-  let r = ident("result")
+  let match = bindSym("discKeyMatch")
   for key in keys:
     let keyLit = newLit key
     result.add quote do:
-      `r` = `r` and discKeyMatch(`obj`, `json`, `keyLit`)
+      result = result and `match`(`obj`, `json`, `keyLit`)
 
 proc discKeysMatch[T](obj: T, json: JsonNode, keys: static seq[string]): bool =
   result = true
diff --git a/lib/std/tasks.nim b/lib/std/tasks.nim
index ac18862228e..615a2cadcb3 100644
--- a/lib/std/tasks.nim
+++ b/lib/std/tasks.nim
@@ -183,8 +183,9 @@ macro toTask*(e: typed{nkCall | nkInfix | nkPrefix | nkPostfix | nkCommand | nkC
                     )
 
 
+    let cAlloc = bindSym("c_calloc")
     let scratchObjPtrType = quote do:
-      cast[ptr `scratchObjType`](c_calloc(csize_t 1, csize_t sizeof(`scratchObjType`)))
+      cast[ptr `scratchObjType`](`cAlloc`(csize_t 1, csize_t sizeof(`scratchObjType`)))
 
     let scratchLetSection = newLetStmt(
       scratchIdent,
diff --git a/lib/std/wrapnils.nim b/lib/std/wrapnils.nim
index 763af52fc0b..e7a1593d282 100644
--- a/lib/std/wrapnils.nim
+++ b/lib/std/wrapnils.nim
@@ -145,12 +145,14 @@ macro `??.`*(a: typed): Option =
   let lhs = genSym(nskVar, "lhs")
   let lhs2 = genSym(nskVar, "lhs")
   let body = process(a, lhs2, 0)
+  let optionSym = bindSym("Option")
+  let optionOpSym = bindSym("option")
   result = quote do:
-    var `lhs`: Option[type(`a`)]
+    var `lhs`: `optionSym`[type(`a`)]
     block:
       var `lhs2`: type(`a`)
       `body`
-      `lhs` = option(`lhs2`)
+      `lhs` = `optionOpSym`(`lhs2`)
     `lhs`
 
 template fakeDot*(a: Option, b): untyped =
diff --git a/tests/lang_callable/macros/t7875.nim b/tests/lang_callable/macros/t7875.nim
index 7b6e47b8657..648b8fe6d35 100644
--- a/tests/lang_callable/macros/t7875.nim
+++ b/tests/lang_callable/macros/t7875.nim
@@ -1,5 +1,5 @@
 discard """
-  nimout: "var mysym`gensym0: MyType[float32]"
+  nimout: "var mysym: MyType[float32]"
   joinable: false
 """
 
@@ -8,9 +8,6 @@ import macros
 type
   MyType[T] = object
 
-# this is totally fine
-var mysym: MyType[float32]
-
 macro foobar(): untyped =
   let floatSym = bindSym"float32"
 
diff --git a/tests/lang_callable/macros/tmacro6.nim b/tests/lang_callable/macros/tmacro6.nim
index c65d34b6d7b..d9c7f9b4e81 100644
--- a/tests/lang_callable/macros/tmacro6.nim
+++ b/tests/lang_callable/macros/tmacro6.nim
@@ -1,6 +1,6 @@
 discard """
 errormsg: "expression '123' is of type 'int literal(123)' and has to be used (or discarded)"
-line: 71
+line: 73
 """
 
 import macros
diff --git a/tests/lang_stmts/defer/tdefer_malformed_many_children.nim b/tests/lang_stmts/defer/tdefer_malformed_many_children.nim
index 324ba6b56d1..8d01ce15249 100644
--- a/tests/lang_stmts/defer/tdefer_malformed_many_children.nim
+++ b/tests/lang_stmts/defer/tdefer_malformed_many_children.nim
@@ -2,7 +2,7 @@ discard """
   description: "`defer` must have exactly one child node (macro input)."
   errormsg: "illformed AST"
   file: "macros.nim"
-  line: 622
+  line: 647
 """
 
 import std/macros
diff --git a/tests/misc/tsizeof.nim b/tests/misc/tsizeof.nim
index 909c35c17db..a71c42da491 100644
--- a/tests/misc/tsizeof.nim
+++ b/tests/misc/tsizeof.nim
@@ -29,10 +29,13 @@ doAssert mysize3 == 32
 
 import macros, typetraits
 
+proc wrapBlock(n: NimNode): NimNode =
+  result = newTree(nnkBlockStmt, newEmptyNode(), n)
+
 macro testSizeAlignOf(args: varargs[untyped]): untyped =
   result = newStmtList()
   for arg in args:
-    result.add quote do:
+    result.add wrapBlock(quote do:
       let
         c_size = c_sizeof(`arg`)
         nim_size = sizeof(`arg`)
@@ -47,18 +50,20 @@ macro testSizeAlignOf(args: varargs[untyped]): untyped =
           msg.add  " align(get, expected): " & $nim_align & " != " & $c_align
         echo msg
         failed = true
+    )
 
 
 macro testOffsetOf(a, b: untyped): untyped =
   let typeName = newLit(a.repr)
   let member   = newLit(b.repr)
-  result = quote do:
+  result = wrapBlock(quote do:
     let
       c_offset   = c_offsetof(`a`,`b`)
       nim_offset = offsetof(`a`,`b`)
     if c_offset != nim_offset:
       echo `typeName`, ".", `member`, " offsetError, C: ", c_offset, " nim: ", nim_offset
       failed = true
+  )
 
 proc strAlign(arg: string): string =
   const minLen = 22
@@ -74,10 +79,11 @@ macro c_offsetof(fieldAccess: typed): int32 =
           else: fieldAccess
   let a = s[0].getTypeInst
   let b = s[1]
-  result = quote do:
+  result = wrapBlock(quote do:
     var res: int32
     {.emit: [res, " = offsetof(", `a`, ", ", `b`, ");"] .}
     res
+  )
 
 template c_offsetof(t: typedesc, a: untyped): int32 =
   var x: ptr t
@@ -87,10 +93,11 @@ macro c_sizeof(a: typed): int32 =
   ## Bullet proof implementation that works using the sizeof operator
   ## in the c backend. Assuming of course this implementation is
   ## correct.
-  result = quote do:
+  result = wrapBlock(quote do:
     var res: int32
     {.emit: [res, " = sizeof(", `a`, ");"] .}
     res
+  )
 
 macro c_alignof(arg: untyped): untyped =
   ## Bullet proof implementation that works on actual alignment
@@ -105,21 +112,23 @@ macro c_alignof(arg: untyped): untyped =
 
 macro testAlign(arg:untyped):untyped =
   let prefix = newLit(arg.lineinfo & "  alignof " & arg.repr & " ")
-  result = quote do:
+  result = wrapBlock(quote do:
     let cAlign = c_alignof(`arg`)
     let nimAlign = alignof(`arg`)
     if cAlign != nimAlign:
       echo `prefix`, cAlign, " != ", nimAlign
       failed = true
+  )
 
 macro testSize(arg:untyped):untyped =
   let prefix = newLit(arg.lineinfo & "  sizeof " & arg.repr & " ")
-  result = quote do:
+  result = wrapBlock(quote do:
     let cSize = c_sizeof(`arg`)
     let nimSize = sizeof(`arg`)
     if cSize != nimSize:
       echo `prefix`, cSize, " != ", nimSize
       failed = true
+  )
 
 type
   MyEnum {.pure.} = enum

From ec713a1d39dcc6bf6df6a18214777be0d2888c7a Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Sun, 4 Aug 2024 03:31:18 +0200
Subject: [PATCH 161/169] fix a compiler crash with `.varargs` proc types
 (#1396)

## Summary

Fix the compiler crashing when a non-closure `proc` type with C-style
varargs is used somewhere. Only the C backend was affected.

Fixes https://github.com/nim-works/nimskull/issues/1394.

## Details

* `mirtypes.callConv` didn't consider the `x` field storing a boolean
  value in the most-significant bit, resulting in a range defect
* the integer value is now properly masked before converting it to a
  `TCallingConvention` enum value
---
 compiler/mir/mirtypes.nim            |  7 +++++--
 tests/ccgbugs/tvarargs_proc_type.nim | 10 ++++++++++
 2 files changed, 15 insertions(+), 2 deletions(-)
 create mode 100644 tests/ccgbugs/tvarargs_proc_type.nim

diff --git a/compiler/mir/mirtypes.nim b/compiler/mir/mirtypes.nim
index bccc5ce4547..f8791ffd585 100644
--- a/compiler/mir/mirtypes.nim
+++ b/compiler/mir/mirtypes.nim
@@ -183,6 +183,8 @@ const
   MangleFlag = 0x4000'u16
   NoAliasFlag = 0x8000'u16
 
+  VarargsFlag = 0x8000_0000'u32
+
 func `==`*(a, b: FieldId): bool {.borrow, inline.}
 func `==`(a, b: IntVal): bool {.borrow, inline.}
 
@@ -359,10 +361,11 @@ func numParams*(desc: TypeHeader): int =
   int(desc.b - desc.a) - 1
 
 func callConv*(desc: TypeHeader, env: TypeEnv): TCallingConvention =
-  TCallingConvention env.params[desc.a].x
+  # mask away the varargs flag
+  TCallingConvention(env.params[desc.a].x and not(VarargsFlag))
 
 func hasVarargs*(desc: TypeHeader, env: TypeEnv): bool =
-  (env.params[desc.a].x and 0x8000_0000'u32) != 0
+  (env.params[desc.a].x and VarargsFlag) != 0
 
 func retType*(desc: TypeHeader, env: TypeEnv): TypeId =
   assert desc.kind in {tkProc, tkClosure}
diff --git a/tests/ccgbugs/tvarargs_proc_type.nim b/tests/ccgbugs/tvarargs_proc_type.nim
new file mode 100644
index 00000000000..7fc815cfa51
--- /dev/null
+++ b/tests/ccgbugs/tvarargs_proc_type.nim
@@ -0,0 +1,10 @@
+discard """
+  description: '''
+    Regression test for a bug with querying the calling convention of a MIR
+    type. Derived from https://github.com/nim-works/nimskull/issues/1394.
+  '''
+"""
+
+# calling convention doesn't matter, as long as the proc type is not a closure
+# type
+var p: proc(x: int) {.nimcall, varargs.}

From f5d8ce96c76a9b375c031aed510db0bd8c3b3a23 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Mon, 5 Aug 2024 00:09:04 +0200
Subject: [PATCH 162/169] fix C compilation errors with closures and nested
 types (#1397)

## Summary

Fix a bug with hook synthesis that led to C compiler errors when using
some closure procedures or `ref`s of non-top-level `object` type.

## Details

* `sighashes` now uses the symbol ID as the object representation for
  anonymous object/enum types and object/enum types not defined at the
  top-level
* this means that `hashType(x) != hashType(y)` when
  `sameType(x, y) == false`, for object and enum types
* as a consequence, unique hook procedures are used for `ref T` types
  that use the aforementioned types for `T`
* RTTI, which is assigned to types based on type hashes, also uses
  unique instances per object type now

Multiple same-shaped anonymous/non-top-level object types are *not*
merged into a single one by the C code generator. Since all of them
previously shared the same set of hook procedures, this resulted in C
compiler errors caused by implicit conversions between incompatible
pointer types.

---------

Co-authored-by: Saem Ghani <saemghani+github@gmail.com>
---
 compiler/sem/sighashes.nim                    | 34 +++++++------------
 .../destructor/tseparate_hooks1.nim           | 21 ++++++++++++
 .../destructor/tseparate_hooks2.nim           | 31 +++++++++++++++++
 3 files changed, 64 insertions(+), 22 deletions(-)
 create mode 100644 tests/lang_objects/destructor/tseparate_hooks1.nim
 create mode 100644 tests/lang_objects/destructor/tseparate_hooks2.nim

diff --git a/compiler/sem/sighashes.nim b/compiler/sem/sighashes.nim
index 1e417616928..e56fc615aed 100644
--- a/compiler/sem/sighashes.nim
+++ b/compiler/sem/sighashes.nim
@@ -164,28 +164,18 @@ proc hashType(c: var MD5Context, t: PType; flags: set[ConsiderFlag]) =
       else:
         c.hashSym(t.sym)
 
-      var symWithFlags: PSym
-      template hasFlag(sym): bool =
-        let ret = {sfAnon, sfGenSym} * sym.flags != {}
-        if ret: symWithFlags = sym
-        ret
-      if hasFlag(t.sym) or (t.kind == tyObject and t.owner.kind == skType and t.owner.typ.kind == tyRef and hasFlag(t.owner)):
-        # for `PFoo:ObjectType`, arising from `type PFoo = ref object`
-        # Generated object names can be identical, so we need to
-        # disambiguate furthermore by hashing the field types and names.
-        if t.n.len > 0:
-          let oldFlags = symWithFlags.flags
-          # Hack to prevent endless recursion
-          # xxx instead, use a hash table to indicate we've already visited a type, which
-          # would also be more efficient.
-          symWithFlags.flags.excl {sfAnon, sfGenSym}
-          hashTree(c, t.n, flags + {CoHashTypeInsideNode})
-          symWithFlags.flags = oldFlags
-        else:
-          # The object has no fields: we _must_ add something here in order to
-          # make the hash different from the one we produce by hashing only the
-          # type name.
-          c &= ".empty"
+      if t.sym.flags * {sfAnon, sfGenSym} != {} or
+         (t.kind == tyObject and t.owner.kind == skType and
+          tfRefsAnonObj in t.owner.typ.flags):
+        # one or more of the following are true for the type:
+        # * it's anonymous
+        # * it's defined not in the top-level scope
+        # * it's the object type from a ``ref object`` type construction
+        # The only property that uniquely identifies the type in this case is
+        # the symbol ID, so we use that. **This means that the hash produced
+        # for such types is dependent on the type's surroundings**
+        c &= "."
+        c &= $t.sym.id
     else:
       c &= t.id
     if t.len > 0 and t[0] != nil:
diff --git a/tests/lang_objects/destructor/tseparate_hooks1.nim b/tests/lang_objects/destructor/tseparate_hooks1.nim
new file mode 100644
index 00000000000..d6ac8290f86
--- /dev/null
+++ b/tests/lang_objects/destructor/tseparate_hooks1.nim
@@ -0,0 +1,21 @@
+discard """
+  description: '''
+    Ensure that separate hooks are created for ``ref T`` types where T are non-
+    top-level object types sharing the exact same name and shape
+  '''
+  targets: "c js vm"
+"""
+
+# XXX: this currently relies on the backend C compiler complaining. Eventually,
+#      the test should inspect the MIR output and make sure two different
+#      destroy hooks are used
+
+block:
+  type Nested = object
+
+  var a = (ref Nested)()
+
+block:
+  type Nested = object
+
+  var b = (ref Nested)()
diff --git a/tests/lang_objects/destructor/tseparate_hooks2.nim b/tests/lang_objects/destructor/tseparate_hooks2.nim
new file mode 100644
index 00000000000..ab052a5806a
--- /dev/null
+++ b/tests/lang_objects/destructor/tseparate_hooks2.nim
@@ -0,0 +1,31 @@
+discard """
+  description: '''
+    Ensure that separate hooks are created for ``ref T`` types where T are non-
+    top-level object types sharing the exact same name and shape
+  '''
+  targets: "c js vm"
+"""
+
+# XXX: this currently relies on the backend C compiler complaining. Eventually,
+#      the test should inspect the MIR output and make sure two different
+#      destroy hooks are used
+
+# for this test, both procedures must:
+# * share the same user-provided name
+# * create an anonymous environment object with the exact same shape and field
+#   names
+
+proc outer(x: int) =
+  var x = 1
+  proc inner() =
+    x = 2
+  inner()
+
+proc outer(x: float) =
+  var x = 1
+  proc inner() =
+    x = 2
+  inner()
+
+outer(1)
+outer(1.0)

From f11082404c5aa0a717f9f4da085556484d5c8f4d Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Mon, 5 Aug 2024 23:54:26 +0200
Subject: [PATCH 163/169] mirtypes: fix regression with cyclic generic object
 types (#1398)

## Summary

Fix cyclic generic object types instantiated with tuple types as one
of the arguments causing C compiler errors under some circumstances.

## Details

* the type merging logic in `mirtypes` now uses `sighashes`, which is
  able to handle cyclic types
* previously, `Obj[(int,)]` and `Obj[tuple[x: int]]` were not being
  merged into one when `Obj` is cyclic
* this led to C compiler errors when assigning between such types, or
  when the type has hooks (explicit or synthesized) that are called
---
 compiler/mir/mirtypes.nim                     | 16 +++++++++++-----
 .../tequal_instantiation_with_tuple.nim       | 19 +++++++++++++++++++
 2 files changed, 30 insertions(+), 5 deletions(-)
 create mode 100644 tests/lang_callable/generics/tequal_instantiation_with_tuple.nim

diff --git a/compiler/mir/mirtypes.nim b/compiler/mir/mirtypes.nim
index f8791ffd585..6b5055850c4 100644
--- a/compiler/mir/mirtypes.nim
+++ b/compiler/mir/mirtypes.nim
@@ -44,6 +44,10 @@ import
     idioms
   ]
 
+# XXX: sighashes are currently needed for merging generic instantiations, but
+#      this should ultimately happen earlier - in sem - already
+from compiler/sem/sighashes import hashType, ConsiderFlag
+
 type
   TypeKind* = enum
     tkVoid
@@ -133,9 +137,9 @@ type
     canon: Table[HeaderId, TypeId]
       ## maps headers of canonical type descriptions to their type symbol
 
-    instances: Table[(int, HeaderId), TypeId]
-      ## associates a generic type ID + instance body with a type symbol. This
-      ## is used for eliminating same-shaped instantiations of a generic
+    instances: Table[SigHash, TypeId]
+      ## associates the sighash of a generic type instance with a type symbol.
+      ## This is used for eliminating same-shaped instantiations of a generic
       ## object type
 
     idents: BiTable[string]
@@ -1045,9 +1049,11 @@ proc typeSymToMir(env: var TypeEnv, t: PType): TypeId =
 
     # generic types support covariance for tuples. Pick an instance as the
     # "canonical" one, so that - for example - ``Generic[(int,)]`` and
-    # ``Generic[tuple[x: int]]`` map to the same MIR type in the end
+    # ``Generic[tuple[x: int]]`` map to the same MIR type in the end. In order
+    # to support cyclic types, ``sighashes`` has to be used
     if tfFromGeneric in t.flags and
-       (let c = env.instances.mgetOrPut((t.sym.owner.typ.id, canon), result);
+       (let c = env.instances.mgetOrPut(hashType(t, {CoType, CoDistinct}),
+                                        result);
         c != result):
       env.symbols[result].canon = c
   else:
diff --git a/tests/lang_callable/generics/tequal_instantiation_with_tuple.nim b/tests/lang_callable/generics/tequal_instantiation_with_tuple.nim
new file mode 100644
index 00000000000..1e5b60df212
--- /dev/null
+++ b/tests/lang_callable/generics/tequal_instantiation_with_tuple.nim
@@ -0,0 +1,19 @@
+discard """
+  description: '''
+    Ensure that two instantiations of a cyclic generic object type are
+    considered equal at every level (type system, backend, run-time) when
+    one of them is instantiated with a named tuple and the other with an
+    unnamed one
+  '''
+  knownIssue.vm: "``vmtypegen`` considers the two types distinct"
+"""
+
+type Recursive[T] = object
+  # the same problem occurred when a ``ref`` type is used
+  self: ptr Recursive[T]
+  val: T
+
+# it's important that both tuples are comprised of the exact same types
+var x: Recursive[(int, int)]
+var y: Recursive[tuple[a, b: int]]
+x = y

From 39660ca771860ed4cc1ea4b2aa54d881576fa957 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Tue, 6 Aug 2024 22:52:15 +0200
Subject: [PATCH 164/169] cgirgen: instrument with `frameMsg` (#1399)

## Summary

Instrument `cgirgen` with stack-frame annotations in order to aid
debugging with `nim_dbg`.

## Details

* to keep overhead reasonably low, only the `exprToIr` and `stmtToIr`
  procedures are instrumented
* `debugutils.frameMsg` is generalized to accept a `TLineInfo`; the
  callsites are adjusted accordingly
---
 compiler/backend/ccgexprs.nim | 2 +-
 compiler/backend/cgirgen.nim  | 9 +++++++++
 compiler/utils/debugutils.nim | 8 ++++----
 compiler/vm/vmgen.nim         | 2 +-
 4 files changed, 15 insertions(+), 6 deletions(-)

diff --git a/compiler/backend/ccgexprs.nim b/compiler/backend/ccgexprs.nim
index 34717bd7b71..0410ff813bb 100644
--- a/compiler/backend/ccgexprs.nim
+++ b/compiler/backend/ccgexprs.nim
@@ -1638,7 +1638,7 @@ proc useData(p: BProc, x: ConstId, typ: PType): string =
 
 proc expr(p: BProc, n: CgNode, d: var TLoc) =
   when defined(nimCompilerStacktraceHints):
-    frameMsg(p.config, n)
+    frameMsg(p.config, n.info)
   p.currLineInfo = n.info
 
   case n.kind
diff --git a/compiler/backend/cgirgen.nim b/compiler/backend/cgirgen.nim
index 5d36237e7a6..1230c8b382a 100644
--- a/compiler/backend/cgirgen.nim
+++ b/compiler/backend/cgirgen.nim
@@ -47,6 +47,9 @@ import std/options as std_options
 from compiler/ast/ast import newSym, newType, rawAddSon
 from compiler/sem/semdata import makeVarType
 
+when defined(nimCompilerStacktraceHints):
+  import compiler/utils/debugutils
+
 type
   TranslateCl = object
     graph: ModuleGraph
@@ -557,6 +560,9 @@ proc stmtToIr(tree: MirBody, env: MirEnv, cl: var TranslateCl,
   let n {.cursor.} = tree.get(cr)
   let info = cr.info ## the source information of `n`
 
+  when defined(nimCompilerStacktraceHints):
+    frameMsg(cl.graph.config, info)
+
   template to(kind: CgNodeKind, args: varargs[untyped]) =
     stmts.add newStmt(kind, info, args)
 
@@ -683,6 +689,9 @@ proc exprToIr(tree: MirBody, cl: var TranslateCl,
   let n {.cursor.} = get(tree, cr)
   let info = cr.info
 
+  when defined(nimCompilerStacktraceHints):
+    frameMsg(cl.graph.config, info)
+
   template op(kind: CgNodeKind, e: CgNode): CgNode =
     newOp(kind, info, cl.map(n.typ), e)
 
diff --git a/compiler/utils/debugutils.nim b/compiler/utils/debugutils.nim
index be37d126fa4..64624b15c50 100644
--- a/compiler/utils/debugutils.nim
+++ b/compiler/utils/debugutils.nim
@@ -636,13 +636,13 @@ template frameMsg*(c: ConfigRef, n: PNode) =
       $n.info.line,
       $n.info.col]
 
-template frameMsg*(c: ConfigRef, n: CgNode) =
+template frameMsg*(c: ConfigRef, info: TLineInfo) =
   {.line.}:
     setFrameMsg "$1 $2($3, $4)" % [
       $n.kind,
-      c.toFullPath(n.info.fileIndex),
-      $n.info.line,
-      $n.info.col]
+      c.toFullPath(info.fileIndex),
+      $info.line,
+      $info.col]
 
 const locOffset = -2
 
diff --git a/compiler/vm/vmgen.nim b/compiler/vm/vmgen.nim
index 805e3e9e524..01fbe39faef 100644
--- a/compiler/vm/vmgen.nim
+++ b/compiler/vm/vmgen.nim
@@ -2998,7 +2998,7 @@ proc binaryArith(c: var TCtx, e, x, y: CgNode, dest: var TDest,
 
 proc gen(c: var TCtx; n: CgNode; dest: var TDest) =
   when defined(nimCompilerStacktraceHints):
-    frameMsg c.config, n
+    frameMsg c.config, n.info
 
   case n.kind
   of cnkProc:

From 7309115d7729c62cc44db12c7c1a400cd7d4ac35 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Wed, 7 Aug 2024 23:06:00 +0200
Subject: [PATCH 165/169] fix wrong hooks being picked for tuple types (#1402)

## Summary

* fix tuples such as `((A, B),)` and `((A,), B)` being assigned the
  same set of hooks
* fix the aforementioned tuples sharing the same RTTI object

## Details

* add the tuple length to the type representation during type hashing
  (`sighash`), so that `((A,), B)` and `((A, B),)` result in two
  different `SigHash`es
* `liftdestructors` uses `sighashes` for canonicalizing structural
  types, thus previously treating said tuples as the same type
* RTTI creation, which also uses `SigHash`, was affected in the same
  way
---
 compiler/sem/sighashes.nim                    |  3 ++
 .../ttuple_hook_synthesis_issue.nim           | 30 +++++++++++++++++++
 2 files changed, 33 insertions(+)
 create mode 100644 tests/lang_objects/destructor/ttuple_hook_synthesis_issue.nim

diff --git a/compiler/sem/sighashes.nim b/compiler/sem/sighashes.nim
index e56fc615aed..152deff135f 100644
--- a/compiler/sem/sighashes.nim
+++ b/compiler/sem/sighashes.nim
@@ -188,6 +188,9 @@ proc hashType(c: var MD5Context, t: PType; flags: set[ConsiderFlag]) =
     c.hashTree(t.n, {})
   of tyTuple:
     c &= char(t.kind)
+    # add the length so that (int, int) and ((int,), int) have different
+    # representations
+    c &= t.len
     if t.n != nil and CoType notin flags:
       assert(t.n.len == t.len)
       for i in 0..<t.n.len:
diff --git a/tests/lang_objects/destructor/ttuple_hook_synthesis_issue.nim b/tests/lang_objects/destructor/ttuple_hook_synthesis_issue.nim
new file mode 100644
index 00000000000..1ccfb0d09c6
--- /dev/null
+++ b/tests/lang_objects/destructor/ttuple_hook_synthesis_issue.nim
@@ -0,0 +1,30 @@
+discard """
+  description: '''
+    Ensure that hook synthesis considers ``(A, (B, C))`` different from
+    ``(A, (B,), C)``.
+  '''
+  output: "3\n4\n1\n2\n"
+  knownIssue.js vm: "seq destructors don't work yet"
+"""
+
+type Object = object
+  val: int
+
+proc `=destroy`(x: var Object) =
+  echo x.val
+
+# a seq is only used for testing purposes, since it caused misbehaviour at
+# run-time. Using ``(Object, (Object,), Object)`` and
+# ``(Object, (Object, Object))`` also led to the same issue, but ran
+# "correctly" due to both types having the same in-memory layout
+type
+  Tup1 = (seq[(Object,)], Object)
+  Tup2 = (seq[(Object, Object)],)
+
+proc test() =
+  var x: Tup1 = (@[(Object(val: 1),)], Object(val: 2))
+  var y: Tup2 = (@[(Object(val: 3), Object(val: 4))],)
+  # both locations were treated as having type `Tup1` by the called
+  # destructor, resulting in either crashes or the wrong output being produced
+
+test()

From 22d24d75c3464478d5ed4cc125c21cb7aeca4405 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Thu, 8 Aug 2024 01:50:31 +0200
Subject: [PATCH 166/169] sem: fix error propagation for tuple construction
 (#1403)

## Summary

* fix errors in anonymous tuple constructions not being propagated
* fix the error for colon expressions in anonymous tuple constructions
  being "invalid expression" instead of "named expression not allowed
  here"

## Details

* properly propagate errors from element expressions
* don't analyze `nkExprColonExpr` as a normal expression
* don't modify input AST
* skip tuple type constructor analysis if any of the element
  expressions is erroneous
---
 compiler/sem/semexprs.nim      | 54 ++++++++++++++++++++--------------
 tests/errmsgs/tmixed_tuple.nim |  7 +++++
 2 files changed, 39 insertions(+), 22 deletions(-)
 create mode 100644 tests/errmsgs/tmixed_tuple.nim

diff --git a/compiler/sem/semexprs.nim b/compiler/sem/semexprs.nim
index e98531714e9..66dbc8bac7e 100644
--- a/compiler/sem/semexprs.nim
+++ b/compiler/sem/semexprs.nim
@@ -3148,39 +3148,49 @@ proc semTuplePositionsConstr(c: PContext, n: PNode, flags: TExprFlags): PNode =
                           "expected nkTupleConstr, got: " & $n.kind)
   
   let
-    tupExp = n                  # we don't modify n, but compute the type:
+    tupExp = shallowCopy(n)
     typ = newTypeS(tyTuple, c)  # leave typ.n nil!
-  for i in 0..<tupExp.len:
-    tupExp[i] = semExprWithType(c, tupExp[i], {}) # xxx: claim of not modifying
-                                                  #      n is dubious
-    addSonSkipIntLit(typ, tupExp[i].typ, c.idgen)
+
+  var hasError = false
+
+  for i, it in n.pairs:
+    var etyp: PType
+    if it.kind == nkExprColonExpr:
+      # can happen for ``(a, b: c)``. Analyze the expression for the sake of
+      # error correction (check/nimsuggest)
+      let elem = copyNodeWithKids(it)
+      elem[1] = semExprWithType(c, it[1], {})
+      etyp = elem[1].typ
+
+      tupExp[i] = c.config.newError(elem):
+        PAstDiag(kind: adSemNamedExprNotAllowed)
+    else:
+      tupExp[i] = semExprWithType(c, it, {})
+      etyp = tupExp[i].typ
+
+    hasError = hasError or tupExp[i].isError
+    addSonSkipIntLit(typ, etyp, c.idgen)
+
   tupExp.typ = typ
 
-  var
-    isTupleType: bool
-    hasError = false
+  if hasError:
+    # don't analyze any further
+    return c.config.wrapError(tupExp)
+
   if tupExp.len > 0: # don't interpret () as type
-    isTupleType = tupExp[0].typ.kind == tyTypeDesc
+    let isTupleType = tupExp[0].typ.kind == tyTypeDesc
     # check if either everything or nothing is tyTypeDesc
     for i in 1..<tupExp.len:
-      if tupExp[i].kind == nkExprColonExpr:
-        hasError = true
-        # xxx: not sure if this modification is safe
-        tupExp[i] = c.config.newError(tupExp[i],
-                                      PAstDiag(kind: adSemNamedExprNotAllowed))
-      elif isTupleType != (tupExp[i].typ.kind == tyTypeDesc):
+      if isTupleType != (tupExp[i].typ.kind == tyTypeDesc):
         # xxx: maybe capture the field instead of the info?
         return c.config.newError(n,
                           PAstDiag(kind: adSemCannotMixTypesAndValuesInTuple,
                                    wrongFldInfo: tupExp[i].info))
 
-  if hasError:
-    result = c.config.wrapError(tupExp)
-  elif isTupleType: # reinterpret `(int, string)` as type expressions
-    result = n
-    result.typ = makeTypeDesc(c, semTypeNode(c, n, nil).skipTypes({tyTypeDesc}))
-  else:
-    result = tupExp
+    if isTupleType: # reinterpret `(int, string)` as a type expression
+      tupExp.typ = makeTypeDesc(c, semTypeNode(c, tupExp, nil))
+
+  result = tupExp
 
 proc semTupleConstr(c: PContext, n: PNode, flags: TExprFlags): PNode =
   ## analyse tuple construction based on position of fields or return errors
diff --git a/tests/errmsgs/tmixed_tuple.nim b/tests/errmsgs/tmixed_tuple.nim
new file mode 100644
index 00000000000..8e75c03142b
--- /dev/null
+++ b/tests/errmsgs/tmixed_tuple.nim
@@ -0,0 +1,7 @@
+discard """
+  errormsg: "named expression not allowed here"
+  line: 7
+"""
+
+var x = 0
+discard (x, a: x)

From c46ddf248a8306ebdb05a19ae8d8faf876061606 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Thu, 8 Aug 2024 02:19:10 +0200
Subject: [PATCH 167/169] fix compiler crash when converting `nil` to `distinct
 pointer`  (#1404)

## Summary

Expressions such as `A(pointer(nil))` crashed the compiler when `A` is
a `distinct pointer` type. This is now fixed.

## Details

Said expression reached cgirgen as `(LvalueConv (Type "A") (NilLit))`,
and since `NilLit` is not expected as the operand of an lvalue
conversion, the compiler crashed. `distinct ptr` types weren't
affected, due to `semfold` unconditionally folding `ptr` conversions
away. `A(nil)` was not affected due to `transf` folding the expression
into just a `nil` literal as part of its `tyNil` fixup.

In order to make pointer conversion behaviour consistent, `semfold` now
folds all nil-to-pointer-like conversions into a properly typed `nil`
literal. The `tyNil` fixup logic in `transf` thus becomes obsolete, and
is removed.

Beyond fixing the crash, this also means that `pointer(nil)` is now
detected as a constant expression without having to evaluate it with
the VM.
---
 compiler/sem/semfold.nim                      | 11 +++++++--
 compiler/sem/transf.nim                       | 13 -----------
 .../tnil_to_distinct_conversion.nim           | 23 +++++++++++++++++++
 3 files changed, 32 insertions(+), 15 deletions(-)
 create mode 100644 tests/lang_exprs/tnil_to_distinct_conversion.nim

diff --git a/compiler/sem/semfold.nim b/compiler/sem/semfold.nim
index e211a3a4db4..c235366cc08 100644
--- a/compiler/sem/semfold.nim
+++ b/compiler/sem/semfold.nim
@@ -518,8 +518,15 @@ proc foldConv(n, a: PNode; idgen: IdGenerator; g: ModuleGraph): PNode =
       result = newFloatNodeT(val, n, g)
     else:
       result = rangeError(n, a, g)
-  of tyOpenArray, tyVarargs, tyProc, tyPointer:
+  of tyOpenArray, tyVarargs:
     discard
+  of tyProc, tyPointer, tyPtr:
+    if a.kind == nkNilLit:
+      # apply the type directly to the 'nil' expression
+      result = a
+      result.typ = n.typ
+    else:
+      result = nil # cannot fold
   else:
     # FIXME: conversion-to-enum is missing checks
     result = a
@@ -903,7 +910,7 @@ proc foldConstExprAux(m: PSym, n: PNode, idgen: IdGenerator, g: ModuleGraph): Fo
   # in the back-end (e.g. ``cast[pointer](someProc)``). In addition, so as to
   # not interfere with the documentation generator, statement-list expressions
   # are not folded if they have a comment in the first position
-  let exprIsPointerCast = n.kind in {nkCast, nkConv, nkHiddenStdConv} and
+  let exprIsPointerCast = n.kind == nkCast and
                           n.typ != nil and
                           n.typ.kind in {tyPointer, tyProc}
   if not exprIsPointerCast and
diff --git a/compiler/sem/transf.nim b/compiler/sem/transf.nim
index 7b96ae60e67..5feab15987f 100644
--- a/compiler/sem/transf.nim
+++ b/compiler/sem/transf.nim
@@ -636,12 +636,6 @@ proc transformConv(c: PTransf, n: PNode): PNode =
         result = newTreeIT(
           if diff < 0: nkObjUpConv else: nkObjDownConv,
           n.info, n.typ): transform(c, n[1])
-    of tyNil:
-      # a ``T(nil)`` expression
-      # XXX: it might be a better idea to eliminate the conversion during
-      #      semantic analysis instead
-      result = transform(c, n[1])
-      result.typ = n.typ
     else:
       result = transformSons(c, n)
   of tyObject:
@@ -653,13 +647,6 @@ proc transformConv(c: PTransf, n: PNode): PNode =
       result = newTreeIT(
         if diff < 0: nkObjUpConv else: nkObjDownConv,
         n.info, n.typ): transform(c, n[1])
-  of tyPointer:
-    case source.kind
-    of tyNil:
-      result = transform(c, n[1])
-      result.typ = n.typ
-    else:
-      result = transformSons(c, n)
   of tyGenericParam, tyOrdinal:
     result = transform(c, n[1])
     # happens sometimes for generated assignments, etc.
diff --git a/tests/lang_exprs/tnil_to_distinct_conversion.nim b/tests/lang_exprs/tnil_to_distinct_conversion.nim
new file mode 100644
index 00000000000..45a47d8ee22
--- /dev/null
+++ b/tests/lang_exprs/tnil_to_distinct_conversion.nim
@@ -0,0 +1,23 @@
+discard """
+  description: '''
+    Ensure that converting 'nil' literals to ``distinct pointer`` works
+  '''
+  matrix: "--hints:off --showir:mir_in:test"
+  nimoutFull: true
+  nimout: '''
+-- MIR: test
+scope:
+  def a: Ptr = nil
+  def b: Ptr = nil
+
+-- end
+'''
+"""
+
+type Ptr = distinct pointer
+
+proc test() =
+  var a = Ptr(nil) # direct conversions
+  var b = Ptr(pointer(nil)) # with intermediate conversion
+
+test()

From e0963b87615498c33c0e36b24c61810aa9d38877 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Thu, 8 Aug 2024 20:56:02 +0200
Subject: [PATCH 168/169] vmgen: respect overflow checks for 64-bit negation
 (#1408)

## Summary

Negation of 64-bit integers didn't respect the overflow check setting,
resulting in overflow defects even when the checks are disabled. This
is now fixed.

Fixes https://github.com/nim-works/nimskull/issues/1406.

## Details

The VM presently doesn't support unchecked negation. For ease of
implementation, unchecked negation is emulated in bytecode as
`not(x) + 1` (the two's complement identity for `-x`).
---
 compiler/vm/vmgen.nim                    | 17 +++++++++++++++--
 tests/overflw/tunchecked_negation_32.nim | 10 ++++++++++
 tests/overflw/tunchecked_negation_64.nim | 10 ++++++++++
 3 files changed, 35 insertions(+), 2 deletions(-)
 create mode 100644 tests/overflw/tunchecked_negation_32.nim
 create mode 100644 tests/overflw/tunchecked_negation_64.nim

diff --git a/compiler/vm/vmgen.nim b/compiler/vm/vmgen.nim
index 01fbe39faef..c530a4a7488 100644
--- a/compiler/vm/vmgen.nim
+++ b/compiler/vm/vmgen.nim
@@ -3018,8 +3018,21 @@ proc gen(c: var TCtx; n: CgNode; dest: var TDest) =
       clearDest(c, n, dest)
   of cnkNeg:
     prepare(c, dest, n.typ)
-    let a = c.genx(n[0])
-    c.gABC(n, pick(n, opcUnaryMinusInt, opcUnaryMinusFloat), dest, a)
+    let
+      a = c.genx(n[0])
+      op = pick(n, opcUnaryMinusInt, opcUnaryMinusFloat)
+    if op == opcUnaryMinusInt:
+      # the VM has no built-in unchecked integer negation, so it's emulated in
+      # an overflow-safe manner
+      # XXX: this is sub-optimal. In the future, all VM integer operations
+      #      should be unchecked
+      c.gABC(n, opcBitnotInt, dest, a)    # invert
+      let tmp = c.getTemp(slotTempInt)
+      c.gABx(n, opcLdImmInt, tmp, 1)
+      c.gABC(n, opcAddu, dest, dest, tmp) # + 1 (two's complement)
+      c.freeTemp(tmp)
+    else:
+      c.gABC(n, op, dest, a)
     c.freeTemp(a)
   of cnkAdd: binaryArith(c, n, n[0], n[1], dest, opcAddu, opcAddFloat)
   of cnkSub: binaryArith(c, n, n[0], n[1], dest, opcSubu, opcSubFloat)
diff --git a/tests/overflw/tunchecked_negation_32.nim b/tests/overflw/tunchecked_negation_32.nim
new file mode 100644
index 00000000000..e03c0260300
--- /dev/null
+++ b/tests/overflw/tunchecked_negation_32.nim
@@ -0,0 +1,10 @@
+discard """
+  description: '''
+    Ensure that disabling overflow checks works for 32-bit integer negations
+  '''
+  targets: "c js vm"
+  matrix: "--overflowChecks:off"
+"""
+
+var x = low(int32)
+discard -x
\ No newline at end of file
diff --git a/tests/overflw/tunchecked_negation_64.nim b/tests/overflw/tunchecked_negation_64.nim
new file mode 100644
index 00000000000..23ed5382a6a
--- /dev/null
+++ b/tests/overflw/tunchecked_negation_64.nim
@@ -0,0 +1,10 @@
+discard """
+  description: '''
+    Ensure that disabling overflow checks works for 64-bit integer negations
+  '''
+  targets: "c js vm"
+  matrix: "--overflowChecks:off"
+"""
+
+var x = low(int64)
+discard -x

From 1c9e91c405452242b78f1061672fa769c2f57ee2 Mon Sep 17 00:00:00 2001
From: zerbina <100542850+zerbina@users.noreply.github.com>
Date: Thu, 8 Aug 2024 21:32:56 +0200
Subject: [PATCH 169/169] vmgen: fix incorrect code generation for `lent`/`var`
 deref (#1409)

## Summary

Fix reading from a `var`/`lent` view of an unsigned integer (with a
bit-width <= 32) producing incorrect values when using the VM.

Fixes https://github.com/nim-works/nimskull/issues/1407.

## Details

* change `genDerefView` to take the `cnkDerefView` node as input, so
  that it has access to the type of the result
* the type of the *view* (not the storage type) was previously passed
  to the `genRegLoad` call, resulting in no `NarrowU` instruction being
  emitted for the memory access, and the value thus being sign-extended
---
 compiler/vm/vmgen.nim           | 19 +++++++++----------
 tests/vm/tvmgen_regressions.nim | 20 +++++++++++++++++++-
 2 files changed, 28 insertions(+), 11 deletions(-)

diff --git a/compiler/vm/vmgen.nim b/compiler/vm/vmgen.nim
index c530a4a7488..acada37c8ad 100644
--- a/compiler/vm/vmgen.nim
+++ b/compiler/vm/vmgen.nim
@@ -2466,18 +2466,17 @@ proc genAsgnToLocal(c: var TCtx, le, ri: CgNode) =
     gen(c, ri, dest)
 
 proc genDerefView(c: var TCtx, n: CgNode, dest: var TDest; load = true) =
-  ## Generates and emits the code for a view dereference, where `n` is the
-  ## expression that evaluates to a view. `load` indicates whether the
-  ## *handle* of the underlying location or the value stored in it should be
-  ## put into `dest`.
+  ## Generates and emits the code for a view dereference. `load` indicates
+  ## whether the *handle* of the underlying location or the value stored in
+  ## it should be put into `dest`.
   let
-    isPtr = isPtrView(n)
-    needsLoad = load and fitsRegister(n.typ.skipTypes(abstractVar))
+    isPtr = isPtrView(n.operand)
+    needsLoad = load and fitsRegister(n.typ)
 
   if isPtr or needsLoad:
     # we need to process the operand further, and thus need a temporary
     prepare(c, dest, n.typ) # XXX: the passed type is incorrect
-    let tmp = c.genx(n)
+    let tmp = c.genx(n.operand)
     var src = tmp
 
     if isPtr:
@@ -2493,7 +2492,7 @@ proc genDerefView(c: var TCtx, n: CgNode, dest: var TDest; load = true) =
     c.freeTemp(tmp)
   else:
     # no processing required; load the handle directly into `dest`
-    c.gen(n, dest)
+    c.gen(n.operand, dest)
 
 proc genAsgn(c: var TCtx; le, ri: CgNode; requiresCopy: bool) =
   case le.kind
@@ -2530,7 +2529,7 @@ proc genAsgn(c: var TCtx; le, ri: CgNode; requiresCopy: bool) =
       c.freeTemp(dest)
     else:
       var dest = noDest
-      genDerefView(c, le.operand, dest, load=false)
+      genDerefView(c, le, dest, load=false)
       putIntoLoc(c, ri, dest, 0, opcWrLoc, opcWrLoc)
       c.freeTemp(dest)
   of cnkDeref:
@@ -3083,7 +3082,7 @@ proc gen(c: var TCtx; n: CgNode; dest: var TDest) =
   of cnkDerefView:
     assert isLocView(n.operand.typ)
     # a view indirection
-    genDerefView(c, n.operand, dest)
+    genDerefView(c, n, dest)
   of cnkHiddenAddr:
     assert isLocView(n.typ)
     # load the source operand as a handle
diff --git a/tests/vm/tvmgen_regressions.nim b/tests/vm/tvmgen_regressions.nim
index 1af09d44ff2..e8ad9553487 100644
--- a/tests/vm/tvmgen_regressions.nim
+++ b/tests/vm/tvmgen_regressions.nim
@@ -30,4 +30,22 @@ block wrong_getast:
     let x = [getAst(m())]
     doAssert x[0].intVal == 1
 
-  m2()
\ No newline at end of file
+  m2()
+
+block wrong_uint_view_deref:
+  # reading from a lent/var indirection produced the wrong value for non-full-
+  # width integer types, when the highest bit was set
+  proc f_lent[T](x: var T): lent T = x
+  proc f_var[T](x: var T): var T = x
+
+  var
+    a = high(uint8)
+    b = high(uint16)
+    c = high(uint32)
+
+  doAssert f_lent(a) == high(uint8)
+  doAssert f_lent(b) == high(uint16)
+  doAssert f_lent(c) == high(uint32)
+  doAssert f_var(a)  == high(uint8)
+  doAssert f_var(b)  == high(uint16)
+  doAssert f_var(c)  == high(uint32)