8000 Use a context value for more reliable incremental parsing · geddski/python@bbb9fd5 · GitHub
[go: up one dir, main page]

Skip to content

Commit bbb9fd5

Browse files
committed
Use a context value for more reliable incremental parsing
FIX: Fix a bug where incremental parses could get confused about block nesting. Issue codemirror/dev#394
1 parent f027de4 commit bbb9fd5

File tree

3 files changed

+56
-120
lines changed

3 files changed

+56
-120
lines changed

package.json

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -13,13 +13,13 @@
1313
"author": "Marijn Haverbeke <marijnh@gmail.com>",
1414
"license": "MIT",
1515
"devDependencies": {
16-
"lezer-generator": "^0.13.0",
16+
"lezer-generator": "^0.13.3",
1717
"mocha": "^8.1.3",
1818
"rollup": "^2.27.1",
1919
"@rollup/plugin-node-resolve": "^9.0.0"
2020
},
2121
"dependencies": {
22-
"lezer": "^0.13.0"
22+
"lezer": "^0.13.2"
2323
},
2424
"repository": {
2525
"type" : "git",

src/python.grammar

Lines changed: 9 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -67,7 +67,7 @@ importedNames { commaSep<VariableName | VariableName kw<"as"> VariableName> }
6767

6868
commaSep<expr> { expr ("," expr)* ","? }
6969

70-
compoundStatement[@export] {
70+
compoundStatement {
7171
IfStatement |
7272
WhileStatement { kw<"while"> testNamed Body elseClause? } |
7373
ForStatement { kw<"async">? kw<"for"> commaSep<"*"? expression> kw<"in"> commaSep<test> Body elseClause? } |
@@ -78,22 +78,22 @@ compoundStatement[@export] {
7878
DecoratedStatement { Decorator+ (ClassDefinition | FunctionDefinition) }
7979
}
8080

81-
elseClause { _else Body }
81+
elseClause { kw<"else"> Body }
8282

8383
IfStatement {
8484
kw<"if"> testNamed Body
85-
(_elif testNamed? Body)*
85+
(kw<"elif"> testNamed? Body)*
8686
elseClause?
8787
}
8888

8989
TryStatement {
9090
kw<"try"> Body
91-
(_except (test ((kw<"as"> | ",") VariableName)?)? Body)*
91+
(kw<"except"> (test ((kw<"as"> | ",") VariableName)?)? Body)*
9292
elseClause?
93-
(_finally Body)?
93+
(kw<"finally"> Body)?
9494
}
9595

96-
Body { ":" (simpleStatement | newline continueBody statement (continueBody statement)* (endBody | eof)) }
96+
Body { ":" (simpleStatement | newline indent statement+ (dedent | eof)) }
9797

9898
lambdaParam { VariableName (AssignOp{"="} test)? | "*" VariableName? | "**" VariableName }
9999

@@ -203,14 +203,11 @@ kw<term> { @specialize[@name={term}]<identifier, term> }
203203

204204
FormatReplacement { "{" (YieldExpression | commaSep<"*"? test>) FormatConversion? (formatStringSpec | "}") }
205205

206+
@context trackIndent from "./tokens.js"
207+
206208
@external tokens legacyPrint from "./tokens.js" { printKeyword[@name="print"] }
207209

208-
@external tokens statementContinueKeyword from "./tokens" {
209-
_else[@name="else"],
210-
_elif[@name="elif"],
211-
_except[@name="except"],
212-
_finally[@name="finally"]
213-
}
210+
@external tokens indentation from "./tokens" { indent, dedent }
214211

215212
@tokens {
216213
CompareOp { "<" | ">" | $[<>=!] "=" | "<>" }
@@ -289,5 +286,3 @@ FormatReplacement { "{" (YieldExpression | commaSep<"*"? test>) FormatConversion
289286
}
290287

291288
@external tokens newlines from "./tokens" { newline, newlineBracketed, newlineEmpty, eof }
292-
293-
@external tokens bodyContinue from "./tokens" { continueBody, endBody }

src/tokens.js

Lines changed: 45 additions & 104 deletions
Original file line numberDiff line numberDiff line change
@@ -1,132 +1,73 @@
1-
import {ExternalTokenizer} from "lezer"
1+
import {ExternalTokenizer, ContextTracker} from "lezer"
22
import {
3-
newline as newlineToken, eof, newlineEmpty, newlineBracketed, continueBody, endBody,
4-
_else, _elif, _except, _finally,
3+
newline as newlineToken, eof, newlineEmpty, newlineBracketed, indent, dedent, printKeyword,
54
ParenthesizedExpression, TupleExpression, ComprehensionExpression, ArrayExpression, ArrayComprehensionExpression,
6-
DictionaryExpression, DictionaryComprehensionExpression, SetExpression, SetComprehensionExpression,
7-
compoundStatement,
8-
printKeyword
5+
DictionaryExpression, DictionaryComprehensionExpression, SetExpression, SetComprehensionExpression
96
} from "./parser.terms.js"
107

118
const newline = 10, carriageReturn = 13, space = 32, tab = 9, hash = 35, parenOpen = 40, dot = 46
129

1310
const bracketed = [
1411
ParenthesizedExpression, TupleExpression, ComprehensionExpression, ArrayExpression, ArrayComprehensionExpression,
1512
DictionaryExpression, DictionaryComprehensionExpression, SetExpression, SetComprehensionExpression
16-
], parentStatement = [compoundStatement]
17-
18-
const caches = new WeakMap
19-
20-
// Per-input-stream indentation cache. `prev` maps indentation depths
21-
// to the last position at which a statement indented to that depth
22-
// was seen. There's an extra set of slots for the _current_
23-
// indentation, since that needs to be available alongside a previous
24-
// indentation position at the same level.
25-
class Cache {
26-
constructor() {
27-
this.last = this.lastIndent = -1
28-
this.prev = []
29-
}
30-
31-
get(pos) {
32-
if (this.last == pos) return this.lastIndent
33-
for (let i = 0; i < this.prev.length; i++) if (this.prev[i] == pos) return i
34-
return -1
35-
}
36-
37-
set(pos, indent) {
38-
if (pos == this.last) return
39-
if (this.last > -1) this.setPrev(this.last, this.lastIndent)
40-
this.last = pos
41-
this.lastIndent = indent
42-
}
43-
44-
setPrev(pos, indent) {
45-
while (this.prev.length < indent) this.prev.push(-1)
46-
this.prev[indent] = pos
47-
}
48-
49-
static for(input) {
50-
let found = caches.get(input)
51-
if (!found) caches.set(input, found = new Cache)
52-
return found
53-
}
54-
}
55-
56-
const maxIndent = 50
13+
]
5714

15+
let cachedIndent = 0, cachedInput = null, cachedPos = 0
5816
function getIndent(input, pos) {
59-
let cache = Cache.for(input), found = cache.get(pos)
60-
if (found > -1) return found
17+
if (pos == cachedPos && input == cachedInput) return cachedIndent
18+
cachedInput = input; cachedPos = pos
19+
return cachedIndent = getIndentInner(input, pos)
20+
}
6121

62-
// This shouldn't happen very often (or even at all) in normal
63-
// parsing, since the indentations are stored by the newline
64-
// tokenizer ahead of time. But it's kind of tricky to prove whether
65-
// that always happens in incremental parsing scenarios, so here's a
66-
// fallback anyway.
67-
let before = input.read(Math.max(0, pos - maxIndent), pos)
68-
let count = 0, start = before.length
69-
for (; start > 0; start--) {
70-
let next = before.charCodeAt(start - 1)
71-
if (next == newline || next == carriageReturn) break
72-
}
73-
for (let i = start; i < before.length; i++) {
74-
let ch = before.charCodeAt(i)
75-
if (ch == space) count++
76-
else if (ch == tab) count += 8 - (count % 8)
77-
else break
22+
function getIndentInner(input, pos) {
23+
for (let indent = 0;; pos++) {
24+
let ch = input.get(pos)
25+
if (ch == space) indent++
26+
else if (ch == tab) indent += 8 - (indent % 8)
27+
else if (ch == newline || ch == carriageReturn || ch == hash) return -1
28+
else return indent
7829
}
79-
cache.setPrev(pos, count)
80-
return count
8130
}
8231

8332
export const newlines = new ExternalTokenizer((input, token, stack) => {
8433
let next = input.get(token.start)
8534
if (next < 0) {
8635
token.accept(eof, token.start)
87-
return
88-
}
89-
if (next != newline && next != carriageReturn) return
90-
if (stack.startOf(bracketed) != null) {
36+
} else if (next != newline && next != carriageReturn) {
37+
} else if (stack.startOf(bracketed) != null) {
9138
token.accept(newlineBracketed, token.start + 1)
92-
return
93-
}
94-
let scan = token.start + 1, indent = 0
95-
for (; scan < input.length; scan++) {
96-
let ch = input.get(scan)
97-
if (ch == space) indent++
98-
else if (ch == tab) indent += 8 - (indent % 8)
99-
else if (ch == newline || ch == carriageReturn || ch == hash) {
100-
token.accept(newlineEmpty, token.start + 1)
101-
return
102-
} else {
103-
break
104-
}
39+
} else if (getIndent(input, token.start + 1) < 0) {
40+
token.accept(newlineEmpty, token.start + 1)
41+
} else {
42+
token.accept(newlineToken, token.start + 1)
10543
}
106-
token.accept(newlineToken, token.start + 1)
107-
Cache.for(input).set(scan, indent)
10844
}, {contextual: true, fallback: true})
10945

110-
export const bodyContinue = new ExternalTokenizer((input, token, stack) => {
111-
let parent = stack.startOf(parentStatement)
112-
let parentIndent = parent == null ? 0 : getIndent(input, parent)
113-
let indentHere = getIndent(input, token.start)
114-
token.accept(indentHere <= parentIndent ? endBody : continueBody, token.start)
115-
}, {contextual: true, fallback: true})
46+
export const indentation = new ExternalTokenizer((input, token, stack) => {
47+
let prev = input.get(token.start - 1), depth
48+
if ((prev == newline || prev == carriageReturn) &&
49+
(depth = getIndent(input, token.start)) >= 0 &&
50+
depth != stack.context.depth &&
51+
stack.startOf(bracketed) == null)
52+
token.accept(depth < stack.context.depth ? dedent : indent, token.start)
53+
})
11654

117-
let keywords = {else: _else, elif: _elif, except: _except, finally: _finally}
55+
function IndentLevel(parent, depth) {
56+
this.parent = parent
57+
this.depth = depth
58+
this.hash = (parent ? parent.hash + parent.hash << 8 : 0) + depth + (depth << 4)
59+
}
11860

119-
// Matches else/elif/except/finally, but only when at same indentation
120-
// as their parent statement
121-
export const statementContinueKeyword = new ExternalTokenizer((input, token, stack) => {
122-
let pos = token.start, next = input.get(token.start), m
123-
if (next == 101 /* 'e' */ && (m = /^(?:else|elif|except)\b/.exec(input.read(pos, pos + 7))) ||
124-
next == 102 /* 'f' */ && (m = /^finally\b/.exec(input.read(pos, pos + 8)))) {
125-
let parent = stack.startOf(parentStatement)
126-
let parentIndent = parent == null ? 0 : getIndent(input, parent)
127-
if (getIndent(input, token.start) == parentIndent) token.accept(keywords[m[0]], pos + m[0].length)
128-
}
129-
}, {contextual: true, fallback: true})
61+
const topIndent = new IndentLevel(null, 0)
62+
63+
export const trackIndent = new ContextTracker({
64+
start: topIndent,
65+
shift(context, term, input, stack) {
66+
return term == indent ? new IndentLevel(context, getIndent(input, stack.pos)) :
67+
term == dedent ? context.parent : context
68+
},
69+
hash(context) { return context.hash }
70+
})
13071

13172
export const legacyPrint = new ExternalTokenizer((input, token) => {
13273
let pos = token.start

0 commit comments

Comments
 (0)