about summary refs log tree commit diff stats
path: root/shell/tokenize.mu
diff options
context:
space:
mode:
authorKartik K. Agaram <vc@akkartik.com>2021-06-18 19:46:19 -0700
committerKartik K. Agaram <vc@akkartik.com>2021-06-18 19:52:54 -0700
commitdd133c2a095228e8424a388ca575a8086ee34690 (patch)
treeecc408188e62dd66feec8e01e14d577d89b01fe7 /shell/tokenize.mu
parentb5306cabd38da962842aea7d536d44e7edca50bc (diff)
downloadmu-dd133c2a095228e8424a388ca575a8086ee34690.tar.gz
start implementing indent-sensitivity
General plan:
  stop skipping newlines during tokenization
  introduce a new indent token, initially skip it transparently
  start doing cleverer things
Diffstat (limited to 'shell/tokenize.mu')
-rw-r--r--shell/tokenize.mu28
1 files changed, 26 insertions, 2 deletions
diff --git a/shell/tokenize.mu b/shell/tokenize.mu
index e019a3b4..8c7583a9 100644
--- a/shell/tokenize.mu
+++ b/shell/tokenize.mu
@@ -4,6 +4,7 @@ type token {
   # type 0: default
   # type 1: stream
   text-data: (handle stream byte)
+  # type 2: skip (end of line or end of file)
 }
 
 fn tokenize in: (addr gap-buffer), out: (addr stream token), trace: (addr trace) {
@@ -11,7 +12,6 @@ fn tokenize in: (addr gap-buffer), out: (addr stream token), trace: (addr trace)
   trace-lower trace
   rewind-gap-buffer in
   {
-    skip-whitespace-from-gap-buffer in
     var done?/eax: boolean <- gap-buffer-scan-done? in
     compare done?, 0/false
     break-if-!=
@@ -25,7 +25,10 @@ fn tokenize in: (addr gap-buffer), out: (addr stream token), trace: (addr trace)
       break-if-=
       return
     }
-    var skip?/eax: boolean <- comment-token? token
+    var comment?/eax: boolean <- comment-token? token
+    compare comment?, 0/false
+    loop-if-!=
+    var skip?/eax: boolean <- skip-token? token
     compare skip?, 0/false
     loop-if-!=
     write-to-stream out, token  # shallow-copy text-data
@@ -293,6 +296,16 @@ fn test-tokenize-stream-literal-in-tree {
 fn next-token in: (addr gap-buffer), _out-token: (addr token), trace: (addr trace) {
   trace-text trace, "tokenize", "next-token"
   trace-lower trace
+  skip-whitespace-from-gap-buffer in
+  {
+    var done?/eax: boolean <- gap-buffer-scan-done? in
+    compare done?, 0/false
+    break-if-=
+    var out-token/eax: (addr token) <- copy _out-token
+    var out-token-type/eax: (addr int) <- get out-token, type
+    copy-to *out-token-type, 2/skip
+    return
+  }
   var _g/eax: grapheme <- peek-from-gap-buffer in
   var g/ecx: grapheme <- copy _g
   {
@@ -1126,6 +1139,17 @@ fn comment-token? _in: (addr token) -> _/eax: boolean {
   return 1/true
 }
 
+fn skip-token? _in: (addr token) -> _/eax: boolean {
+  var in/eax: (addr token) <- copy _in
+  var in-type/eax: (addr int) <- get in, type
+  compare *in-type, 2/skip
+  {
+    break-if-=
+    return 0/false
+  }
+  return 1/true
+}
+
 fn allocate-token _out: (addr handle token) {
   var out/eax: (addr handle token) <- copy _out
   allocate out