refact(rivet/tokenizer): simplify Tokenizer.decode_unicode_escaped_rune()

StunxFS · StunxFS · commit ce04b51eed9e · 2023-11-16T20:47:45.000-04:00
diff --git a/lib/rivet/src/ast/CHeader.ri b/lib/rivet/src/ast/CHeader.ri
@@ -2,14 +2,12 @@
 // Use of this source code is governed by an MIT license that can
 // be found in the LICENSE file.
 
-import std/conv;
 import std/traits;
 import std/process;
 import std/strings;
 import { Path } from std/fs;
 
 import ../token;
-import ../report;
 
 // Useful functions to get system `#define`s.
 // Will soon be used to implement `extern (C) import`.
diff --git a/lib/rivet/src/tokenizer/mod.ri b/lib/rivet/src/tokenizer/mod.ri
@@ -307,23 +307,16 @@ func decode_u_escape_single(str: string, idx: uint) -> (uint, string) {
 }
 
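-// decode the flagged unicode escape sequences into their utf-8 bytes
+// decode the unicode escape sequence at the start of `str` into its utf-8 bytes, keeping any text after it unchanged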
-func decode_u_escapes(str: string, start: uint, escapes_pos: []uint) -> string {
-    if escapes_pos.is_empty() {
-        return str;
-    }
-    mut ss := @vec(string, escapes_pos.len * 2 + 1);
-    ss.push(str[..escapes_pos[escapes_pos.len - 1] - start]);
-    for i, pos in escapes_pos {
-        idx := pos - start;
-        (end_idx, segment) := decode_u_escape_single(str, idx);
+func decode_unicode_escaped_rune(str: string) -> string {
+    (end_idx, segment) := decode_u_escape_single(str, 0);
+    return if str.len == end_idx {
+        segment
+    } else {
+        mut ss := @vec(string, 2);
         ss.push(segment);
-        ss.push(if i + 1 < escapes_pos.len {
-            str[end_idx..escapes_pos[i + 1] - start]
-        } else {
-            str[end_idx..]
-        });
-    }
-    return utils.join(ss, "");
+        ss.push(str[end_idx..]);
+        utils.join(ss, "")
+    };
 }
 
 func trim_slash_line_break(s: string) -> string {
diff --git a/lib/rivet/src/tokenizer/next.ri b/lib/rivet/src/tokenizer/next.ri
@@ -584,7 +584,7 @@ extend Tokenizer {
             if ch.len % 2 == 0 and (escaped_hex or escaped_unicode or escaped_octal) {
                 if escaped_unicode {
                     // there can only be one, so attempt to decode it now
-                    ch = decode_u_escapes(ch, 0, [0]);
+                    ch = decode_unicode_escaped_rune(ch);
                 } else {
                     // find escape sequence start positions
                     mut escapes_pos := @vec(uint);