Update strings.prefix_length to handle partial UTF-8 runes.

2026-02-17 08:34:08 +00:00 · 2022-06-16 16:12:15 +02:00
parent 84a424f21e
commit 6f1222e9bf
1 changed files with 15 additions and 6 deletions
--- a/core/strings/strings.odin
+++ b/core/strings/strings.odin
@@ -225,14 +225,23 @@ equal_fold :: proc(u, v: string) -> bool {
 */
 prefix_length :: proc(a, b: string) -> (n: int) {
 	_len := min(len(a), len(b))
-	idx  := 0

-	#no_bounds_check for idx < _len && a[idx] == b[idx] {
-		idx += 1
+	// Scan for matches including partial codepoints.
+	#no_bounds_check for n < _len && a[n] == b[n] {
+		n += 1
+	}

-		if a[idx] & 128 != 128 {
-			// new codepoint or end of multi-byte codepoint, update match length
-			n = idx
+	// Now scan to ignore partial codepoints.
+	if n > 0 {
+		s := a[:n]
+		n = 0
+		for {
+			r0, w := utf8.decode_rune(s[n:])
+			if r0 != utf8.RUNE_ERROR {
+				n += w
+			} else {
+				break
+			}
 		}
 	}
 	return