mirror of
https://github.com/odin-lang/Odin.git
synced 2025-12-29 09:24:33 +00:00
210 lines
4.5 KiB
Odin
210 lines
4.5 KiB
Odin
package strings
|
|
|
|
import "core:mem"
|
|
import "core:unicode/utf8"
|
|
import "core:strconv"
|
|
|
|
Builder :: struct {
|
|
buf: [dynamic]byte,
|
|
}
|
|
|
|
make_builder :: proc(allocator := context.allocator) -> Builder {
|
|
return Builder{make([dynamic]byte)};
|
|
}
|
|
|
|
destroy_builder :: proc(b: ^Builder) {
|
|
delete(b.buf);
|
|
clear(&b.buf);
|
|
}
|
|
|
|
builder_from_slice :: proc(backing: []byte) -> Builder {
|
|
s := transmute(mem.Raw_Slice)backing;
|
|
d := mem.Raw_Dynamic_Array{
|
|
data = s.data,
|
|
len = 0,
|
|
cap = s.len,
|
|
allocator = mem.nil_allocator(),
|
|
};
|
|
return transmute(Builder)d;
|
|
}
|
|
to_string :: proc(b: Builder) -> string {
|
|
return string(b.buf[:]);
|
|
}
|
|
|
|
builder_len :: proc(b: Builder) -> int {
|
|
return len(b.buf);
|
|
}
|
|
builder_cap :: proc(b: Builder) -> int {
|
|
return cap(b.buf);
|
|
}
|
|
|
|
write_byte :: proc(b: ^Builder, x: byte) {
|
|
append(&b.buf, x);
|
|
}
|
|
|
|
write_rune :: proc(b: ^Builder, r: rune) -> int {
|
|
if r < utf8.RUNE_SELF {
|
|
write_byte(b, byte(r));
|
|
return 1;
|
|
}
|
|
|
|
s, n := utf8.encode_rune(r);
|
|
write_bytes(b, s[:n]);
|
|
return n;
|
|
}
|
|
|
|
write_string :: proc(b: ^Builder, s: string) {
|
|
write_bytes(b, cast([]byte)s);
|
|
}
|
|
|
|
write_bytes :: proc(b: ^Builder, x: []byte) {
|
|
append(&b.buf, ..x);
|
|
}
|
|
|
|
@(private)
|
|
static DIGITS_LOWER := "0123456789abcdefx";
|
|
|
|
write_quoted_string :: proc(b: ^Builder, s: string, quote: byte = '"') {
|
|
write_byte(b, quote);
|
|
for width := 0; len(s) > 0; s = s[width:] {
|
|
r := rune(s[0]);
|
|
width = 1;
|
|
if r >= utf8.RUNE_SELF {
|
|
r, width = utf8.decode_rune_in_string(s);
|
|
}
|
|
if width == 1 && r == utf8.RUNE_ERROR {
|
|
write_byte(b, '\\');
|
|
write_byte(b, 'x');
|
|
write_byte(b, DIGITS_LOWER[s[0]>>4]);
|
|
write_byte(b, DIGITS_LOWER[s[0]&0xf]);
|
|
continue;
|
|
}
|
|
|
|
write_escaped_rune(b, r, quote);
|
|
|
|
}
|
|
write_byte(b, quote);
|
|
}
|
|
|
|
|
|
write_encoded_rune :: proc(b: ^Builder, r: rune, write_quote := true) {
|
|
if write_quote do write_byte(b, '\'');
|
|
switch r {
|
|
case '\a': write_string(b, `\a"`);
|
|
case '\b': write_string(b, `\b"`);
|
|
case '\e': write_string(b, `\e"`);
|
|
case '\f': write_string(b, `\f"`);
|
|
case '\n': write_string(b, `\n"`);
|
|
case '\r': write_string(b, `\r"`);
|
|
case '\t': write_string(b, `\t"`);
|
|
case '\v': write_string(b, `\v"`);
|
|
case:
|
|
if r < 32 {
|
|
write_string(b, `\x`);
|
|
buf: [2]byte;
|
|
s := strconv.append_bits(buf[:], u64(r), 16, true, 64, strconv.digits, nil);
|
|
switch len(s) {
|
|
case 0: write_string(b, "00");
|
|
case 1: write_byte(b, '0');
|
|
case 2: write_string(b, s);
|
|
}
|
|
} else {
|
|
write_rune(b, r);
|
|
}
|
|
|
|
}
|
|
if write_quote do write_byte(b, '\'');
|
|
}
|
|
|
|
|
|
write_escaped_rune :: proc(b: ^Builder, r: rune, quote: byte, html_safe := false) {
|
|
is_printable :: proc(r: rune) -> bool {
|
|
if r <= 0xff {
|
|
switch r {
|
|
case 0x20..0x7e:
|
|
return true;
|
|
case 0xa1..0xff: // ¡ through ÿ except for the soft hyphen
|
|
return r != 0xad; //
|
|
}
|
|
}
|
|
|
|
// TODO(bill): A proper unicode library will be needed!
|
|
return false;
|
|
}
|
|
|
|
if html_safe {
|
|
switch r {
|
|
case '<', '>', '&':
|
|
write_byte(b, '\\');
|
|
write_byte(b, 'u');
|
|
for s := 12; s >= 0; s -= 4 {
|
|
write_byte(b, DIGITS_LOWER[r>>uint(s) & 0xf]);
|
|
}
|
|
return;
|
|
}
|
|
}
|
|
|
|
if r == rune(quote) || r == '\\' {
|
|
write_byte(b, '\\');
|
|
write_byte(b, byte(r));
|
|
return;
|
|
} else if is_printable(r) {
|
|
write_encoded_rune(b, r, false);
|
|
return;
|
|
}
|
|
switch r {
|
|
case '\a': write_string(b, `\a`);
|
|
case '\b': write_string(b, `\b`);
|
|
case '\e': write_string(b, `\e`);
|
|
case '\f': write_string(b, `\f`);
|
|
case '\n': write_string(b, `\n`);
|
|
case '\r': write_string(b, `\r`);
|
|
case '\t': write_string(b, `\t`);
|
|
case '\v': write_string(b, `\v`);
|
|
case:
|
|
switch {
|
|
case r < ' ':
|
|
write_byte(b, '\\');
|
|
write_byte(b, 'x');
|
|
write_byte(b, DIGITS_LOWER[byte(r)>>4]);
|
|
write_byte(b, DIGITS_LOWER[byte(r)&0xf]);
|
|
|
|
case r > utf8.MAX_RUNE:
|
|
r = 0xfffd;
|
|
fallthrough;
|
|
case r < 0x10000:
|
|
write_byte(b, '\\');
|
|
write_byte(b, 'u');
|
|
for s := 12; s >= 0; s -= 4 {
|
|
write_byte(b, DIGITS_LOWER[r>>uint(s) & 0xf]);
|
|
}
|
|
case:
|
|
write_byte(b, '\\');
|
|
write_byte(b, 'U');
|
|
for s := 28; s >= 0; s -= 4 {
|
|
write_byte(b, DIGITS_LOWER[r>>uint(s) & 0xf]);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
write_u64 :: proc(b: ^Builder, i: u64, base: int = 10) {
|
|
buf: [32]byte;
|
|
s := strconv.append_bits(buf[:], u64(i), base, false, 64, strconv.digits, nil);
|
|
write_string(b, s);
|
|
}
|
|
write_i64 :: proc(b: ^Builder, i: i64, base: int = 10) {
|
|
buf: [32]byte;
|
|
s := strconv.append_bits(buf[:], u64(i), base, true, 64, strconv.digits, nil);
|
|
write_string(b, s);
|
|
}
|
|
|
|
write_uint :: proc(b: ^Builder, i: uint, base: int = 10) {
|
|
write_u64(b, u64(i), base);
|
|
}
|
|
write_int :: proc(b: ^Builder, i: int, base: int = 10) {
|
|
write_i64(b, i64(i), base);
|
|
}
|
|
|