Files
Odin/core/strings/builder.odin

210 lines
4.5 KiB
Odin

package strings
import "core:mem"
import "core:unicode/utf8"
import "core:strconv"
Builder :: struct {
buf: [dynamic]byte,
}
make_builder :: proc(allocator := context.allocator) -> Builder {
return Builder{make([dynamic]byte)};
}
destroy_builder :: proc(b: ^Builder) {
delete(b.buf);
clear(&b.buf);
}
builder_from_slice :: proc(backing: []byte) -> Builder {
s := transmute(mem.Raw_Slice)backing;
d := mem.Raw_Dynamic_Array{
data = s.data,
len = 0,
cap = s.len,
allocator = mem.nil_allocator(),
};
return transmute(Builder)d;
}
to_string :: proc(b: Builder) -> string {
return string(b.buf[:]);
}
builder_len :: proc(b: Builder) -> int {
return len(b.buf);
}
builder_cap :: proc(b: Builder) -> int {
return cap(b.buf);
}
write_byte :: proc(b: ^Builder, x: byte) {
append(&b.buf, x);
}
write_rune :: proc(b: ^Builder, r: rune) -> int {
if r < utf8.RUNE_SELF {
write_byte(b, byte(r));
return 1;
}
s, n := utf8.encode_rune(r);
write_bytes(b, s[:n]);
return n;
}
write_string :: proc(b: ^Builder, s: string) {
write_bytes(b, cast([]byte)s);
}
write_bytes :: proc(b: ^Builder, x: []byte) {
append(&b.buf, ..x);
}
@(private, static)
DIGITS_LOWER := "0123456789abcdefx";
write_quoted_string :: proc(b: ^Builder, s: string, quote: byte = '"') {
write_byte(b, quote);
for width := 0; len(s) > 0; s = s[width:] {
r := rune(s[0]);
width = 1;
if r >= utf8.RUNE_SELF {
r, width = utf8.decode_rune_in_string(s);
}
if width == 1 && r == utf8.RUNE_ERROR {
write_byte(b, '\\');
write_byte(b, 'x');
write_byte(b, DIGITS_LOWER[s[0]>>4]);
write_byte(b, DIGITS_LOWER[s[0]&0xf]);
continue;
}
write_escaped_rune(b, r, quote);
}
write_byte(b, quote);
}
write_encoded_rune :: proc(b: ^Builder, r: rune, write_quote := true) {
if write_quote do write_byte(b, '\'');
switch r {
case '\a': write_string(b, `\a"`);
case '\b': write_string(b, `\b"`);
case '\e': write_string(b, `\e"`);
case '\f': write_string(b, `\f"`);
case '\n': write_string(b, `\n"`);
case '\r': write_string(b, `\r"`);
case '\t': write_string(b, `\t"`);
case '\v': write_string(b, `\v"`);
case:
if r < 32 {
write_string(b, `\x`);
buf: [2]byte;
s := strconv.append_bits(buf[:], u64(r), 16, true, 64, strconv.digits, nil);
switch len(s) {
case 0: write_string(b, "00");
case 1: write_byte(b, '0');
case 2: write_string(b, s);
}
} else {
write_rune(b, r);
}
}
if write_quote do write_byte(b, '\'');
}
write_escaped_rune :: proc(b: ^Builder, r: rune, quote: byte, html_safe := false) {
is_printable :: proc(r: rune) -> bool {
if r <= 0xff {
switch r {
case 0x20..0x7e:
return true;
case 0xa1..0xff: // ¡ through ÿ except for the soft hyphen
return r != 0xad; //
}
}
// TODO(bill): A proper unicode library will be needed!
return false;
}
if html_safe {
switch r {
case '<', '>', '&':
write_byte(b, '\\');
write_byte(b, 'u');
for s := 12; s >= 0; s -= 4 {
write_byte(b, DIGITS_LOWER[r>>uint(s) & 0xf]);
}
return;
}
}
if r == rune(quote) || r == '\\' {
write_byte(b, '\\');
write_byte(b, byte(r));
return;
} else if is_printable(r) {
write_encoded_rune(b, r, false);
return;
}
switch r {
case '\a': write_string(b, `\a`);
case '\b': write_string(b, `\b`);
case '\e': write_string(b, `\e`);
case '\f': write_string(b, `\f`);
case '\n': write_string(b, `\n`);
case '\r': write_string(b, `\r`);
case '\t': write_string(b, `\t`);
case '\v': write_string(b, `\v`);
case:
switch {
case r < ' ':
write_byte(b, '\\');
write_byte(b, 'x');
write_byte(b, DIGITS_LOWER[byte(r)>>4]);
write_byte(b, DIGITS_LOWER[byte(r)&0xf]);
case r > utf8.MAX_RUNE:
r = 0xfffd;
fallthrough;
case r < 0x10000:
write_byte(b, '\\');
write_byte(b, 'u');
for s := 12; s >= 0; s -= 4 {
write_byte(b, DIGITS_LOWER[r>>uint(s) & 0xf]);
}
case:
write_byte(b, '\\');
write_byte(b, 'U');
for s := 28; s >= 0; s -= 4 {
write_byte(b, DIGITS_LOWER[r>>uint(s) & 0xf]);
}
}
}
}
write_u64 :: proc(b: ^Builder, i: u64, base: int = 10) {
buf: [32]byte;
s := strconv.append_bits(buf[:], u64(i), base, false, 64, strconv.digits, nil);
write_string(b, s);
}
write_i64 :: proc(b: ^Builder, i: i64, base: int = 10) {
buf: [32]byte;
s := strconv.append_bits(buf[:], u64(i), base, true, 64, strconv.digits, nil);
write_string(b, s);
}
write_uint :: proc(b: ^Builder, i: uint, base: int = 10) {
write_u64(b, u64(i), base);
}
write_int :: proc(b: ^Builder, i: int, base: int = 10) {
write_i64(b, i64(i), base);
}