Files
Nim/lib/system/strs_v3.nim
ringabout f1a7bfce47 switch on
2023-12-11 14:12:47 +00:00

266 lines
8.9 KiB
Nim

#
#
# Nim's Runtime Library
# (c) Copyright 2024 Nim contributors
#
# See the file "copying.txt", included in this
# distribution, for details about the copyright.
#
## Default new string implementation used by Nim's core.
type
NimStrPayloadBase = object
## cap lives at the negative offset of p: p - wordSize
cap: int
NimStringV3 {.core.} = object
rawlen: int ## the lowest bit is used to indict whether it's a const or intern string
## TODO: would it be better to use distinct?
p: ptr UncheckedArray[char] ## can be nil if len == 0.
## cap lives at the negative offset of p: p - wordSize
## non-zero terminated
const nimStrVersion {.core.} = 3
# TODO: fixme what about s.p != nil?
template isLiteral(s): bool = (s.rawlen and 1) == 1
template strHead(p: pointer): pointer =
cast[pointer](cast[int](p) -% sizeof(NimStrPayloadBase))
template strCap(p: pointer): int =
cast[ptr NimStrPayloadBase](strHead(p))[].cap
template `strCap=`(p: pointer, size: int) =
cast[ptr NimStrPayloadBase](strHead(p))[].cap = size
proc nimStrLenV3(s: NimStringV3): int {.compilerRtl, inl.} = s.rawlen shr 1
template toRawLen(len: int): int = len shl 1
template incRawLen(s: var NimStringV3, value: int = 1) =
s.rawlen += value shl 1
template setRawLen(s: var NimStringV3, len: int) =
if isLiteral(s):
s.rawLen = toRawLen(len) or 1
else:
s.rawLen = toRawLen(len)
proc markIntern(s: var NimStringV3): bool =
s.rawlen = s.rawlen or 1
result = not isLiteral(s)
proc unsafeUnmarkIntern(s: var NimStringV3) =
s.rawlen = s.rawlen and (not 1) # unmark?
when compileOption("threads"):
deallocShared(strHead(s.p))
else:
dealloc(strHead(s.p))
template contentSize(cap): int = cap + sizeof(NimStrPayloadBase)
template frees(s) =
if not isLiteral(s) and s.p != nil:
when compileOption("threads"):
deallocShared(strHead(s.p))
else:
dealloc(strHead(s.p))
template allocPayload(newLen: int): ptr UncheckedArray[char] =
when compileOption("threads"):
cast[ptr UncheckedArray[char]](allocShared(contentSize(newLen)) +! sizeof(NimStrPayloadBase))
else:
cast[ptr UncheckedArray[char]](alloc(contentSize(newLen)) +! sizeof(NimStrPayloadBase))
template allocPayload0(newLen: int): ptr UncheckedArray[char] =
when compileOption("threads"):
cast[ptr UncheckedArray[char]](allocShared0(contentSize(newLen)) +! sizeof(NimStrPayloadBase))
else:
cast[ptr UncheckedArray[char]](alloc0(contentSize(newLen)) +! sizeof(NimStrPayloadBase))
template reallocPayload(p: pointer, newLen: int): ptr UncheckedArray[char] =
when compileOption("threads"):
cast[ptr UncheckedArray[char]](reallocShared(p, contentSize(newLen)) +! sizeof(NimStrPayloadBase))
else:
cast[ptr UncheckedArray[char]](realloc(p, contentSize(newLen)) +! sizeof(NimStrPayloadBase))
template reallocPayload0(p: pointer; oldLen, newLen: int): ptr UncheckedArray[char] =
when compileOption("threads"):
cast[ptr UncheckedArray[char]](reallocShared0(p, contentSize(oldLen), contentSize(newLen)) +! sizeof(NimStrPayloadBase))
else:
cast[ptr UncheckedArray[char]](realloc0(p, contentSize(oldLen), contentSize(newLen)) +! sizeof(NimStrPayloadBase))
proc resize(old: int): int {.inline.} =
if old <= 0: result = 4
elif old <= high(int16): result = old * 2
else: result = old * 3 div 2 # for large arrays * 3/2 is better
proc prepareAdd(s: var NimStringV3; addLen: int) {.compilerRtl.} =
let newLen = s.nimStrLenV3 + addLen
if isLiteral(s):
let oldP = s.p
# can't mutate a literal, so we need a fresh copy here:
s.p = allocPayload(newLen)
s.p.strCap = newLen
if s.nimStrLenV3 > 0:
# we are about to append
copyMem(unsafeAddr s.p[0], unsafeAddr oldP[0], min(s.nimStrLenV3, newLen))
else:
if s.p != nil:
let oldCap = s.p.strCap
if newLen > oldCap:
let newCap = max(newLen, resize(oldCap))
s.p = reallocPayload(strHead(s.p), newCap)
s.p.strCap = newCap
if newLen < newCap:
zeroMem(cast[pointer](addr s.p[newLen]), newCap - newLen)
else:
s.p = allocPayload(newLen)
s.p.strCap = newLen
proc nimAddCharV1(s: var NimStringV3; c: char) {.compilerRtl, inl.} =
#if (s.p == nil) or (s.len+1 > s.p.cap and not strlitFlag):
prepareAdd(s, 1)
s.p[s.nimStrLenV3] = c
incRawLen s
proc toNimStr(str: cstring, len: int): NimStringV3 {.compilerproc.} =
if len <= 0:
result = NimStringV3(rawlen: 0, p: nil)
else:
var p = allocPayload(len)
p.strCap = len
copyMem(unsafeAddr p[0], str, len)
result = NimStringV3(rawlen: toRawLen(len), p: p)
proc cstrToNimstr(str: cstring): NimStringV3 {.compilerRtl.} =
if str == nil: toNimStr(str, 0)
else: toNimStr(str, str.len)
proc nimToCStringConv(s: NimStringV3): cstring {.compilerproc, nonReloadable, inline.} =
if s.nimStrLenV3 == 0: result = cstring""
else:
## TODO: fixme: inject conversions somewhere else and be cleaned up
## but let it leak for now
let len = s.nimStrLenV3
result = cast[cstring](allocShared0(len+1))
copyMem(result, unsafeAddr s.p[0], len)
proc appendString(dest: var NimStringV3; src: NimStringV3) {.compilerproc, inline.} =
if src.nimStrLenV3 > 0:
copyMem(unsafeAddr dest.p[dest.nimStrLenV3], unsafeAddr src.p[0], src.nimStrLenV3)
incRawLen(dest, src.nimStrLenV3)
proc appendChar(dest: var NimStringV3; c: char) {.compilerproc, inline.} =
dest.p[dest.nimStrLenV3] = c
incRawLen(dest)
proc rawNewString(space: int): NimStringV3 {.compilerproc.} =
# this is also 'system.newStringOfCap'.
if space <= 0:
result = NimStringV3(rawlen: 0, p: nil)
else:
var p = allocPayload(space)
p.strCap = space
result = NimStringV3(rawlen: 0, p: p)
proc mnewString(len: int): NimStringV3 {.compilerproc.} =
if len <= 0:
result = NimStringV3(rawlen: 0, p: nil)
else:
var p = allocPayload0(len)
p.strCap = len
result = NimStringV3(rawlen: toRawLen(len), p: p)
proc setLengthStrV2(s: var NimStringV3, newLen: int) {.compilerRtl.} =
if newLen == 0:
discard "do not free the buffer here, pattern 's.setLen 0' is common for avoiding allocations"
else:
if isLiteral(s):
let oldP = s.p
s.p = allocPayload(newLen)
s.p.strCap = newLen
if s.nimStrLenV3 > 0:
copyMem(unsafeAddr s.p[0], unsafeAddr oldP[0], min(s.nimStrLenV3, newLen))
if newLen > s.nimStrLenV3:
zeroMem(cast[pointer](addr s.p[s.nimStrLenV3]), newLen - s.nimStrLenV3)
else:
zeroMem(cast[pointer](addr s.p[0]), newLen)
elif newLen > s.nimStrLenV3:
if s.p != nil:
let oldCap = s.p.strCap
if newLen > oldCap:
let newCap = max(newLen, resize(oldCap))
s.p = reallocPayload0(strHead(s.p), oldCap, newCap)
s.p.strCap = newCap
else:
s.p = allocPayload0(newLen)
s.p.strCap = newLen
setRawLen(s, newLen)
proc nimAsgnStrV2(a: var NimStringV3, b: NimStringV3) {.compilerRtl.} =
if a.p == b.p: return
if isLiteral(b):
# we can shallow copy literals:
frees(a)
a.rawlen = b.rawlen
a.p = b.p
else:
if isLiteral(a) or a.p == nil or a.p.strCap < b.nimStrLenV3:
# we have to allocate the 'cap' here, consider
# 'let y = newStringOfCap(); var x = y'
# on the other hand... These get turned into moves now.
frees(a)
a.p = allocPayload(b.nimStrLenV3)
a.p.strCap = b.nimStrLenV3
a.rawlen = b.rawlen
copyMem(unsafeAddr a.p[0], unsafeAddr b.p[0], b.nimStrLenV3)
proc nimPrepareStrMutationImpl(s: var NimStringV3) =
let oldP = s.p
# can't mutate a literal, so we need a fresh copy here:
s.p = allocPayload(s.nimStrLenV3)
s.p.strCap = s.nimStrLenV3
s.rawlen = s.rawlen and (not 1)
copyMem(unsafeAddr s.p[0], unsafeAddr oldP[0], s.nimStrLenV3)
proc nimPrepareStrMutationV2(s: var NimStringV3) {.compilerRtl, inl.} =
if isLiteral(s):
nimPrepareStrMutationImpl(s)
proc prepareMutation*(s: var string) {.inline.} =
# string literals are "copy on write", so you need to call
# `prepareMutation` before modifying the strings via `addr`.
{.cast(noSideEffect).}:
let s = unsafeAddr s
nimPrepareStrMutationV2(cast[ptr NimStringV3](s)[])
proc nimAddStrV1(s: var NimStringV3; src: NimStringV3) {.compilerRtl, inl.} =
#if (s.p == nil) or (s.len+1 > s.p.cap and not strlitFlag):
prepareAdd(s, src.nimStrLenV3)
appendString s, src
proc nimDestroyStrV1(s: NimStringV3) {.compilerRtl, inl.} =
frees(s)
proc nimStrAtLe(s: string; idx: int; ch: char): bool {.compilerRtl, inl.} =
result = idx < s.len and s[idx] <= ch
func capacity*(self: string): int {.inline.} =
## Returns the current capacity of the string. Intern strings
## don't have a capacity and 0 will be returned
# See https://github.com/nim-lang/RFCs/issues/460
runnableExamples:
var str = newStringOfCap(cap = 42)
str.add "Nim"
assert str.capacity == 42
let str = cast[ptr NimStringV3](unsafeAddr self)
if isLiteral(str):
result = 0
else:
result = if str.p != nil: str.p.strCap else: 0