mirror of
https://github.com/nim-lang/Nim.git
synced 2025-12-28 17:04:41 +00:00
297 lines
9.0 KiB
Nim
297 lines
9.0 KiB
Nim
#
|
|
#
|
|
# The Nim Compiler
|
|
# (c) Copyright 2018 Andreas Rumpf
|
|
#
|
|
# See the file "copying.txt", included in this
|
|
# distribution, for details about the copyright.
|
|
#
|
|
|
|
## Layouter for nimpretty.
|
|
|
|
import idents, lexer, lineinfos, llstream, options, msgs, strutils,
|
|
pathutils
|
|
from os import changeFileExt
|
|
|
|
const
|
|
MaxLineLen = 80
|
|
LineCommentColumn = 30
|
|
|
|
type
|
|
SplitKind = enum
|
|
splitComma, splitParLe, splitAnd, splitOr, splitIn, splitBinary
|
|
|
|
SemicolonKind = enum
|
|
detectSemicolonKind, useSemicolon, dontTouch
|
|
|
|
Emitter* = object
|
|
config: ConfigRef
|
|
fid: FileIndex
|
|
lastTok: TTokType
|
|
inquote: bool
|
|
semicolons: SemicolonKind
|
|
col, lastLineNumber, lineSpan, indentLevel, indWidth: int
|
|
keepIndents*: int
|
|
doIndentMore*: int
|
|
content: string
|
|
indentStack: seq[int]
|
|
fixedUntil: int # marks where we must not go in the content
|
|
altSplitPos: array[SplitKind, int] # alternative split positions
|
|
|
|
proc openEmitter*(em: var Emitter, cache: IdentCache;
|
|
config: ConfigRef, fileIdx: FileIndex) =
|
|
let fullPath = Absolutefile config.toFullPath(fileIdx)
|
|
em.indWidth = getIndentWidth(fileIdx, llStreamOpen(fullPath, fmRead),
|
|
cache, config)
|
|
if em.indWidth == 0: em.indWidth = 2
|
|
em.config = config
|
|
em.fid = fileIdx
|
|
em.lastTok = tkInvalid
|
|
em.inquote = false
|
|
em.col = 0
|
|
em.content = newStringOfCap(16_000)
|
|
em.indentStack = newSeqOfCap[int](30)
|
|
em.indentStack.add 0
|
|
em.lastLineNumber = 1
|
|
|
|
proc closeEmitter*(em: var Emitter) =
|
|
if fileExists(em.config.outFile) and readFile(em.config.outFile.string) == em.content:
|
|
discard "do nothing, see #9499"
|
|
return
|
|
var f = llStreamOpen(em.config.outFile, fmWrite)
|
|
if f == nil:
|
|
rawMessage(em.config, errGenerated, "cannot open file: " & em.config.outFile.string)
|
|
return
|
|
f.llStreamWrite em.content
|
|
llStreamClose(f)
|
|
|
|
proc countNewlines(s: string): int =
|
|
result = 0
|
|
for i in 0..<s.len:
|
|
if s[i] == '\L': inc result
|
|
|
|
proc calcCol(em: var Emitter; s: string) =
|
|
var i = s.len-1
|
|
em.col = 0
|
|
while i >= 0 and s[i] != '\L':
|
|
dec i
|
|
inc em.col
|
|
|
|
template wr(x) =
|
|
em.content.add x
|
|
inc em.col, x.len
|
|
|
|
template goodCol(col): bool = col in 40..MaxLineLen
|
|
|
|
const
|
|
openPars = {tkParLe, tkParDotLe,
|
|
tkBracketLe, tkBracketLeColon, tkCurlyDotLe,
|
|
tkCurlyLe}
|
|
splitters = openPars + {tkComma, tkSemicolon}
|
|
oprSet = {tkOpr, tkDiv, tkMod, tkShl, tkShr, tkIn, tkNotin, tkIs,
|
|
tkIsnot, tkNot, tkOf, tkAs, tkDotDot, tkAnd, tkOr, tkXor}
|
|
|
|
template rememberSplit(kind) =
|
|
if goodCol(em.col):
|
|
em.altSplitPos[kind] = em.content.len
|
|
|
|
template moreIndent(em): int =
|
|
(if em.doIndentMore > 0: em.indWidth*2 else: em.indWidth)
|
|
|
|
proc softLinebreak(em: var Emitter, lit: string) =
|
|
# XXX Use an algorithm that is outlined here:
|
|
# https://llvm.org/devmtg/2013-04/jasper-slides.pdf
|
|
# +2 because we blindly assume a comma or ' &' might follow
|
|
if not em.inquote and em.col+lit.len+2 >= MaxLineLen:
|
|
if em.lastTok in splitters:
|
|
while em.content.len > 0 and em.content[em.content.high] == ' ':
|
|
setLen(em.content, em.content.len-1)
|
|
wr("\L")
|
|
em.col = 0
|
|
for i in 1..em.indentLevel+moreIndent(em): wr(" ")
|
|
else:
|
|
# search backwards for a good split position:
|
|
for a in em.altSplitPos:
|
|
if a > em.fixedUntil:
|
|
var spaces = 0
|
|
while a+spaces < em.content.len and em.content[a+spaces] == ' ':
|
|
inc spaces
|
|
if spaces > 0: delete(em.content, a, a+spaces-1)
|
|
let ws = "\L" & repeat(' ',em.indentLevel+moreIndent(em))
|
|
em.col = em.content.len - a
|
|
em.content.insert(ws, a)
|
|
break
|
|
|
|
proc emitTok*(em: var Emitter; L: TLexer; tok: TToken) =
|
|
|
|
template endsInWhite(em): bool =
|
|
em.content.len == 0 or em.content[em.content.high] in {' ', '\L'}
|
|
template endsInAlpha(em): bool =
|
|
em.content.len > 0 and em.content[em.content.high] in SymChars+{'_'}
|
|
|
|
proc emitComment(em: var Emitter; tok: TToken) =
|
|
let lit = strip fileSection(em.config, em.fid, tok.commentOffsetA, tok.commentOffsetB)
|
|
em.lineSpan = countNewlines(lit)
|
|
if em.lineSpan > 0: calcCol(em, lit)
|
|
if not endsInWhite(em):
|
|
wr(" ")
|
|
if em.lineSpan == 0 and max(em.col, LineCommentColumn) + lit.len <= MaxLineLen:
|
|
for i in 1 .. LineCommentColumn - em.col: wr(" ")
|
|
wr lit
|
|
|
|
if tok.tokType == tkComment and tok.literal.startsWith("#!nimpretty"):
|
|
case tok.literal
|
|
of "#!nimpretty off":
|
|
inc em.keepIndents
|
|
wr("\L")
|
|
em.lastLineNumber = tok.line + 1
|
|
of "#!nimpretty on":
|
|
dec em.keepIndents
|
|
em.lastLineNumber = tok.line
|
|
wr("\L")
|
|
#for i in 1 .. tok.indent: wr " "
|
|
wr tok.literal
|
|
em.col = 0
|
|
em.lineSpan = 0
|
|
return
|
|
|
|
var preventComment = false
|
|
if tok.tokType == tkComment and tok.line == em.lastLineNumber and tok.indent >= 0:
|
|
# we have an inline comment so handle it before the indentation token:
|
|
emitComment(em, tok)
|
|
preventComment = true
|
|
em.fixedUntil = em.content.high
|
|
|
|
elif tok.indent >= 0:
|
|
if em.lastTok in (splitters + oprSet) or em.keepIndents > 0:
|
|
em.indentLevel = tok.indent
|
|
else:
|
|
if tok.indent > em.indentStack[^1]:
|
|
em.indentStack.add tok.indent
|
|
else:
|
|
# dedent?
|
|
while em.indentStack.len > 1 and em.indentStack[^1] > tok.indent:
|
|
discard em.indentStack.pop()
|
|
em.indentLevel = em.indentStack.high * em.indWidth
|
|
#[ we only correct the indentation if it is not in an expression context,
|
|
so that code like
|
|
|
|
const splitters = {tkComma, tkSemicolon, tkParLe, tkParDotLe,
|
|
tkBracketLe, tkBracketLeColon, tkCurlyDotLe,
|
|
tkCurlyLe}
|
|
|
|
is not touched.
|
|
]#
|
|
# remove trailing whitespace:
|
|
while em.content.len > 0 and em.content[em.content.high] == ' ':
|
|
setLen(em.content, em.content.len-1)
|
|
wr("\L")
|
|
for i in 2..tok.line - em.lastLineNumber: wr("\L")
|
|
em.col = 0
|
|
for i in 1..em.indentLevel:
|
|
wr(" ")
|
|
em.fixedUntil = em.content.high
|
|
|
|
case tok.tokType
|
|
of tokKeywordLow..tokKeywordHigh:
|
|
if endsInAlpha(em):
|
|
wr(" ")
|
|
elif not em.inquote and not endsInWhite(em) and
|
|
em.lastTok notin openPars:
|
|
#and tok.tokType in oprSet
|
|
wr(" ")
|
|
|
|
if not em.inquote:
|
|
wr(TokTypeToStr[tok.tokType])
|
|
|
|
case tok.tokType
|
|
of tkAnd: rememberSplit(splitAnd)
|
|
of tkOr: rememberSplit(splitOr)
|
|
of tkIn, tkNotin:
|
|
rememberSplit(splitIn)
|
|
wr(" ")
|
|
else: discard
|
|
else:
|
|
# keywords in backticks are not normalized:
|
|
wr(tok.ident.s)
|
|
|
|
of tkColon:
|
|
wr(TokTypeToStr[tok.tokType])
|
|
wr(" ")
|
|
of tkSemicolon, tkComma:
|
|
wr(TokTypeToStr[tok.tokType])
|
|
rememberSplit(splitComma)
|
|
wr(" ")
|
|
of tkParDotLe, tkParLe, tkBracketDotLe, tkBracketLe,
|
|
tkCurlyLe, tkCurlyDotLe, tkBracketLeColon:
|
|
if tok.strongSpaceA > 0 and not em.endsInWhite:
|
|
wr(" ")
|
|
wr(TokTypeToStr[tok.tokType])
|
|
rememberSplit(splitParLe)
|
|
of tkParRi,
|
|
tkBracketRi, tkCurlyRi,
|
|
tkBracketDotRi,
|
|
tkCurlyDotRi,
|
|
tkParDotRi,
|
|
tkColonColon, tkDot:
|
|
wr(TokTypeToStr[tok.tokType])
|
|
of tkEquals:
|
|
if not em.inquote and not em.endsInWhite: wr(" ")
|
|
wr(TokTypeToStr[tok.tokType])
|
|
if not em.inquote: wr(" ")
|
|
of tkOpr, tkDotDot:
|
|
if tok.strongSpaceA == 0 and tok.strongSpaceB == 0:
|
|
# if not surrounded by whitespace, don't produce any whitespace either:
|
|
wr(tok.ident.s)
|
|
else:
|
|
if not em.endsInWhite: wr(" ")
|
|
wr(tok.ident.s)
|
|
template isUnary(tok): bool =
|
|
tok.strongSpaceB == 0 and tok.strongSpaceA > 0
|
|
|
|
if not isUnary(tok):
|
|
wr(" ")
|
|
rememberSplit(splitBinary)
|
|
of tkAccent:
|
|
if not em.inquote and endsInAlpha(em): wr(" ")
|
|
wr(TokTypeToStr[tok.tokType])
|
|
em.inquote = not em.inquote
|
|
of tkComment:
|
|
if not preventComment:
|
|
emitComment(em, tok)
|
|
of tkIntLit..tkStrLit, tkRStrLit, tkTripleStrLit, tkGStrLit, tkGTripleStrLit, tkCharLit:
|
|
let lit = fileSection(em.config, em.fid, tok.offsetA, tok.offsetB)
|
|
softLinebreak(em, lit)
|
|
if endsInAlpha(em) and tok.tokType notin {tkGStrLit, tkGTripleStrLit}: wr(" ")
|
|
em.lineSpan = countNewlines(lit)
|
|
if em.lineSpan > 0: calcCol(em, lit)
|
|
wr lit
|
|
of tkEof: discard
|
|
else:
|
|
let lit = if tok.ident != nil: tok.ident.s else: tok.literal
|
|
softLinebreak(em, lit)
|
|
if endsInAlpha(em): wr(" ")
|
|
wr lit
|
|
|
|
em.lastTok = tok.tokType
|
|
em.lastLineNumber = tok.line + em.lineSpan
|
|
em.lineSpan = 0
|
|
|
|
proc starWasExportMarker*(em: var Emitter) =
|
|
if em.content.endsWith(" * "):
|
|
setLen(em.content, em.content.len-3)
|
|
em.content.add("*")
|
|
dec em.col, 2
|
|
|
|
proc commaWasSemicolon*(em: var Emitter) =
|
|
if em.semicolons == detectSemicolonKind:
|
|
em.semicolons = if em.content.endsWith(", "): dontTouch else: useSemicolon
|
|
if em.semicolons == useSemicolon and em.content.endsWith(", "):
|
|
setLen(em.content, em.content.len-2)
|
|
em.content.add("; ")
|
|
|
|
proc curlyRiWasPragma*(em: var Emitter) =
|
|
if em.content.endsWith("}"):
|
|
setLen(em.content, em.content.len-1)
|
|
em.content.add(".}")
|