diff options
author | Araq <rumpf_a@web.de> | 2012-12-02 11:11:54 +0100 |
---|---|---|
committer | Araq <rumpf_a@web.de> | 2012-12-02 11:11:54 +0100 |
commit | d7adc7c3289feae7de617953452eb71fb75f40da (patch) | |
tree | 330efde736e816c5b14e0a390c2deb8781b93401 /compiler | |
parent | 76885c754a8f51a0ea34f76dd0843b1949ac7fde (diff) | |
download | Nim-d7adc7c3289feae7de617953452eb71fb75f40da.tar.gz |
dont use unsafeNew in ropes.nim for now
Diffstat (limited to 'compiler')
-rwxr-xr-x | compiler/ropes.nim | 757 |
1 files changed, 512 insertions, 245 deletions
diff --git a/compiler/ropes.nim b/compiler/ropes.nim index af05c68a7..f27bf70f7 100755 --- a/compiler/ropes.nim +++ b/compiler/ropes.nim @@ -66,54 +66,49 @@ type # performance of the code generator (assignments # copy the format strings # though it is not necessary) - PRope* = ref TRope - TRope*{.acyclic.} = object of TObject # the empty rope is represented - # by nil to safe space - left, right: PRope - L: int # < 0 if a leaf - d: array [0..PayloadSize, char] # != nil if a leaf - - TRopeSeq* = seq[PRope] - -proc con*(a, b: PRope): PRope -proc con*(a: PRope, b: string): PRope -proc con*(a: string, b: PRope): PRope -proc con*(a: varargs[PRope]): PRope -proc app*(a: var PRope, b: PRope) -proc app*(a: var PRope, b: string) -proc prepend*(a: var PRope, b: PRope) -proc toRope*(s: string): PRope -proc toRope*(i: BiggestInt): PRope -proc ropeLen*(a: PRope): int -proc writeRopeIfNotEqual*(r: PRope, filename: string): bool -proc ropeToStr*(p: PRope): string -proc ropef*(frmt: TFormatStr, args: varargs[PRope]): PRope -proc appf*(c: var PRope, frmt: TFormatStr, args: varargs[PRope]) -proc RopeEqualsFile*(r: PRope, f: string): bool - # returns true if the rope r is the same as the contents of file f -proc RopeInvariant*(r: PRope): bool - # exported for debugging -# implementation - -proc ropeLen(a: PRope): int = - if a == nil: result = 0 - else: result = a.L.abs - -proc newRope(data: string = nil): PRope = - if data != nil: - unsafeNew(result, sizeof(TRope)-PayloadSize+len(data)) - result.L = -len(data) - # copy including '\0': - copyMem(addr result.d, cstring(data), len(data)) - else: - unsafeNew(result, sizeof(TRope)-PayloadSize) - -proc eqContent(r: PRope, s: string): bool = - assert r.L < 0 - if -r.L == s.len: - result = equalMem(addr(r.d), cstring(s), s.len) - -when false: + +when true: + # working version: + type + PRope* = ref TRope + TRope*{.acyclic.} = object of TObject # the empty rope is represented + # by nil to safe space + left*, right*: PRope + length*: int + data*: string # != nil if a leaf + + TRopeSeq* = seq[PRope] + + proc con*(a, b: PRope): PRope + proc con*(a: PRope, b: string): PRope + proc con*(a: string, b: PRope): PRope + proc con*(a: varargs[PRope]): PRope + proc app*(a: var PRope, b: PRope) + proc app*(a: var PRope, b: string) + proc prepend*(a: var PRope, b: PRope) + proc toRope*(s: string): PRope + proc toRope*(i: BiggestInt): PRope + proc ropeLen*(a: PRope): int + proc writeRopeIfNotEqual*(r: PRope, filename: string): bool + proc ropeToStr*(p: PRope): string + proc ropef*(frmt: TFormatStr, args: varargs[PRope]): PRope + proc appf*(c: var PRope, frmt: TFormatStr, args: varargs[PRope]) + proc RopeEqualsFile*(r: PRope, f: string): bool + # returns true if the rope r is the same as the contents of file f + proc RopeInvariant*(r: PRope): bool + # exported for debugging + # implementation + + proc ropeLen(a: PRope): int = + if a == nil: result = 0 + else: result = a.length + + proc newRope(data: string = nil): PRope = + new(result) + if data != nil: + result.length = len(data) + result.data = data + proc newMutableRope*(capacity = 30): PRope = ## creates a new rope that supports direct modifications of the rope's ## 'data' and 'length' fields. @@ -123,204 +118,476 @@ when false: proc freezeMutableRope*(r: PRope) {.inline.} = r.length = r.data.len -var - cache: array[0..2048*2 -1, PRope] - -proc RopeInvariant(r: PRope): bool = - if r == nil: - result = true - else: - result = true # - # if r.data <> snil then - # result := true - # else begin - # result := (r.left <> nil) and (r.right <> nil); - # if result then result := ropeInvariant(r.left); - # if result then result := ropeInvariant(r.right); - # end - -proc insertInCache(s: string): PRope = - var h = hash(s) and high(cache) - result = cache[h] - if isNil(result) or not eqContent(result, s): - result = newRope(s) - cache[h] = result - -proc toRope(s: string): PRope = - if s.len == 0: + var + cache: array[0..2048*2 -1, PRope] + + proc RopeInvariant(r: PRope): bool = + if r == nil: + result = true + else: + result = true # + # if r.data <> snil then + # result := true + # else begin + # result := (r.left <> nil) and (r.right <> nil); + # if result then result := ropeInvariant(r.left); + # if result then result := ropeInvariant(r.right); + # end + + proc insertInCache(s: string): PRope = + var h = hash(s) and high(cache) + result = cache[h] + if isNil(result) or result.data != s: + result = newRope(s) + cache[h] = result + + proc toRope(s: string): PRope = + if s.len == 0: + result = nil + else: + result = insertInCache(s) + assert(RopeInvariant(result)) + + proc RopeSeqInsert(rs: var TRopeSeq, r: PRope, at: Natural) = + var length = len(rs) + if at > length: + setlen(rs, at + 1) + else: + setlen(rs, length + 1) # move old rope elements: + for i in countdown(length, at + 1): + rs[i] = rs[i - 1] # this is correct, I used pen and paper to validate it + rs[at] = r + + proc newRecRopeToStr(result: var string, resultLen: var int, r: PRope) = + var stack = @[r] + while len(stack) > 0: + var it = pop(stack) + while it.data == nil: + add(stack, it.right) + it = it.left + assert(it.data != nil) + CopyMem(addr(result[resultLen]), addr(it.data[0]), it.length) + Inc(resultLen, it.length) + assert(resultLen <= len(result)) + + proc ropeToStr(p: PRope): string = + if p == nil: + result = "" + else: + result = newString(p.length) + var resultLen = 0 + newRecRopeToStr(result, resultLen, p) + + proc con(a, b: PRope): PRope = + if a == nil: result = b + elif b == nil: result = a + else: + result = newRope() + result.length = a.length + b.length + result.left = a + result.right = b + + proc con(a: PRope, b: string): PRope = result = con(a, toRope(b)) + proc con(a: string, b: PRope): PRope = result = con(toRope(a), b) + + proc con(a: varargs[PRope]): PRope = + for i in countup(0, high(a)): result = con(result, a[i]) + + proc toRope(i: BiggestInt): PRope = result = toRope($i) + + proc app(a: var PRope, b: PRope) = a = con(a, b) + proc app(a: var PRope, b: string) = a = con(a, b) + proc prepend(a: var PRope, b: PRope) = a = con(b, a) + + proc writeRope*(f: TFile, c: PRope) = + var stack = @[c] + while len(stack) > 0: + var it = pop(stack) + while it.data == nil: + add(stack, it.right) + it = it.left + assert(it != nil) + assert(it.data != nil) + write(f, it.data) + + proc WriteRope*(head: PRope, filename: string, useWarning = false) = + var f: tfile + if open(f, filename, fmWrite): + if head != nil: WriteRope(f, head) + close(f) + else: + rawMessage(if useWarning: warnCannotOpenFile else: errCannotOpenFile, + filename) + + proc ropef(frmt: TFormatStr, args: varargs[PRope]): PRope = + var i = 0 + var length = len(frmt) result = nil - else: - result = insertInCache(s) - assert(RopeInvariant(result)) - -proc RopeSeqInsert(rs: var TRopeSeq, r: PRope, at: Natural) = - var length = len(rs) - if at > length: - setlen(rs, at + 1) - else: - setlen(rs, length + 1) # move old rope elements: - for i in countdown(length, at + 1): - rs[i] = rs[i - 1] # this is correct, I used pen and paper to validate it - rs[at] = r - -proc newRecRopeToStr(result: var string, resultLen: var int, r: PRope) = - var stack = @[r] - while len(stack) > 0: - var it = pop(stack) - while it.L >= 0: - add(stack, it.right) - it = it.left - assert(it.L < 0) - CopyMem(addr(result[resultLen]), addr(it.d[0]), -it.L) - Inc(resultLen, -it.L) - assert(resultLen <= len(result)) - -proc ropeToStr(p: PRope): string = - if p == nil: - result = "" - else: - result = newString(p.L.abs) - var resultLen = 0 - newRecRopeToStr(result, resultLen, p) - -proc con(a, b: PRope): PRope = - if a == nil: result = b - elif b == nil: result = a - else: - result = newRope() - result.L = a.L.abs + b.L.abs - result.left = a - result.right = b - -proc con(a: PRope, b: string): PRope = result = con(a, toRope(b)) -proc con(a: string, b: PRope): PRope = result = con(toRope(a), b) - -proc con(a: varargs[PRope]): PRope = - for i in countup(0, high(a)): result = con(result, a[i]) - -proc toRope(i: BiggestInt): PRope = result = toRope($i) - -proc app(a: var PRope, b: PRope) = a = con(a, b) -proc app(a: var PRope, b: string) = a = con(a, b) -proc prepend(a: var PRope, b: PRope) = a = con(b, a) - -proc writeRope*(f: TFile, c: PRope) = - var stack = @[c] - while len(stack) > 0: - var it = pop(stack) - while it.L >= 0: - add(stack, it.right) - it = it.left - assert(it != nil) - assert(it.L < 0) - write(f, cstring(it.d), -it.L) - -proc WriteRope*(head: PRope, filename: string, useWarning = false) = - var f: tfile - if open(f, filename, fmWrite): - if head != nil: WriteRope(f, head) - close(f) - else: - rawMessage(if useWarning: warnCannotOpenFile else: errCannotOpenFile, - filename) - -proc ropef(frmt: TFormatStr, args: varargs[PRope]): PRope = - var i = 0 - var length = len(frmt) - result = nil - var num = 0 - while i <= length - 1: - if frmt[i] == '$': - inc(i) # skip '$' - case frmt[i] - of '$': - app(result, "$") - inc(i) - of '#': - inc(i) - app(result, args[num]) - inc(num) - of '0'..'9': - var j = 0 - while true: - j = (j * 10) + Ord(frmt[i]) - ord('0') + var num = 0 + while i <= length - 1: + if frmt[i] == '$': + inc(i) # skip '$' + case frmt[i] + of '$': + app(result, "$") + inc(i) + of '#': inc(i) - if (i > length + 0 - 1) or not (frmt[i] in {'0'..'9'}): break - num = j - if j > high(args) + 1: - internalError("ropes: invalid format string $" & $(j)) - else: - app(result, args[j - 1]) - of 'n': - if optLineDir notin gOptions: app(result, tnl) - inc i - of 'N': - app(result, tnl) + app(result, args[num]) + inc(num) + of '0'..'9': + var j = 0 + while true: + j = (j * 10) + Ord(frmt[i]) - ord('0') + inc(i) + if (i > length + 0 - 1) or not (frmt[i] in {'0'..'9'}): break + num = j + if j > high(args) + 1: + internalError("ropes: invalid format string $" & $(j)) + else: + app(result, args[j - 1]) + of 'n': + if optLineDir notin gOptions: app(result, tnl) + inc i + of 'N': + app(result, tnl) + inc(i) + else: InternalError("ropes: invalid format string $" & frmt[i]) + var start = i + while i < length: + if frmt[i] != '$': inc(i) + else: break + if i - 1 >= start: + app(result, substr(frmt, start, i - 1)) + assert(RopeInvariant(result)) + + proc appf(c: var PRope, frmt: TFormatStr, args: varargs[PRope]) = + app(c, ropef(frmt, args)) + + const + bufSize = 1024 # 1 KB is reasonable + + proc auxRopeEqualsFile(r: PRope, bin: var tfile, buf: Pointer): bool = + if r.data != nil: + if r.length > bufSize: + internalError("ropes: token too long") + return + var readBytes = readBuffer(bin, buf, r.length) + result = readBytes == r.length and + equalMem(buf, addr(r.data[0]), r.length) # BUGFIX + else: + result = auxRopeEqualsFile(r.left, bin, buf) + if result: result = auxRopeEqualsFile(r.right, bin, buf) + + proc RopeEqualsFile(r: PRope, f: string): bool = + var bin: tfile + result = open(bin, f) + if not result: + return # not equal if file does not exist + var buf = alloc(BufSize) + result = auxRopeEqualsFile(r, bin, buf) + if result: + result = readBuffer(bin, buf, bufSize) == 0 # really at the end of file? + dealloc(buf) + close(bin) + + proc crcFromRopeAux(r: PRope, startVal: TCrc32): TCrc32 = + if r.data != nil: + result = startVal + for i in countup(0, len(r.data) - 1): + result = updateCrc32(r.data[i], result) + else: + result = crcFromRopeAux(r.left, startVal) + result = crcFromRopeAux(r.right, result) + + proc newCrcFromRopeAux(r: PRope, startVal: TCrc32): TCrc32 = + # XXX profiling shows this is actually expensive + var stack: TRopeSeq = @[r] + result = startVal + while len(stack) > 0: + var it = pop(stack) + while it.data == nil: + add(stack, it.right) + it = it.left + assert(it.data != nil) + var i = 0 + var L = len(it.data) + while i < L: + result = updateCrc32(it.data[i], result) inc(i) - else: InternalError("ropes: invalid format string $" & frmt[i]) - var start = i - while i < length: - if frmt[i] != '$': inc(i) - else: break - if i - 1 >= start: - app(result, substr(frmt, start, i - 1)) - assert(RopeInvariant(result)) - -proc appf(c: var PRope, frmt: TFormatStr, args: varargs[PRope]) = - app(c, ropef(frmt, args)) - -const - bufSize = 1024 # 1 KB is reasonable - -proc auxRopeEqualsFile(r: PRope, bin: var tfile, buf: Pointer): bool = - if r.L < 0: - if -r.L > bufSize: - internalError("ropes: token too long") - return - var readBytes = readBuffer(bin, buf, -r.L) - result = readBytes == -r.L and - equalMem(buf, addr(r.d[0]), readBytes) - else: - result = auxRopeEqualsFile(r.left, bin, buf) - if result: result = auxRopeEqualsFile(r.right, bin, buf) - -proc RopeEqualsFile(r: PRope, f: string): bool = - var bin: tfile - result = open(bin, f) - if not result: - return # not equal if file does not exist - var buf = alloc(BufSize) - result = auxRopeEqualsFile(r, bin, buf) - if result: - result = readBuffer(bin, buf, bufSize) == 0 # really at the end of file? - dealloc(buf) - close(bin) - -proc newCrcFromRopeAux(r: PRope, startVal: TCrc32): TCrc32 = - # XXX profiling shows this is actually expensive - var stack: TRopeSeq = @[r] - result = startVal - while len(stack) > 0: - var it = pop(stack) - while it.L >= 0: - add(stack, it.right) - it = it.left - assert(it.L < 0) + + proc crcFromRope(r: PRope): TCrc32 = + result = newCrcFromRopeAux(r, initCrc32) + + proc writeRopeIfNotEqual(r: PRope, filename: string): bool = + # returns true if overwritten + var c: TCrc32 + c = crcFromFile(filename) + if c != crcFromRope(r): + writeRope(r, filename) + result = true + else: + result = false + +else: + # optimized but broken version: + + type + PRope* = ref TRope + TRope*{.acyclic.} = object of TObject # the empty rope is represented + # by nil to safe space + left, right: PRope + L: int # < 0 if a leaf + d: array [0..PayloadSize, char] # != nil if a leaf + + TRopeSeq* = seq[PRope] + + proc con*(a, b: PRope): PRope + proc con*(a: PRope, b: string): PRope + proc con*(a: string, b: PRope): PRope + proc con*(a: varargs[PRope]): PRope + proc app*(a: var PRope, b: PRope) + proc app*(a: var PRope, b: string) + proc prepend*(a: var PRope, b: PRope) + proc toRope*(s: string): PRope + proc toRope*(i: BiggestInt): PRope + proc ropeLen*(a: PRope): int + proc writeRopeIfNotEqual*(r: PRope, filename: string): bool + proc ropeToStr*(p: PRope): string + proc ropef*(frmt: TFormatStr, args: varargs[PRope]): PRope + proc appf*(c: var PRope, frmt: TFormatStr, args: varargs[PRope]) + proc RopeEqualsFile*(r: PRope, f: string): bool + # returns true if the rope r is the same as the contents of file f + proc RopeInvariant*(r: PRope): bool + # exported for debugging + # implementation + + proc ropeLen(a: PRope): int = + if a == nil: result = 0 + else: result = a.L.abs + + proc newRope(data: string = nil): PRope = + if data != nil: + unsafeNew(result, sizeof(TRope)-PayloadSize+len(data)+1) + result.L = -len(data) + # copy including '\0': + copyMem(addr result.d, cstring(data), len(data)) + else: + unsafeNew(result, sizeof(TRope)-PayloadSize+1) + + proc eqContent(r: PRope, s: string): bool = + assert r.L < 0 + if -r.L == s.len: + result = equalMem(addr(r.d), cstring(s), s.len) + + when false: + proc newMutableRope*(capacity = 30): PRope = + ## creates a new rope that supports direct modifications of the rope's + ## 'data' and 'length' fields. + new(result) + result.data = newStringOfCap(capacity) + + proc freezeMutableRope*(r: PRope) {.inline.} = + r.length = r.data.len + + var + cache: array[0..2048*2 -1, PRope] + + proc RopeInvariant(r: PRope): bool = + if r == nil: + result = true + else: + result = true # + # if r.data <> snil then + # result := true + # else begin + # result := (r.left <> nil) and (r.right <> nil); + # if result then result := ropeInvariant(r.left); + # if result then result := ropeInvariant(r.right); + # end + + proc insertInCache(s: string): PRope = + var h = hash(s) and high(cache) + result = cache[h] + if isNil(result) or not eqContent(result, s): + result = newRope(s) + cache[h] = result + + proc toRope(s: string): PRope = + if s.len == 0: + result = nil + else: + result = insertInCache(s) + assert(RopeInvariant(result)) + + proc RopeSeqInsert(rs: var TRopeSeq, r: PRope, at: Natural) = + var length = len(rs) + if at > length: + setlen(rs, at + 1) + else: + setlen(rs, length + 1) # move old rope elements: + for i in countdown(length, at + 1): + rs[i] = rs[i - 1] # this is correct, I used pen and paper to validate it + rs[at] = r + + proc newRecRopeToStr(result: var string, resultLen: var int, r: PRope) = + var stack = @[r] + while len(stack) > 0: + var it = pop(stack) + while it.L >= 0: + add(stack, it.right) + it = it.left + assert(it.L < 0) + CopyMem(addr(result[resultLen]), addr(it.d[0]), -it.L) + Inc(resultLen, -it.L) + assert(resultLen <= len(result)) + + proc ropeToStr(p: PRope): string = + if p == nil: + result = "" + else: + result = newString(p.L.abs) + var resultLen = 0 + newRecRopeToStr(result, resultLen, p) + + proc con(a, b: PRope): PRope = + if a == nil: result = b + elif b == nil: result = a + else: + result = newRope() + result.L = a.L.abs + b.L.abs + result.left = a + result.right = b + + proc con(a: PRope, b: string): PRope = result = con(a, toRope(b)) + proc con(a: string, b: PRope): PRope = result = con(toRope(a), b) + + proc con(a: varargs[PRope]): PRope = + for i in countup(0, high(a)): result = con(result, a[i]) + + proc toRope(i: BiggestInt): PRope = result = toRope($i) + + proc app(a: var PRope, b: PRope) = a = con(a, b) + proc app(a: var PRope, b: string) = a = con(a, b) + proc prepend(a: var PRope, b: PRope) = a = con(b, a) + + proc writeRope*(f: TFile, c: PRope) = + var stack = @[c] + while len(stack) > 0: + var it = pop(stack) + while it.L >= 0: + add(stack, it.right) + it = it.left + assert(it != nil) + assert(it.L < 0) + write(f, cstring(it.d), -it.L) + + proc WriteRope*(head: PRope, filename: string, useWarning = false) = + var f: tfile + if open(f, filename, fmWrite): + if head != nil: WriteRope(f, head) + close(f) + else: + rawMessage(if useWarning: warnCannotOpenFile else: errCannotOpenFile, + filename) + + proc ropef(frmt: TFormatStr, args: varargs[PRope]): PRope = var i = 0 - var L = -it.L - while i < L: - result = updateCrc32(it.d[i], result) - inc(i) - -proc crcFromRope(r: PRope): TCrc32 = - result = newCrcFromRopeAux(r, initCrc32) - -proc writeRopeIfNotEqual(r: PRope, filename: string): bool = - # returns true if overwritten - var c: TCrc32 - c = crcFromFile(filename) - if c != crcFromRope(r): - writeRope(r, filename) - result = true - else: - result = false + var length = len(frmt) + result = nil + var num = 0 + while i <= length - 1: + if frmt[i] == '$': + inc(i) # skip '$' + case frmt[i] + of '$': + app(result, "$") + inc(i) + of '#': + inc(i) + app(result, args[num]) + inc(num) + of '0'..'9': + var j = 0 + while true: + j = (j * 10) + Ord(frmt[i]) - ord('0') + inc(i) + if (i > length + 0 - 1) or not (frmt[i] in {'0'..'9'}): break + num = j + if j > high(args) + 1: + internalError("ropes: invalid format string $" & $(j)) + else: + app(result, args[j - 1]) + of 'n': + if optLineDir notin gOptions: app(result, tnl) + inc i + of 'N': + app(result, tnl) + inc(i) + else: InternalError("ropes: invalid format string $" & frmt[i]) + var start = i + while i < length: + if frmt[i] != '$': inc(i) + else: break + if i - 1 >= start: + app(result, substr(frmt, start, i - 1)) + assert(RopeInvariant(result)) + + proc appf(c: var PRope, frmt: TFormatStr, args: varargs[PRope]) = + app(c, ropef(frmt, args)) + + const + bufSize = 1024 # 1 KB is reasonable + + proc auxRopeEqualsFile(r: PRope, bin: var tfile, buf: Pointer): bool = + if r.L < 0: + if -r.L > bufSize: + internalError("ropes: token too long") + return + var readBytes = readBuffer(bin, buf, -r.L) + result = readBytes == -r.L and + equalMem(buf, addr(r.d[0]), readBytes) + else: + result = auxRopeEqualsFile(r.left, bin, buf) + if result: result = auxRopeEqualsFile(r.right, bin, buf) + + proc RopeEqualsFile(r: PRope, f: string): bool = + var bin: tfile + result = open(bin, f) + if not result: + return # not equal if file does not exist + var buf = alloc(BufSize) + result = auxRopeEqualsFile(r, bin, buf) + if result: + result = readBuffer(bin, buf, bufSize) == 0 # really at the end of file? + dealloc(buf) + close(bin) + + proc newCrcFromRopeAux(r: PRope, startVal: TCrc32): TCrc32 = + # XXX profiling shows this is actually expensive + var stack: TRopeSeq = @[r] + result = startVal + while len(stack) > 0: + var it = pop(stack) + while it.L >= 0: + add(stack, it.right) + it = it.left + assert(it.L < 0) + var i = 0 + var L = -it.L + while i < L: + result = updateCrc32(it.d[i], result) + inc(i) + + proc crcFromRope(r: PRope): TCrc32 = + result = newCrcFromRopeAux(r, initCrc32) + + proc writeRopeIfNotEqual(r: PRope, filename: string): bool = + # returns true if overwritten + var c: TCrc32 + c = crcFromFile(filename) + if c != crcFromRope(r): + writeRope(r, filename) + result = true + else: + result = false |