diff options
author | Araq <rumpf_a@web.de> | 2011-04-18 23:41:31 +0200 |
---|---|---|
committer | Araq <rumpf_a@web.de> | 2011-04-18 23:41:31 +0200 |
commit | d1b766cec03277ac4086ddf7bd371d7bc20b2b4d (patch) | |
tree | 5967e085776933b5f4ea31a4669b77dc5a952423 | |
parent | 48dd9679bd2196369a8a6f93f6225ad730683c25 (diff) | |
download | Nim-d1b766cec03277ac4086ddf7bd371d7bc20b2b4d.tar.gz |
hashtables: 1st version; parseutils additions
-rw-r--r-- | lib/pure/collections/hashtables.nim | 146 | ||||
-rwxr-xr-x | lib/pure/parseutils.nim | 24 | ||||
-rwxr-xr-x | lib/system.nim | 6 | ||||
-rw-r--r-- | tests/accept/compile/ttempl4.nim | 4 | ||||
-rwxr-xr-x | web/news.txt | 1 |
5 files changed, 175 insertions, 6 deletions
diff --git a/lib/pure/collections/hashtables.nim b/lib/pure/collections/hashtables.nim new file mode 100644 index 000000000..1a78586ab --- /dev/null +++ b/lib/pure/collections/hashtables.nim @@ -0,0 +1,146 @@ +# +# +# Nimrod's Runtime Library +# (c) Copyright 2011 Andreas Rumpf, Dominik Picheta +# +# See the file "copying.txt", included in this +# distribution, for details about the copyright. +# + +## The ``hashtables`` module implements an efficient hash table that is +## a mapping from keys to values. + +import + os, hashes, strutils + +type + TKeyValuePair[A, B] = tuple[key: A, val: B] + TKeyValuePairSeq[A, B] = seq[TKeyValuePair[A, B]] + THashTable*[A, B] = object of TObject + counter: int + data: TKeyValuePairSeq[A, B] + + PHashTable*[A, B] = ref THashTable[A, B] ## use this type to declare tables + +proc len*[A, B](t: PHashTable[A, B]): int = + ## returns the number of keys in `t`. + result = t.counter + +iterator pairs*[A, B](t: PHashTable[A, B]): tuple[key: A, val: B] = + ## iterates over any (key, value) pair in the table `t`. + for h in 0..high(t.data): + if not isNil(t.data[h].key) and not isNil(t.data[h].val): + yield (t.data[h].key, t.data[h].val) + +const + growthFactor = 2 + startSize = 64 + +proc myhash[A](key: A): THash = + result = hashes.hash(key) + +proc myCmp[A](key: A, key2: A): bool = + result = cmp(key, key2) == 0 + +proc mustRehash(length, counter: int): bool = + assert(length > counter) + result = (length * 2 < counter * 3) or (length - counter < 4) + +proc nextTry(h, maxHash: THash): THash {.inline.} = + result = ((5 * h) + 1) and maxHash + +proc RawGet[A, B](t: PHashTable[A, B], key: A): int = + var h: THash = myhash(key) and high(t.data) # start with real hash value + while not isNil(t.data[h].key) and not isNil(t.data[h].val): + if mycmp(t.data[h].key, key): + return h + h = nextTry(h, high(t.data)) + result = -1 + +proc `[]`*[A, B](t: PHashTable[A, B], key: A): B = + ## retrieves the value at ``t[key]``. If `key` is not in `t`, + ## default empty value for the type `B` is returned + ## and no exception is raised. One can check with ``hasKey`` whether the key + ## exists. + var index = RawGet(t, key) + if index >= 0: result = t.data[index].val + +proc hasKey*[A, B](t: PHashTable[A, B], key: A): bool = + ## returns true iff `key` is in the table `t`. + result = rawGet(t, key) >= 0 + +proc RawInsert[A, B](t: PHashTable[A, B], data: var TKeyValuePairSeq[A, B], + key: A, val: B) = + var h: THash = myhash(key) and high(data) + while not isNil(data[h].key): + h = nextTry(h, high(data)) + data[h].key = key + data[h].val = val + +proc Enlarge[A, B](t: PHashTable[A, B]) = + var n: TKeyValuePairSeq[A, B] + newSeq(n, len(t.data) * growthFactor) + for i in countup(0, high(t.data)): + if not isNil(t.data[i].key): RawInsert(t, n, t.data[i].key, t.data[i].val) + swap(t.data, n) + +proc `[]=`*[A, B](t: PHashTable[A, B], key: A, val: B) = + ## puts a (key, value)-pair into `t`. + var index = RawGet(t, key) + if index >= 0: + t.data[index].val = val + else: + if mustRehash(len(t.data), t.counter): Enlarge(t) + RawInsert(t, t.data, key, val) + inc(t.counter) + +proc default[T](): T = nil + +proc del*[A, B](t: PHashTable[A, B], key: A) = + ## deletes `key` from hash table `t`. + var index = RawGet(t, key) + if index >= 0: + t.data[index].key = default[A]() + else: + raise newException(EInvalidIndex, "Key not found.") + +proc newHashTable*[A, B](): PHashTable[A, B] = + ## creates a new string table that is empty. + new(result) + result.counter = 0 + newSeq(result.data, startSize) + +proc `$`*[A, B](t: PHashTable[A, B]): string = + ## The `$` operator for string tables. + if t.len == 0: + result = "{:}" + else: + result = "{" + for key, val in pairs(t): + if result.len > 1: result.add(", ") + result.add($key) + result.add(": ") + result.add($val) + result.add("}") + +when isMainModule: + var table = newHashTable[string, float]() + table["test"] = 1.2345 + table["111"] = 1.000043 + echo table + table.del("111") + echo table + echo repr(table["111"]) + echo(repr(table["1212"])) + table["111"] = 1.5 + table["011"] = 67.9 + echo table + table.del("test") + table.del("111") + echo table + + + echo hash("test") + echo hash("test") + + diff --git a/lib/pure/parseutils.nim b/lib/pure/parseutils.nim index 07c54f88c..90bb5d79f 100755 --- a/lib/pure/parseutils.nim +++ b/lib/pure/parseutils.nim @@ -77,10 +77,12 @@ proc parseIdent*(s: string, ident: var string, start = 0): int = result = i-start proc parseToken*(s: string, token: var string, validChars: set[char], - start = 0): int {.inline.} = + start = 0): int {.inline, deprecated.} = ## parses a token and stores it in ``token``. Returns ## the number of the parsed characters or 0 in case of an error. A token ## consists of the characters in `validChars`. + ## + ## **Deprecated since version 0.8.12**: Use ``parseWhile`` instead. var i = start while s[i] in validChars: inc(i) result = i-start @@ -110,6 +112,26 @@ proc skipWhile*(s: string, toSkip: set[char], start = 0): int {.inline.} = ## Returns number of characters skipped. while s[result+start] in toSkip and s[result+start] != '\0': inc(result) +proc parseUntil*(s: string, token: var string, until: set[char], + start = 0): int {.inline.} = + ## parses a token and stores it in ``token``. Returns + ## the number of the parsed characters or 0 in case of an error. A token + ## consists of the characters notin `until`. + var i = start + while s[i] notin until: inc(i) + result = i-start + token = copy(s, start, i-1) + +proc parseWhile*(s: string, token: var string, validChars: set[char], + start = 0): int {.inline.} = + ## parses a token and stores it in ``token``. Returns + ## the number of the parsed characters or 0 in case of an error. A token + ## consists of the characters in `validChars`. + var i = start + while s[i] in validChars: inc(i) + result = i-start + token = copy(s, start, i-1) + {.push overflowChecks: on.} # this must be compiled with overflow checking turned on: proc rawParseInt(s: string, b: var biggestInt, start = 0): int = diff --git a/lib/system.nim b/lib/system.nim index 6490ce416..46ca5b61d 100755 --- a/lib/system.nim +++ b/lib/system.nim @@ -1717,10 +1717,10 @@ elif defined(ecmaScript) or defined(NimrodVM): if x < y: return -1 return 1 -proc quit*(errormsg: string) {.noReturn.} = - ## a shorthand for ``echo(errormsg); quit(quitFailure)``. +proc quit*(errormsg: string, errorcode = QuitFailure) {.noReturn.} = + ## a shorthand for ``echo(errormsg); quit(errorcode)``. echo(errormsg) - quit(quitFailure) + quit(errorcode) {.pop.} # checks {.pop.} # hints diff --git a/tests/accept/compile/ttempl4.nim b/tests/accept/compile/ttempl4.nim index 273605669..a5ad2000f 100644 --- a/tests/accept/compile/ttempl4.nim +++ b/tests/accept/compile/ttempl4.nim @@ -2,7 +2,7 @@ template `:=`(name, val: expr): stmt = var name = val -ha := 1 -hu := "ta-da" +ha := 1 * 4 +hu := "ta-da" == "ta-da" echo ha, hu diff --git a/web/news.txt b/web/news.txt index 3a35a9f21..ce48b4e90 100755 --- a/web/news.txt +++ b/web/news.txt @@ -49,6 +49,7 @@ Additions - Added ``smtp`` module. - Added ``re.findAll``, ``pegs.findAll``. - Added ``os.findExe``. +- Added ``parseutils.parseUntil`` and ``parseutils.parseWhile``. - Added ``strutils.align``, ``strutils.tokenize``, ``strutils.wordWrap``. - Pegs support a *captured search loop operator* ``{@}``. - Pegs support new built-ins: ``\letter``, ``\upper``, ``\lower``, |