summary refs log tree commit diff stats
path: root/compiler/semthreads.nim
diff options
context:
space:
mode:
Diffstat (limited to 'compiler/semthreads.nim')
-rw-r--r--compiler/semthreads.nim316
1 files changed, 316 insertions, 0 deletions
diff --git a/compiler/semthreads.nim b/compiler/semthreads.nim
new file mode 100644
index 000000000..9d78123d6
--- /dev/null
+++ b/compiler/semthreads.nim
@@ -0,0 +1,316 @@
+#
+#
+#           The Nimrod Compiler
+#        (c) Copyright 2011 Andreas Rumpf
+#
+#    See the file "copying.txt", included in this
+#    distribution, for details about the copyright.
+#
+
+## Semantic analysis that deals with threads: Possible race conditions should
+## be reported some day.
+##
+## 
+## ========================
+## No heap sharing analysis
+## ========================
+##
+## The only crucial operation that can violate the heap invariants is the
+## write access. The analysis needs to distinguish between 'unknown', 'mine',
+## and 'theirs' memory and pointers. Assignments 'whatever <- unknown' are 
+## invalid, and so are 'theirs <- mine' but not 'mine <- theirs'. Since
+## strings and sequences are heap allocated they are affected too:
+##
+## .. code-block:: nimrod
+##   proc p() = 
+##     global = "alloc this string" # ugh!
+##
+## Thus the analysis is concerned with any type that contains a GC'ed
+## reference...
+## If the type system would distinguish between 'ref' and '!ref' and threads
+## could not have '!ref' as input parameters the analysis could simply need to
+## reject any write access to a global variable which contains GC'ed data.
+## However, '!ref' is not implemented yet and this scheme would be too
+## restrictive anyway.
+##
+## The assignment target is essential for the algorithm: only 
+## write access to heap locations and global variables are critical and need
+## to be checked. Access via 'var' parameters is no problem to analyse since
+## we need the arguments' locations in the analysis.
+##
+## However, this is tricky: 
+##  
+##  var x = globalVar     # 'x' points to 'theirs'
+##  while true:
+##    globalVar = x       # OK: 'theirs <- theirs'
+##    x = "new string"    # ugh: 'x is toUnknown'!
+##
+##  --> Solution: toUnknown is never allowed anywhere!
+##
+##
+## Beware that the same proc might need to be
+## analysed multiple times! Oh and watch out for recursion! Recursion is handled
+## by a stack of symbols that we are processing, if we come back to the same
+## symbol, we have to skip this check (assume no error in the recursive case).
+## However this is wrong. We need to check for the particular combination
+## of (procsym, threadOwner(arg1), threadOwner(arg2), ...)!
+
+import
+  ast, astalgo, strutils, hashes, options, msgs, idents, types, os,
+  renderer, tables
+
+type
+  TThreadOwner = enum
+    toUndefined, # not computed yet 
+    toVoid,      # no return type
+    toNil,       # cycle in computation or nil: can be overwritten
+    toTheirs,    # some other heap
+    toMine       # mine heap
+
+  TCall = object {.pure.}
+    callee: PSym              # what if callee is an indirect call?
+    args: seq[TThreadOwner]
+
+  PProcCtx = ref TProcCtx
+  TProcCtx = object {.pure.}
+    nxt: PProcCtx             # can be stacked
+    mapping: tables.TTable[int, TThreadOwner] # int = symbol ID
+    owner: PSym               # current owner
+
+var
+  computed = tables.initTable[TCall, TThreadOwner]()
+
+proc hash(c: TCall): THash =
+  result = hash(c.callee.id)
+  for a in items(c.args): result = result !& hash(ord(a))
+  result = !$result
+
+proc `==`(a, b: TCall): bool =
+  if a.callee != b.callee: return
+  if a.args.len != b.args.len: return
+  for i in 0..a.args.len-1:
+    if a.args[i] != b.args[i]: return
+  result = true
+
+proc newProcCtx(owner: PSym): PProcCtx =
+  assert owner != nil
+  new(result)
+  result.mapping = tables.InitTable[int, TThreadOwner]()
+  result.owner = owner
+
+proc analyse(c: PProcCtx, n: PNode): TThreadOwner
+
+proc analyseSym(c: PProcCtx, n: PNode): TThreadOwner =
+  var v = n.sym
+  result = c.mapping[v.id]
+  if result != toUndefined: return
+  case v.kind
+  of skVar:
+    if sfGlobal in v.flags:
+      result = if sfThreadVar in v.flags: toMine else: toTheirs
+    else:
+      result = toNil
+  of skTemp, skForVar: result = toNil
+  of skConst: result = toMine
+  of skParam: 
+    result = c.mapping[v.id]
+    if result == toUndefined:
+      InternalError(n.info, "param not set: " & v.name.s)
+  else:
+    result = toNil
+  c.mapping[v.id] = result
+
+proc lvalueSym(n: PNode): PNode =
+  result = n
+  while result.kind in {nkDotExpr, nkBracketExpr, nkDerefExpr, nkHiddenDeref}:
+    result = result.sons[0]
+
+proc writeAccess(c: PProcCtx, n: PNode, owner: TThreadOwner) =
+  if owner notin {toNil, toMine, toTheirs}:
+    InternalError(n.info, "writeAccess: " & $owner)
+  var a = lvalueSym(n)
+  if a.kind == nkSym: 
+    var v = a.sym
+    var lastOwner = analyseSym(c, a)
+    case lastOwner
+    of toNil:
+      c.mapping[v.id] = owner # fine, toNil can be overwritten
+    of toVoid, toUndefined: InternalError(n.info, "writeAccess")
+    of toTheirs, toMine:
+      if lastOwner != owner and owner != toNil:
+        LocalError(n.info, errDifferentHeaps)
+  else:
+    # we could not backtrack to a concrete symbol, but that's fine:
+    var lastOwner = analyseSym(c, n)
+    case lastOwner
+    of toNil: nil # fine, toNil can be overwritten
+    of toVoid, toUndefined: InternalError(n.info, "writeAccess")
+    of toTheirs, toMine:
+      if lastOwner != owner and owner != toNil:
+        LocalError(n.info, errDifferentHeaps)
+
+proc analyseAssign(c: PProcCtx, le, ri: PNode) =
+  var y = analyse(c, ri) # read access; ok
+  writeAccess(c, le, y)
+
+proc analyseAssign(c: PProcCtx, n: PNode) =
+  analyseAssign(c, n.sons[0], n.sons[1])
+
+proc analyseCall(c: PProcCtx, n: PNode): TThreadOwner =
+  var prc = n[0].sym
+  var newCtx = newProcCtx(prc)
+  var call: TCall
+  call.callee = prc
+  newSeq(call.args, n.len-1)
+  for i in 1..n.len-1:
+    call.args[i-1] = analyse(c, n[i])
+  if not computed.hasKey(call):
+    computed[call] = toUndefined # we are computing it
+    for i in 1..n.len-1: 
+      var formal = skipTypes(prc.typ, abstractInst).n.sons[i].sym 
+      newCtx.mapping[formal.id] = call.args[i-1]
+    pushInfoContext(n.info)
+    computed[call] = analyse(newCtx, prc.ast.sons[codePos])
+    popInfoContext()
+  else:
+    # ugh, cycle! We are already computing it but don't know the outcome yet...
+    if prc.typ.sons[0] == nil: result = toVoid
+    else: result = toNil
+
+proc analyseVarTuple(c: PProcCtx, n: PNode) =
+  if n.kind != nkVarTuple: InternalError(n.info, "analyseVarTuple")
+  var L = n.len
+  for i in countup(0, L-3): AnalyseAssign(c, n.sons[i], n.sons[L-1])
+
+proc analyseSingleVar(c: PProcCtx, a: PNode) =
+  if a.sons[2].kind != nkEmpty: AnalyseAssign(c, a.sons[0], a.sons[2])
+
+proc analyseVarSection(c: PProcCtx, n: PNode): TThreadOwner = 
+  for i in countup(0, sonsLen(n) - 1): 
+    var a = n.sons[i]
+    if a.kind == nkCommentStmt: continue 
+    if a.kind == nkIdentDefs: 
+      assert(a.sons[0].kind == nkSym)
+      analyseSingleVar(c, a)
+    else:
+      analyseVarTuple(c, a)
+  result = toVoid
+
+proc analyseConstSection(c: PProcCtx, t: PNode): TThreadOwner =
+  for i in countup(0, sonsLen(t) - 1): 
+    var it = t.sons[i]
+    if it.kind == nkCommentStmt: continue 
+    if it.kind != nkConstDef: InternalError(t.info, "analyseConstSection")
+    if sfFakeConst in it.sons[0].sym.flags: analyseSingleVar(c, it)
+  result = toVoid
+
+template aggregateOwner(result, ana: expr) =
+  var a = ana # eval once
+  if result != a:
+    if result == toNil: result = a
+    else: localError(n.info, errDifferentHeaps)
+
+proc analyse(c: PProcCtx, n: PNode): TThreadOwner =
+  case n.kind
+  of nkCall, nkInfix, nkPrefix, nkPostfix, nkCommand, 
+     nkCallStrLit, nkHiddenCallConv:
+    if n[0].kind != nkSym or n[0].sym.kind != skProc:
+      Message(n.info, warnAnalysisLoophole, renderTree(n))
+      result = toNil
+    else:
+      var prc = n[0].sym
+      # XXX create thread!?
+      case prc.magic
+      of mNew, mNewFinalize, mNewSeq, mSetLengthStr, mSetLengthSeq,
+          mAppendSeqElem, mReset, mAppendStrCh, mAppendStrStr:
+        writeAccess(c, n[1], toMine)
+        result = toVoid
+      of mSwap:
+        var a = analyse(c, n[2])
+        writeAccess(c, n[1], a)
+        writeAccess(c, n[2], a)
+        result = toVoid
+      else:
+        result = analyseCall(c, n)
+  of nkAsgn, nkFastAsgn:
+    analyseAssign(c, n)
+    result = toVoid
+  of nkSym: result = analyseSym(c, n)
+  of nkEmpty, nkNone: result = toVoid
+  of nkNilLit, nkCharLit..nkFloat64Lit: result = toNil
+  of nkStrLit..nkTripleStrLit: result = toMine
+  of nkDotExpr, nkBracketExpr, nkDerefExpr, nkHiddenDeref:
+    # field access:
+    # pointer deref or array access:
+    result = analyse(c, n.sons[0])    
+  of nkBind: result = analyse(c, n.sons[0])
+  of nkPar, nkCurly, nkBracket:
+    # container construction:
+    result = toNil # nothing until later
+    for i in 0..n.len-1: aggregateOwner(result, analyse(c, n[i]))
+  of nkAddr, nkHiddenAddr:
+    var a = lvalueSym(n)
+    if a.kind == nkSym:
+      result = analyseSym(c, a)
+      assert result in {toNil, toMine, toTheirs}
+      if result == toNil:
+        # assume toMine here for consistency:
+        c.mapping[a.sym.id] = toMine
+        result = toMine
+    else:
+      # should never really happen:
+      result = analyse(c, n.sons[0])
+  of nkIfExpr: 
+    result = toNil
+    for i in countup(0, sonsLen(n) - 1):
+      var it = n.sons[i]
+      case it.kind
+      of nkElifExpr:
+        discard analyse(c, it.sons[0])
+        aggregateOwner(result, analyse(c, it.sons[1]))
+      of nkElseExpr:
+        aggregateOwner(result, analyse(c, it.sons[0]))
+      else: internalError(n.info, "analyseIfExpr()")
+  of nkStmtListExpr, nkBlockExpr:
+    var n = if n.kind == nkBlockExpr: n.sons[1] else: n
+    var L = sonsLen(n)
+    for i in countup(0, L-2): discard analyse(c, n.sons[i])
+    if L > 0: result = analyse(c, n.sons[L-1])
+    else: result = toVoid
+  of nkHiddenStdConv, nkHiddenSubConv, nkConv, nkCast: 
+    result = analyse(c, n.sons[1])
+  of nkStringToCString, nkCStringToString, nkChckRangeF, nkChckRange64,
+     nkChckRange, nkCheckedFieldExpr, nkPassAsOpenArray, nkObjDownConv, 
+     nkObjUpConv:
+    result = analyse(c, n.sons[0])
+  of nkRaiseStmt:
+    var a = analyse(c, n.sons[0])
+    if a != toMine: LocalError(n.info, errDifferentHeaps)
+    result = toVoid
+  of nkVarSection: result = analyseVarSection(c, n)
+  of nkConstSection: result = analyseConstSection(c, n)
+  of nkTypeSection, nkCommentStmt: result = toVoid
+  of nkIfStmt, nkWhileStmt, nkTryStmt, nkCaseStmt, nkStmtList, nkBlockStmt:
+    for i in 0 .. <n.len: discard analyse(c, n[i])
+    result = toVoid
+  of nkBreakStmt, nkContinueStmt: result = toVoid
+  of nkReturnStmt, nkDiscardStmt: 
+    if n.sons[0].kind != nkEmpty: result = analyse(c, n.sons[0])
+    else: result = toVoid
+  of nkAsmStmt, nkPragma, nkIteratorDef, nkProcDef, nkMethodDef,
+     nkConverterDef, nkMacroDef, nkTemplateDef: 
+      result = toVoid
+  else: InternalError(n.info, "analysis not implemented for: " & $n.kind)
+
+proc AnalyseThread*(threadCreation: PNode) =
+  var n = threadCreation
+  # thread proc is second param of ``createThread``:
+  if n[2].kind != nkSym or n[2].sym.kind != skProc:
+    Message(n.info, warnAnalysisLoophole, renderTree(n))
+    return
+  var prc = n[2].sym
+  var c = newProcCtx(prc)
+  var formal = skipTypes(prc.typ, abstractInst).n.sons[1].sym 
+  c.mapping[formal.id] = toTheirs # thread receives foreign data!
+  discard analyse(c, prc.ast.sons[codePos])
+