summary refs log tree commit diff stats
path: root/tools/trimcc.nim
blob: 41795e1aa2ac43d3217e851ed8bab67fdcd43dc9 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
# Trim C compiler installation to a minimum

import strutils, os, pegs, strtabs, math, times

const
  # Whitespace-separated list of bare file names (compiler executables, CRT
  # objects, runtime DLLs and common C headers). `main` seeds its whitelist
  # with every entry, so files with these names are never offered for
  # deletion. The whitelist table is case-insensitive, so spelling case does
  # not matter here.
  Essential = """gcc.exe g++.exe gdb.exe ld.exe as.exe c++.exe cpp.exe cc1.exe
crtbegin.o crtend.o crt2.o dllcrt2.o libgcc_s_dw2-1.dll libgcc_s_sjlj-1.dll
libgcc_s_seh-1.dll libexpat-1.dll libwinpthread-1.dll aio.h dlfcn.h fcntl.h
fenv.h fmtmsg.h fnmatch.h ftw.h errno.h glob.h gtmath.h if.h in.h ipc.h
langinfo.h locale.h math.h mman.h netdb.h nl_types.h poll.h pthread.h pwd.h
sched.h select.h semaphore.h signal.h socket.h spawn.h stat.h statvfs.h stdio.h
stdlib.h string.h strings.h tcp.h time.h types.h ucontext.h uio.h utsname.h
unistd.h wait.h varargs.h windows.h zlib.h
""".split

proc includes(headerpath, headerfile: string, whitelist: StringTableRef) =
  ## Scans the header at `headerpath` for `#include` directives.
  ##
  ## `headerfile` (the bare name of that header) is marked "processed" in
  ## `whitelist` before the file is read. Every included file is then recorded
  ## under its bare file name as "found", unless it is already "processed".
  # A whole line must match: optional whitespace/comments, `#include`, a
  # quoted or angle-bracketed target (captured), optional trailing
  # whitespace/comments.
  let includeDirective = peg"""s <- ws '#include' ws ('"' / '<') {[^">]+} ('"' / '>') ws
                     comment <- '/*' @ '*/' / '//' .*
                     ws <- (comment / \s+)* """
  whitelist[headerfile] = "processed"
  for text in lines(headerpath):
    if text =~ includeDirective:
      # Only the file-name part of the include target is used as the key.
      let referenced = extractFilename(matches[0])
      let alreadyDone = whitelist.getOrDefault(referenced) == "processed"
      if not alreadyDone:
        whitelist[referenced] = "found"

proc processIncludes(dir: string, whitelist: StringTableRef) =
  ## Walks `dir` recursively and grows `whitelist` from what it finds.
  ##
  ## * A file is marked "found" (unless already "processed") when its path
  ##   contains "c++", or when its name has no '.' and its path contains
  ##   "include".
  ## * A `.h` file whose whitelist state is "found" is scanned with
  ##   `includes`, which marks it "processed" and records what it includes.
  for entryKind, entry in walkDir(dir):
    if entryKind == pcDir:
      processIncludes(entry, whitelist)
    elif entryKind == pcFile:
      let base = extractFilename(entry)
      let extensionless = ('.' notin base) and ("include" in entry)
      if (extensionless or ("c++" in entry)) and
          whitelist.getOrDefault(base) != "processed":
        whitelist[base] = "found"
      # Looked up again on purpose: the step above may just have set "found".
      if base.endsWith(".h") and whitelist.getOrDefault(base) == "found":
        includes(entry, base, whitelist)

proc gatherFiles(dir: string, whitelist: StringTableRef, result: var seq[string]) =
  ## Recursively appends to `result` the path of every file under `dir` that
  ## is a candidate for deletion, i.e. is not whitelisted.
  ##
  ## A file counts as whitelisted when either its bare file name or its full
  ## path (as produced by `walkDir`) is a key of `whitelist`. The path lookup
  ## matters because `trialDeletion` records files it proved to be required
  ## under their full path; checking only the name would offer those files
  ## for deletion again on every pass.
  for kind, path in walkDir(dir):
    case kind
    of pcFile:
      let protectedByName = whitelist.hasKey(extractFilename(path))
      if not (protectedByName or whitelist.hasKey(path)):
        result.add(path)
    of pcDir:
      gatherFiles(path, whitelist, result)
    else:
      # Symlinks are neither followed nor offered for deletion.
      discard

proc gatherEmptyFolders(dir: string, whitelist: StringTableRef, result: var seq[string]) =
  ## Recursively appends to `result` every folder at or below `dir` that has
  ## no entries at all.
  ##
  ## Sub-folders whose name or full path is a key of `whitelist` are not
  ## descended into and therefore never reported. The path lookup matters
  ## because `main` records folders it proved to be required under their full
  ## path; checking only the name would report them again on every pass.
  var empty = true
  for kind, path in walkDir(dir):
    case kind
    of pcFile:
      empty = false
    of pcDir:
      let name = splitPath(path).tail
      if not (whitelist.hasKey(name) or whitelist.hasKey(path)):
        gatherEmptyFolders(path, whitelist, result)
      empty = false
    of pcLinkToFile, pcLinkToDir:
      # A folder that holds only links is not empty: removing it would
      # destroy the links, and re-creating the folder cannot bring them back.
      empty = false
  if empty:
    result.add(dir)

proc newName(f: string): string =
  ## Returns the path `f` with `trim_` prepended to its file name; the
  ## directory part and the extension are kept unchanged.
  let parts = splitFile(f)
  # Join the directory with the prefix first, then append name and extension.
  result = parts.dir / "trim_"
  result.add(parts.name)
  result.add(parts.ext)

proc ccStillWorks(): bool =
  ## Runs a fixed sequence of shell commands (three `nim c` builds followed
  ## by the three resulting executables) and returns true only if every one
  ## exits with code 0. Execution stops at the first command that fails.
  const commands = [
    r"nim c --verbosity:0 --force_build koch",
    r"nim c --verbosity:0 --force_build --threads:on --out:tempOne.exe tools/trimcc",
    r"nim c --verbosity:0 --force_build --threads:on --out:tempTwo.exe tools/fakeDeps",
    r".\koch.exe",
    r".\tempOne.exe",
    r".\tempTwo.exe"
  ]
  for cmd in commands:
    if execShellCmd(cmd) != 0:
      return false
  return true

proc trialDeletion(files: seq[string], a, b: int, whitelist: StringTableRef): bool =
  ## Tries to delete the batch `files[a .. min(b, files.high)]`.
  ##
  ## Each file is first renamed to its `newName` (a `trim_` prefix), then
  ## `ccStillWorks` is run:
  ##
  ## * if it succeeds, the renamed files are deleted and reported as
  ##   "Optional";
  ## * if it fails, every file is renamed back and reported as "Required".
  ##   When the batch holds exactly one file, that file's path is added to
  ##   `whitelist`.
  ##
  ## Returns true only when the whole batch was deleted. An `OSError` raised
  ## while renaming a file back to its original name is not caught.
  result = true
  let last = min(b, files.high)
  let single = (a == last)

  # Move the batch aside. If one move fails, put back whatever was already
  # moved so the installation is left exactly as it was found.
  for i in a .. last:
    try:
      moveFile(dest=newName(files[i]), source=files[i])
    except OSError:
      for j in countdown(i - 1, a):
        moveFile(dest=files[j], source=newName(files[j]))
      return false

  # Test if compilation still works, even with the moved files.
  if ccStillWorks():
    for i in a .. last:
      let path = files[i]
      try:
        removeFile(newName(path))
        echo "Optional: ", path
      except OSError:
        # Could not delete this one: restore it, but keep going so the rest
        # of the batch is not left behind under its `trim_` name.
        echo "Warning, couldn't remove ", path
        moveFile(dest=path, source=newName(path))
        result = false
  else:
    for i in a .. last:
      let path = files[i]
      echo "Required: ", path
      moveFile(dest=path, source=newName(path))
      if single:
        # Only a batch of one proves that this particular file is needed.
        whitelist[path] = "found"
      result = false

proc main(dir: string) =
  ## Trims the compiler installation rooted at `dir` in three phases:
  ##
  ## 1. build a whitelist from `Essential` and from repeated
  ##    `processIncludes` runs, until the whitelist stops growing;
  ## 2. repeatedly gather the non-whitelisted files and trial-delete them in
  ##    batches whose size adapts to success or failure;
  ## 3. repeatedly remove empty folders for as long as a pass removes at
  ##    least one of them without breaking `ccStillWorks`.

  # Phase 1: files that must never be removed.
  var whitelist = newStringTable(modeCaseInsensitive)
  for e in Essential:
    whitelist[e] = "found"
  var sizeBefore = whitelist.len
  processIncludes(dir, whitelist)
  while whitelist.len != sizeBefore:
    sizeBefore = whitelist.len
    processIncludes(dir, whitelist)

  # Phase 2: delete files batch by batch.
  var finalPass = false
  while true:
    # Candidates are gathered afresh for every pass.
    var candidates = newSeq[string]()
    gatherFiles(dir, whitelist, candidates)

    # Every pass starts with batches of one; a batch never needs to be
    # larger than the number of candidates.
    let largestBatch = candidates.len
    var batch = 1

    var start = 0
    while start < candidates.len:
      let deleted = trialDeletion(candidates, start, start + batch - 1,
                                  whitelist)
      start += batch

      # Outside the final pass, double the batch after a success and halve
      # it after a failure.
      if not finalPass:
        batch =
          if deleted: min(batch * 2, largestBatch)
          else: max(batch div 2, 1)
      echo "Bucket size is now ", batch

    # One extra pass runs after a pass that ended with a batch size of one;
    # that extra pass keeps the batch size fixed and is the last one.
    if finalPass:
      break
    finalPass = (batch == 1)

  # Phase 3: remove empty folders until a pass removes none.
  var removedAny = true
  while removedAny:
    removedAny = false
    var vacant = newSeq[string]()
    gatherEmptyFolders(dir, whitelist, vacant)
    for folder in vacant:
      removeDir(folder)
      if ccStillWorks():
        removedAny = true
      else:
        # The folder is needed: put it back and remember it.
        createDir(folder)
        whitelist[folder] = "found"

# Entry point: expects exactly one argument, the C compiler directory.
# The usage message deliberately exits with QuitSuccess: `ccStillWorks`
# rebuilds this tool as tempOne.exe and runs it without arguments, and it
# requires that run to return exit code 0.
if paramCount() != 1:
  quit "Usage: trimcc c_compiler_directory", QuitSuccess
else:
  # Refuse to start trimming unless the toolchain works to begin with.
  doAssert ccStillWorks()
  main(paramStr(1))