From 07147a670a2ea537e8e221b0ac43a2c923962dac Mon Sep 17 00:00:00 2001 From: Kartik Agaram Date: Sun, 29 Apr 2018 23:48:49 -0700 Subject: 4236 - experimental script for parallel building https://www.reddit.com/r/oilshell/comments/8bg9t1/the_problem_of_make_inside_shell_scripts/dxroayn --- build4 | 284 +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 284 insertions(+) create mode 100755 build4 diff --git a/build4 b/build4 new file mode 100755 index 00000000..852d7185 --- /dev/null +++ b/build4 @@ -0,0 +1,284 @@ +#!/bin/sh +# Experimental alternative to build2 that can run steps in parallel if their +# dependencies are met. Caveats: +# +# 1. We rely on the OS to schedule steps, so thousands of independent tasks +# will likely be counter-productive. +# 2. Can run out of virtual memory if you spawn too many say $CC processes. +# 3. Compilation errors can cause the script to hang. +# 4. Ugly as heck! Really needs simpler versions to compare against. And +# even then, diff gets confused. +# 5. There's a mechanical difficulty: we use mktemp to reliably create +# temporary filenames, which has the side effect of also creating the +# files. So zero-size files are considered equivalent to empty files. +# When some commands have trouble with this (e.g. ar) we need to delete +# the empty file, which can expose us to a race condition wrt mktemp. + +set -e # stop immediately on error + +# Some environment variables that can be passed in. For example, to turn off +# optimization: +# $ CFLAGS=-g ./build2 +test "$CXX" || export CXX=c++ +test "$CC" || export CC=cc +test "$CFLAGS" || export CFLAGS="-g -O2" +export CFLAGS="$CFLAGS -Wall -Wextra -ftrapv -fno-strict-aliasing" + +# Outline: +# [0-9]*.cc -> mu.cc -> .build/*.cc -> .build/*.o -> .build/mu_bin +# (layers) | | | | +# tangle cleave $CXX $CXX + +# can also be called with a layer to only build until +# $ ./build2 --until 050 +UNTIL_LAYER=${2:-zzz} + +# there's two mechanisms for fast builds here: +# - if a command is quick to run, always run it but update the result only on any change +# - otherwise run it only if the output is 'older_than' the inputs +# +# avoid combining both mechanisms for a single file +# otherwise you'll see spurious messages about files being updated +# risk: a file may unnecessarily update without changes, causing unnecessary work downstream + +# return 1 if $1 is older than _any_ of the remaining args +older_than() { + local target=$1 + shift + if [ ! -s $target ] + then +#? echo "$target has size zero" +#? echo "updating $target" >&2 + return 0 # success + fi + local f + for f in $* + do + if [ $f -nt $target ] + then +#? echo "updating $target" >&2 + return 0 # success + fi + done + return 1 # failure +} + +# redirect to $1, unless it's already identical +update() { + if [ ! -e $1 ] + then + cat > $1 + else + cat > $1.tmp + diff -q $1 $1.tmp >/dev/null && rm $1.tmp || mv $1.tmp $1 + fi +} + +update_cp() { + if [ ! -e $2/$1 ] + then + cp $1 $2 + elif [ $1 -nt $2/$1 ] + then + cp $1 $2 + fi +} + +noisy_cd() { + cd $1 + echo "-- `pwd`" >&2 +} + +mv_if_exists() { + test -e $1 && mv $1 $2 + return 0 +} + +wait_for_all() { + # could use inotify on Linux + while ! all_exist "$@" + do + sleep 1 + done +} + +all_exist() { + for f in "$@" + do + test -e $f || return 1 + done + return 0 +} + +TMP=`mktemp` +mv_if_exists enumerate/enumerate $TMP +( + wait_for_all enumerate/enumerate.cc + older_than $TMP enumerate/enumerate.cc && { + echo "building enumerate" + $CXX $CFLAGS enumerate/enumerate.cc -o $TMP + echo "done building enumerate" + } + mv $TMP enumerate/enumerate +) & + +TMP=`mktemp` +mv_if_exists tangle/tangle $TMP +( + wait_for_all tangle/*.cc + older_than $TMP tangle/*.cc && { + echo "building tangle" + cd tangle + # auto-generate various lists (ending in '_list' by convention) { + # list of types + { + grep -h "^struct .* {" [0-9]*.cc |sed 's/\(struct *[^ ]*\).*/\1;/' + grep -h "^typedef " [0-9]*.cc + } |update type_list + # list of function declarations, so I can define them in any order + grep -h "^[^ #].*) {" [0-9]*.cc |sed 's/ {.*/;/' |update function_list + # list of code files to compile + ls [0-9]*.cc |grep -v "\.test\.cc$" |sed 's/.*/#include "&"/' |update file_list + # list of test files to compile + ls [0-9]*.test.cc |sed 's/.*/#include "&"/' |update test_file_list + # list of tests to run + grep -h "^[[:space:]]*void test_" [0-9]*.cc |sed 's/^\s*void \(.*\)() {$/\1,/' |update test_list + # } + # Now that we have all the _lists, compile 'tangle' + $CXX $CFLAGS boot.cc -o $TMP + cd .. + echo "done building tangle" + } + mv $TMP tangle/tangle +) & + +wait_for_all enumerate/enumerate +echo "enumerating layers" +LAYERS=$(./enumerate/enumerate --until $UNTIL_LAYER |grep '\.cc$') +echo "done enumerating layers" + +TMP=`mktemp` +mv_if_exists mu.cc $TMP +( + wait_for_all $LAYERS enumerate/enumerate tangle/tangle + older_than $TMP $LAYERS enumerate/enumerate tangle/tangle && { + echo "running tangle" + # no update here; rely on 'update' calls downstream + ./tangle/tangle $LAYERS > $TMP + echo "done running tangle" + } + mv $TMP mu.cc +) & + +TMP=`mktemp` +mv_if_exists cleave/cleave $TMP +( + wait_for_all cleave/cleave.cc + older_than $TMP cleave/cleave.cc && { + echo "building cleave" + $CXX $CFLAGS cleave/cleave.cc -o $TMP + rm -rf .build + echo "done building cleave" + } + mv $TMP cleave/cleave +) & + +wait_for_all mu.cc cleave/cleave # cleave/cleave just for the .build cleanup +mkdir -p .build +# auto-generate function declarations, so I can define them in any order +# functions start out unindented, have all args on the same line, and end in ') {' +# +# \/ ignore methods +grep -h "^[^[:space:]#].*) {$" mu.cc |grep -v ":.*(" |sed 's/ {.*/;/' |update .build/function_list +# auto-generate list of tests to run +grep -h "^\s*void test_" mu.cc |sed 's/^\s*void \(.*\)() {.*/\1,/' |update .build/test_list +mkdir -p .build/termbox +update_cp termbox/termbox.h .build/termbox + +TMP=`mktemp` +mv_if_exists mu_bin $TMP +( + wait_for_all mu.cc cleave/cleave termbox/*.c termbox/*.h termbox/*.inl + older_than $TMP mu.cc *_list cleave/cleave termbox/* && { + echo "building mu_bin" + ./cleave/cleave mu.cc .build + cd .build + # create the list of global variable declarations from the corresponding definitions + grep ';' global_definitions_list |sed 's/[=(].*/;/' |sed 's/^[^\/# ]/extern &/' |sed 's/^extern extern /extern /' |update global_declarations_list + for f in mu_*.cc + do + OBJ=`echo $f |sed 's/\.cc$/.o/'` + TMP=`mktemp` + mv_if_exists $OBJ $TMP + ( + older_than $TMP $f header global_declarations_list function_list test_list && { + echo "building $OBJ" + $CXX $CFLAGS -c $f -o $TMP + echo "done building $OBJ" + } + mv $TMP $OBJ + ) & + done + cd ../termbox + TMP=`mktemp` + mv_if_exists utf8.o $TMP + ( + older_than $TMP utf8.c && { + echo "building termbox/utf8.o" + $CC $CFLAGS -c utf8.c -o $TMP + echo "done building termbox/utf8.o" + } + mv $TMP utf8.o + ) & + TMP=`mktemp` + mv_if_exists termbox.o $TMP + ( + older_than $TMP termbox.c termbox.h input.inl output.inl bytebuffer.inl && { + echo "building termbox/termbox.o" + $CC $CFLAGS -c termbox.c -o $TMP + echo "done building termbox/termbox.o" + } + mv $TMP termbox.o + ) & + TMP=`mktemp` + mv_if_exists libtermbox.a $TMP + ( + wait_for_all termbox.o utf8.o + older_than $TMP termbox.o utf8.o && { + echo "building termbox/libtermbox.a" + rm $TMP; ar rcs $TMP termbox.o utf8.o # race condition; later mktemp may end up reusing this file + echo "done building termbox/libtermbox.a" + } + mv $TMP libtermbox.a + ) & + cd .. + MU_OBJS=`echo .build/mu_*.cc |sed 's/\.cc/.o/g'` + echo wait_for_all $MU_OBJS termbox/libtermbox.a + wait_for_all $MU_OBJS termbox/libtermbox.a + echo "building .build/mu_bin" + $CXX $CFLAGS $MU_OBJS termbox/libtermbox.a -o $TMP + echo "done building .build/mu_bin" + echo "done building mu_bin" + } + mv $TMP mu_bin +) & + +## [0-9]*.mu -> core.mu + +wait_for_all enumerate/enumerate +echo "building core.mu" +MU_LAYERS=$(./enumerate/enumerate --until $UNTIL_LAYER |grep '\.mu$') || exit 0 # ok if no .mu files +cat $MU_LAYERS |update core.mu +echo "done building core.mu" + +wait_for_all mu_bin +exit 0 + +# scenarios considered: +# 0 status when nothing needs updating +# no output when nothing needs updating +# no output for mu.cc when .mu files modified +# touch mu.cc but don't modify it; no output on second build +# touch a .cc layer but don't modify it; no output on second build +# only a single layer is recompiled when changing a C++ function +# stop immediately after failure in tangle -- cgit 1.4.1-2-gfad0 artik Agaram <vc@akkartik.com> 2019-01-11 18:08:21 -0800 4921' href='/akkartik/mu/commit/html/subx/039debug.cc.html?h=hlt&id=db8a9ab553535551ce80dcd5ce07cffb85f5cfb7'>db8a9ab5 ^
ac07e589 ^
ce2c1efc ^
e92fa89e ^
104e521c ^















ce2c1efc ^
104e521c ^















c8a3ccbe ^
104e521c ^
52daf072 ^















c8a3ccbe ^
52daf072 ^

c8a3ccbe ^


52daf072 ^





c8a3ccbe ^
52daf072 ^

c8a3ccbe ^


52daf072 ^



c8a3ccbe ^



52daf072 ^

c8a3ccbe ^
52daf072 ^


c8a3ccbe ^
52daf072 ^

c8a3ccbe ^
52daf072 ^

c8a3ccbe ^
52daf072 ^
c8a3ccbe ^
52daf072 ^

c8a3ccbe ^
52daf072 ^















ce2c1efc ^
52daf072 ^
c8a3ccbe ^
52daf072 ^





c8a3ccbe ^

52daf072 ^

c8a3ccbe ^

52daf072 ^

ce2c1efc ^



c8a3ccbe ^
ce2c1efc ^


c8a3ccbe ^
695f9bf8 ^
ce2c1efc ^
c8a3ccbe ^
ce2c1efc ^


52daf072 ^
ce2c1efc ^





































104e521c ^



1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211