blob: 852d7185cf80a03fc38996c5a851e758f19034db (
plain) (
tree)
|
|
#!/bin/sh
# Experimental alternative to build2 that can run steps in parallel if their
# dependencies are met. Caveats:
#
# 1. We rely on the OS to schedule steps, so thousands of independent tasks
# will likely be counter-productive.
# 2. Can run out of virtual memory if you spawn too many say $CC processes.
# 3. Compilation errors can cause the script to hang.
# 4. Ugly as heck! Really needs simpler versions to compare against. And
# even then, diff gets confused.
# 5. There's a mechanical difficulty: we use mktemp to reliably create
# temporary filenames, which has the side effect of also creating the
# files. So zero-size files are considered equivalent to empty files.
# When some commands have trouble with this (e.g. ar) we need to delete
# the empty file, which can expose us to a race condition wrt mktemp.
set -e # stop immediately on error
# Some environment variables that can be passed in. For example, to turn off
# optimization:
# $ CFLAGS=-g ./build2
test "$CXX" || export CXX=c++
test "$CC" || export CC=cc
test "$CFLAGS" || export CFLAGS="-g -O2"
export CFLAGS="$CFLAGS -Wall -Wextra -ftrapv -fno-strict-aliasing"
# Outline:
# [0-9]*.cc -> mu.cc -> .build/*.cc -> .build/*.o -> .build/mu_bin
# (layers) | | | |
# tangle cleave $CXX $CXX
# can also be called with a layer to only build until
# $ ./build2 --until 050
UNTIL_LAYER=${2:-zzz}
# there's two mechanisms for fast builds here:
# - if a command is quick to run, always run it but update the result only on any change
# - otherwise run it only if the output is 'older_than' the inputs
#
# avoid combining both mechanisms for a single file
# otherwise you'll see spurious messages about files being updated
# risk: a file may unnecessarily update without changes, causing unnecessary work downstream
# return 1 if $1 is older than _any_ of the remaining args
older_than() {
local target=$1
shift
if [ ! -s $target ]
then
#? echo "$target has size zero"
#? echo "updating $target" >&2
return 0 # success
fi
local f
for f in $*
do
if [ $f -nt $target ]
then
#? echo "updating $target" >&2
return 0 # success
fi
done
return 1 # failure
}
# redirect to $1, unless it's already identical
update() {
if [ ! -e $1 ]
then
cat > $1
else
cat > $1.tmp
diff -q $1 $1.tmp >/dev/null && rm $1.tmp || mv $1.tmp $1
fi
}
update_cp() {
if [ ! -e $2/$1 ]
then
cp $1 $2
elif [ $1 -nt $2/$1 ]
then
cp $1 $2
fi
}
noisy_cd() {
cd $1
echo "-- `pwd`" >&2
}
mv_if_exists() {
test -e $1 && mv $1 $2
return 0
}
wait_for_all() {
# could use inotify on Linux
while ! all_exist "$@"
do
sleep 1
done
}
all_exist() {
for f in "$@"
do
test -e $f || return 1
done
return 0
}
TMP=`mktemp`
mv_if_exists enumerate/enumerate $TMP
(
wait_for_all enumerate/enumerate.cc
older_than $TMP enumerate/enumerate.cc && {
echo "building enumerate"
$CXX $CFLAGS enumerate/enumerate.cc -o $TMP
echo "done building enumerate"
}
mv $TMP enumerate/enumerate
) &
TMP=`mktemp`
mv_if_exists tangle/tangle $TMP
(
wait_for_all tangle/*.cc
older_than $TMP tangle/*.cc && {
echo "building tangle"
cd tangle
# auto-generate various lists (ending in '_list' by convention) {
# list of types
{
grep -h "^struct .* {" [0-9]*.cc |sed 's/\(struct *[^ ]*\).*/\1;/'
grep -h "^typedef " [0-9]*.cc
} |update type_list
# list of function declarations, so I can define them in any order
grep -h "^[^ #].*) {" [0-9]*.cc |sed 's/ {.*/;/' |update function_list
# list of code files to compile
ls [0-9]*.cc |grep -v "\.test\.cc$" |sed 's/.*/#include "&"/' |update file_list
# list of test files to compile
ls [0-9]*.test.cc |sed 's/.*/#include "&"/' |update test_file_list
# list of tests to run
grep -h "^[[:space:]]*void test_" [0-9]*.cc |sed 's/^\s*void \(.*\)() {$/\1,/' |update test_list
# }
# Now that we have all the _lists, compile 'tangle'
$CXX $CFLAGS boot.cc -o $TMP
cd ..
echo "done building tangle"
}
mv $TMP tangle/tangle
) &
wait_for_all enumerate/enumerate
echo "enumerating layers"
LAYERS=$(./enumerate/enumerate --until $UNTIL_LAYER |grep '\.cc$')
echo "done enumerating layers"
TMP=`mktemp`
mv_if_exists mu.cc $TMP
(
wait_for_all $LAYERS enumerate/enumerate tangle/tangle
older_than $TMP $LAYERS enumerate/enumerate tangle/tangle && {
echo "running tangle"
# no update here; rely on 'update' calls downstream
./tangle/tangle $LAYERS > $TMP
echo "done running tangle"
}
mv $TMP mu.cc
) &
TMP=`mktemp`
mv_if_exists cleave/cleave $TMP
(
wait_for_all cleave/cleave.cc
older_than $TMP cleave/cleave.cc && {
echo "building cleave"
$CXX $CFLAGS cleave/cleave.cc -o $TMP
rm -rf .build
echo "done building cleave"
}
mv $TMP cleave/cleave
) &
wait_for_all mu.cc cleave/cleave # cleave/cleave just for the .build cleanup
mkdir -p .build
# auto-generate function declarations, so I can define them in any order
# functions start out unindented, have all args on the same line, and end in ') {'
#
# \/ ignore methods
grep -h "^[^[:space:]#].*) {$" mu.cc |grep -v ":.*(" |sed 's/ {.*/;/' |update .build/function_list
# auto-generate list of tests to run
grep -h "^\s*void test_" mu.cc |sed 's/^\s*void \(.*\)() {.*/\1,/' |update .build/test_list
mkdir -p .build/termbox
update_cp termbox/termbox.h .build/termbox
TMP=`mktemp`
mv_if_exists mu_bin $TMP
(
wait_for_all mu.cc cleave/cleave termbox/*.c termbox/*.h termbox/*.inl
older_than $TMP mu.cc *_list cleave/cleave termbox/* && {
echo "building mu_bin"
./cleave/cleave mu.cc .build
cd .build
# create the list of global variable declarations from the corresponding definitions
grep ';' global_definitions_list |sed 's/[=(].*/;/' |sed 's/^[^\/# ]/extern &/' |sed 's/^extern extern /extern /' |update global_declarations_list
for f in mu_*.cc
do
OBJ=`echo $f |sed 's/\.cc$/.o/'`
TMP=`mktemp`
mv_if_exists $OBJ $TMP
(
older_than $TMP $f header global_declarations_list function_list test_list && {
echo "building $OBJ"
$CXX $CFLAGS -c $f -o $TMP
echo "done building $OBJ"
}
mv $TMP $OBJ
) &
done
cd ../termbox
TMP=`mktemp`
mv_if_exists utf8.o $TMP
(
older_than $TMP utf8.c && {
echo "building termbox/utf8.o"
$CC $CFLAGS -c utf8.c -o $TMP
echo "done building termbox/utf8.o"
}
mv $TMP utf8.o
) &
TMP=`mktemp`
mv_if_exists termbox.o $TMP
(
older_than $TMP termbox.c termbox.h input.inl output.inl bytebuffer.inl && {
echo "building termbox/termbox.o"
$CC $CFLAGS -c termbox.c -o $TMP
echo "done building termbox/termbox.o"
}
mv $TMP termbox.o
) &
TMP=`mktemp`
mv_if_exists libtermbox.a $TMP
(
wait_for_all termbox.o utf8.o
older_than $TMP termbox.o utf8.o && {
echo "building termbox/libtermbox.a"
rm $TMP; ar rcs $TMP termbox.o utf8.o # race condition; later mktemp may end up reusing this file
echo "done building termbox/libtermbox.a"
}
mv $TMP libtermbox.a
) &
cd ..
MU_OBJS=`echo .build/mu_*.cc |sed 's/\.cc/.o/g'`
echo wait_for_all $MU_OBJS termbox/libtermbox.a
wait_for_all $MU_OBJS termbox/libtermbox.a
echo "building .build/mu_bin"
$CXX $CFLAGS $MU_OBJS termbox/libtermbox.a -o $TMP
echo "done building .build/mu_bin"
echo "done building mu_bin"
}
mv $TMP mu_bin
) &
## [0-9]*.mu -> core.mu
wait_for_all enumerate/enumerate
echo "building core.mu"
MU_LAYERS=$(./enumerate/enumerate --until $UNTIL_LAYER |grep '\.mu$') || exit 0 # ok if no .mu files
cat $MU_LAYERS |update core.mu
echo "done building core.mu"
wait_for_all mu_bin
exit 0
# scenarios considered:
# 0 status when nothing needs updating
# no output when nothing needs updating
# no output for mu.cc when .mu files modified
# touch mu.cc but don't modify it; no output on second build
# touch a .cc layer but don't modify it; no output on second build
# only a single layer is recompiled when changing a C++ function
# stop immediately after failure in tangle
|