maxmcd
diff --git a/‎.github/workflows/go.yml‎
Lines changed: 1 addition & 1 deletion b/‎.github/workflows/go.yml‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎Makefile‎
Lines changed: 13 additions & 1 deletion b/‎Makefile‎
Lines changed: 13 additions & 1 deletion
diff --git a/‎go.mod‎
Lines changed: 7 additions & 4 deletions b/‎go.mod‎
Lines changed: 7 additions & 4 deletions
diff --git a/‎go.sum‎
Lines changed: 43 additions & 451 deletions b/‎go.sum‎
Lines changed: 43 additions & 451 deletions
diff --git a/‎lib/default.bramble‎
Lines changed: 4 additions & 50 deletions b/‎lib/default.bramble‎
Lines changed: 4 additions & 50 deletions
diff --git a/‎lib/go/default.bramble‎
Lines changed: 1 addition & 1 deletion b/‎lib/go/default.bramble‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎notes/22-gc.md‎
Lines changed: 5 additions & 0 deletions b/‎notes/22-gc.md‎
Lines changed: 5 additions & 0 deletions
diff --git a/‎notes/23-full-directory-searching.md‎
Lines changed: 1 addition & 0 deletions b/‎notes/23-full-directory-searching.md‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎notes/24-early-cuttoff-optimization.md‎
Lines changed: 16 additions & 0 deletions b/‎notes/24-early-cuttoff-optimization.md‎
Lines changed: 16 additions & 0 deletions
diff --git a/‎notes/25-dynamic-dependencies.md‎
Lines changed: 63 additions & 0 deletions b/‎notes/25-dynamic-dependencies.md‎
Lines changed: 63 additions & 0 deletions
@@ -16,7 +16,7 @@ jobs:
         uses: actions/checkout@v2
       - name: Run all tests
         run: |
-          make test
+          make ci_test
       # for your debugging needs
       # - name: Setup tmate session
       #   uses: mxschmitt/action-tmate@v3
@@ -3,7 +3,16 @@
 test: go_test \
 	integration_test
 
-go_test: install
+ci_test: go_ci_test \
+	integration_ci_test
+
+gotestsum:
+	go get gotest.tools/gotestsum
+
+go_ci_test: gotestsum
+	gotestsum -- -race -v ./...
+
+go_test:
 	go test -race -v ./...
 
 # just use LICENSE as a file we can harmlessly "touch" and use as a cache marker
@@ -14,6 +23,9 @@ LICENSE: main.go pkg/*/*.go
 
 install: LICENSE
 
+integration_ci_test: install gotestsum
+	env BRAMBLE_INTEGRATION_TEST=truthy gotestsum -- -v ./pkg/bramble/
+
 integration_test: install
 	env BRAMBLE_INTEGRATION_TEST=truthy go test -v ./pkg/bramble/
 
 
@@ -1,18 +1,20 @@
 module github.com/maxmcd/bramble
 
-go 1.15
+go 1.16
 
 require (
 	github.com/BurntSushi/toml v0.3.1
 	github.com/certifi/gocertifi v0.0.0-20200922220541-2c3bb06c6054
 	github.com/containerd/console v1.0.0
 	github.com/creack/pty v1.1.11
+	github.com/davecgh/go-spew v1.1.1
+	github.com/docker/docker v1.4.2-0.20191101170500-ac7306503d23
 	github.com/fsouza/go-dockerclient v1.6.5
-	github.com/go-git/go-git/v5 v5.2.0
-	github.com/hashicorp/terraform v0.14.4
+	github.com/go-git/go-git/v5 v5.3.0
 	github.com/jaguilar/vt100 v0.0.0-20201024211400-81de19cb81a4
+	github.com/maxmcd/dag v0.0.0-20210316172417-f02e4b03c6e9
 	github.com/mholt/archiver/v3 v3.3.1-0.20200626164424-d44471c49aa7
-	github.com/moby/moby v1.13.1
+	github.com/minio/sha256-simd v1.0.0
 	github.com/morikuni/aec v1.0.0
 	github.com/peterbourgon/ff/v3 v3.0.0
 	github.com/pkg/errors v0.9.1
@@ -22,6 +24,7 @@ require (
 	go.uber.org/zap v1.10.0
 	golang.org/x/crypto v0.0.0-20210220033148-5ea612d1eb83
 	golang.org/x/sys v0.0.0-20210305230114-8fe3ee5dd75b
+	golang.org/x/sys v0.0.0-20210324051608-47abb6519492
 	golang.org/x/time v0.0.0-20200630173020-3af7569d3a1e
 )
 
 
@@ -26,61 +26,15 @@ def zig():
 def busybox():
     b = std.fetch_url("https://brmbl.s3.amazonaws.com/busybox-x86_64.tar.gz")
 
-    commands = """
-[, [[, acpid, add-shell, addgroup, adduser, adjtimex, arch, arp, arping, ash, awk,
-base64, basename, bc, beep, blkdiscard, blkid, blockdev, bootchartd, brctl, bunzip2,
-bzcat, bzip2, cal, cat, chat, chattr, chgrp, chmod, chown, chpasswd, chpst, chroot,
-chrt, chvt, cksum, clear, cmp, comm, conspy, cp, cpio, crond, crontab, cryptpw,
-cttyhack, cut, date, dc, dd, deallocvt, delgroup, deluser, depmod, devmem, df,
-dhcprelay, diff, dirname, dmesg, dnsd, dnsdomainname, dos2unix, dpkg, dpkg-deb, du,
-dumpkmap, dumpleases, echo, ed, egrep, eject, env, envdir, envuidgid, ether-wake,
-expand, expr, factor, fakeidentd, fallocate, false, fatattr, fbset, fbsplash, fdflush,
-fdformat, fdisk, fgconsole, fgrep, find, findfs, flock, fold, free, freeramdisk, fsck,
-fsck.minix, fsfreeze, fstrim, fsync, ftpd, ftpget, ftpput, fuser, getopt, getty, grep,
-groups, gunzip, gzip, halt, hd, hdparm, head, hexdump, hexedit, hostid, hostname, httpd,
-hush, hwclock, i2cdetect, i2cdump, i2cget, i2cset, i2ctransfer, id, ifconfig, ifdown,
-ifenslave, ifplugd, ifup, inetd, init, insmod, install, ionice, iostat, ip, ipaddr,
-ipcalc, ipcrm, ipcs, iplink, ipneigh, iproute, iprule, iptunnel, kbd_mode, kill,
-killall, killall5, klogd, last, less, link, linux32, linux64, linuxrc, ln, loadfont,
-loadkmap, logger, login, logname, logread, losetup, lpd, lpq, lpr, ls, lsattr, lsmod,
-lsof, lspci, lsscsi, lsusb, lzcat, lzma, lzop, makedevs, makemime, man, md5sum, mdev,
-mesg, microcom, mkdir, mkdosfs, mke2fs, mkfifo, mkfs.ext2, mkfs.minix, mkfs.vfat, mknod,
-mkpasswd, mkswap, mktemp, modinfo, modprobe, more, mount, mountpoint, mpstat, mt, mv,
-nameif, nanddump, nandwrite, nbd-client, nc, netstat, nice, nl, nmeter, nohup, nologin,
-nproc, nsenter, nslookup, ntpd, nuke, od, openvt, partprobe, passwd, paste, patch,
-pgrep, pidof, ping, ping6, pipe_progress, pivot_root, pkill, pmap, popmaildir, poweroff,
-powertop, printenv, printf, ps, pscan, pstree, pwd, pwdx, raidautorun, rdate, rdev,
-readahead, readlink, readprofile, realpath, reboot, reformime, remove-shell, renice,
-reset, resize, resume, rev, rm, rmdir, rmmod, route, rpm, rpm2cpio, rtcwake, run-init,
-run-parts, runlevel, runsv, runsvdir, rx, script, scriptreplay, sed, sendmail, seq,
-setarch, setconsole, setfattr, setfont, setkeycodes, setlogcons, setpriv, setserial,
-setsid, setuidgid, sh, sha1sum, sha256sum, sha3sum, sha512sum, showkey, shred, shuf,
-slattach, sleep, smemcap, softlimit, sort, split, ssl_client, start-stop-daemon, stat,
-strings, stty, su, sulogin, sum, sv, svc, svlogd, svok, swapoff, swapon, switch_root,
-sync, sysctl, syslogd, tac, tail, tar, taskset, tc, tcpsvd, tee, telnet, telnetd, test,
-tftp, tftpd, time, timeout, top, touch, tr, traceroute, traceroute6, true, truncate, ts,
-tty, ttysize, tunctl, ubiattach, ubidetach, ubimkvol, ubirename, ubirmvol, ubirsvol,
-ubiupdatevol, udhcpc, udhcpc6, udhcpd, udpsvd, uevent, umount, uname, unexpand, uniq,
-unix2dos, unlink, unlzma, unshare, unxz, unzip, uptime, users, usleep, uudecode,
-uuencode, vconfig, vi, vlock, volname, w, wall, watch, watchdog, wc, wget, which, who,
-whoami, whois, xargs, xxd, xz, xzcat, yes, zcat, zcip
-    """
-
-    command_list = " ".join(commands.strip().split("\n")).split(", ")
-    command_list.remove("ln")
-    command_symlinks = "\n".join([("./ln -s busybox %s" % c) for c in command_list])
-    command_symlinks
-    script = (
-        """
+    script = """
     set -e
     $busybox_download/busybox-x86_64 mkdir $out/bin
     $busybox_download/busybox-x86_64 cp $busybox_download/busybox-x86_64 $out/bin/busybox
     cd $out/bin
-    ./busybox ln -s busybox ln
-    %s
+    for command in $(./busybox --list); do
+        ./busybox ln -s busybox $command
+    done
     """
-        % command_symlinks
-    )
 
     return derivation(
         name="busybox",
 
@@ -3,7 +3,7 @@ load(nix_seed="github.com/maxmcd/bramble/lib/nix-seed")
 load("github.com/maxmcd/bramble/lib")
 
 
-def _bootstrap():
+def bootstrap():
     go1_4 = std.fetch_url("https://dl.google.com/go/go1.4-bootstrap-20171003.tar.gz")
     path = "%s/bin:%s/bin" % (nix_seed.stdenv(), lib.busybox())
     return derivation(
 
@@ -0,0 +1,5 @@
+GC
+
+We want to clean up files we don't need any more. Easiest way to do this is to enumerate all files that we do need and then delete everything else.
+
+For the first version of GC, let's just keep everything we could possibly use?
@@ -0,0 +1 @@
+https://github.com/golang/go/issues/30058
@@ -0,0 +1,16 @@
+Nix handles early cutoff with fixed output derivations. These must be manually kept up to date.
+
+Because the dependency graph in Bramble is (currently) constructed using the hash of input derivations, any change to a build input will result in a full rebuild.
+
+I think it's important when thinking about a solution here to remember that all build inputs are either filesystem files or `fetch` derivations, so don't get too creative about storing build state.
+
+### Always use the build output as the derivation hash
+
+When currently injecting a derivation into a child derivation we use a format like this: `{{ tmb75glr3iqxaso2gn27ytrmr4ufkv6d-.drv:out }}`. Alternatively we could replace that with the hash of the output.
+
+I think this is what the steps would look like with this approach:
+
+1. Calculate the entire derivation graph. If we already have build outputs computed use them as the named hash.
+2. Find the first derivation that needs to be built. Build it, replace all the child derivations' derivation hashes with the output hash. Continue building.
+
+What's the cost here? We wouldn't know the derivations we're going to build without building them; this only means that we don't know in advance which things we're going to have to build. This seems fine (and I think is mandatory for this feature).
@@ -0,0 +1,63 @@
+## Dynamic Dependencies
+
+Nix and Bazel don't allow dynamic dependencies. I think there is an argument to be made that this is the reason their ergonomics are so poor. Nix libs that are intended to build arbitrary projects in a given language rely heavily on code generation. Arguably this is a type of dynamic dependencies.
+
+I think it would be interesting to explore first class support for dynamic dependencies in Bramble. Maybe if they are easy to use and set up we can limit the amount of derivations that need network access. If you can generate arbitrary calls to `fetch_url` within a derivation, then maybe you can get away with just that.
+
+One Idea:
+
+There is a specific type of derivation that outputs starlark code. It is a different color than regular derivations (so we can detect it statically), and only outputs starlark code. This starlark code is run once the derivation is done building. We would need to update the dependency graph as we build.
+
+This has some weird implications because we would still need to reference the build output. Do we just need to ensure that the generated code just outputs a single derivation?
+
+So let's think about numpy.
+
+```python
+def foo():
+    pip_install("numpy")
+```
+
+There is no real way to do this because numpy will need to download its own dependencies. So we could either:
+
+1. Download them within the derivations using the network, but then other dependencies might generate their own independent dependencies, which would be duplicated and might conflict.
+2. Generate code for each dependency, which totally works, but doesn't have first class support.
+
+
+```python
+def foo():
+    pip_install("numpy")
+
+def pip_install(name):
+    deps = fetch_url("dependency_finder.gov/"+name)
+    derivation(script="""
+    out = ""
+    for dep in deps:
+        out += "fetch_url(dep)\n"
+    return out
+    """)
+```
+
+Terrible pseudo-code, but basically this derivation returns starlark code with the deps we need to download.
+
+If we go this route, we would need to be able to check if we've generated this derivation on the fly. I think if we don't do that, it would be very hard to do things like validating current url hashes without actually building.
+
+We could just stick the outputted starlark into the store somewhere, but it might be better to generate code and keep it in the source of the project. If the interface is just like in the example above `fetch_url("numpy")` then what if a new version of numpy is published? Any time there was a rebuild the url hash would mismatch. I think ideally if we want to replicate something like a Cargo.lock we would need the output of the code generating derivation to be placed within the project tree. That way, that generated file could reference very specific versions of software to fetch. If the end user wanted to fetch a new version they would simply delete the generated file.
+
+This doesn't really remove the need for derivations that access the network. The code generating derivation would still need to make a request for the `numpy` source in order to calculate dependencies.
+
+This kind of thing would mean that you could truly write a derivation like `pip_install("numpy")` without code generation that would require certain setup.
+
+We could also prevent code generated by a code generating derivation from calling another code generating derivation, at least at the start, to limit all kinds of gnarly behavior.
+
+----
+
+More thoughts.
+
+This might actually be a good idea. We could then move forward with limiting network functionality only to derivations that use the network. That way we could be sure that after we've processed all derivations initially we can proceed from there without ever using the network.
+
+One complication here is that bramble libraries could use this as well, so we can't generate bramble code and then store it next to the initial source file. Generated code could also depend on passed parameters, so we wouldn't be able to check a file's lock file just by analyzing the source of that file, we'd need to be sure we were testing it with whatever parameters were passed to functions in that file.
+
+Wait, maybe not: the generating function will always be called without arguments. So maybe we just put the code in the project next to the file that calls the function.
+
+Ok, either way, that needs to be sorted out, and we might want to consider just adding generated code to the lockfile.
+
-Original file line number
+Diff line change
@@ @@ -0,0 +1,5 @@ @@
 +GC
++
 +We want to clean up files we don't need any more. Easiest way to do this is to enumerate all files that we do need and then delete everything else.
++
 +For the first version of GC, let's just keep everything we could possibly use?
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1 @@`
	`1`	`+https://github.com/golang/go/issues/30058`