-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathMakefile
More file actions
208 lines (176 loc) · 7.41 KB
/
Makefile
File metadata and controls
208 lines (176 loc) · 7.41 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
# Terraphim Personalized Medicine System
# Makefile for building pre-serialized medical dataset artifacts
#
# One-time setup on developer machine:
# make artifacts
# git lfs push origin main # or: make upload-artifacts
#
# On judge/reviewer machine (after git clone):
# git lfs pull # fast: downloads compressed artifacts
# cargo run -p terraphim-api # cold-start <5s (loads pre-built artifacts)
#
# S3 fallback (if artifacts exceed 1 GB LFS quota):
# ARTIFACT_BUCKET=my-bucket make upload-s3
# ARTIFACT_BUCKET=my-bucket make fetch-s3
ARTIFACT_DIR := data/artifacts
UMLS_INPUT := data/automata/words_cui.tsv
SNOMED_VERSION := 20240201
UMLS_ARTIFACT := $(ARTIFACT_DIR)/umls_automata.bin.zst
SNOMED_ARTIFACT := $(ARTIFACT_DIR)/snomed_hierarchy.bin.zst
CPIC_ARTIFACT := $(ARTIFACT_DIR)/cpic_database.bin.zst
SNOMED_CONCEPTS := data/snomed/extracted/sct2_Concept_Full_INT_$(SNOMED_VERSION).txt
SNOMED_DESCRIPTIONS := data/snomed/extracted/sct2_Description_Full-en_INT_$(SNOMED_VERSION).txt
SNOMED_RELATIONSHIPS := data/snomed/extracted/sct2_Relationship_Full_INT_$(SNOMED_VERSION).txt
# Release configuration
VERSION := $(shell git describe --tags --always --dirty 2>/dev/null || echo "0.1.0")
PACKAGE_NAME := terraphim-medgemma-$(VERSION)-linux-x86_64
RELEASE_DIR := target/release
DIST_DIR := dist
.PHONY: all artifacts fetch-artifacts upload-s3 fetch-s3 clean-artifacts test snomed-fhir snomed-fhir-check
.PHONY: build-release package checksum clean-release install
all: test
## Build all three pre-serialized artifacts
artifacts: $(UMLS_ARTIFACT) $(SNOMED_ARTIFACT) $(CPIC_ARTIFACT)
@echo ""
@echo "=== Artifacts built ==="
@ls -lh $(ARTIFACT_DIR)/*.bin.zst
## UMLS Aho-Corasick artifact (~14 min build, <100ms load)
$(UMLS_ARTIFACT): $(UMLS_INPUT)
@mkdir -p $(ARTIFACT_DIR)
cargo run --release --bin build-umls-artifact -- \
--input $(UMLS_INPUT) \
--output $(UMLS_ARTIFACT)
## SNOMED CT hierarchy artifact (requires RF2 download first)
$(SNOMED_ARTIFACT): $(SNOMED_CONCEPTS) $(SNOMED_DESCRIPTIONS) $(SNOMED_RELATIONSHIPS)
@mkdir -p $(ARTIFACT_DIR)
cargo run --release --bin build-snomed-artifact -- \
--concepts $(SNOMED_CONCEPTS) \
--descriptions $(SNOMED_DESCRIPTIONS) \
--relationships $(SNOMED_RELATIONSHIPS) \
--output $(SNOMED_ARTIFACT)
## Download SNOMED RF2 files
## Option A (primary): UMLS API key — fastest, full RF2 release
## UMLS_API_KEY=xxx make $(SNOMED_CONCEPTS)
## Option B (fallback): Public FHIR server — no key needed, slower (~2h for full set)
## make snomed-fhir
$(SNOMED_CONCEPTS):
@if [ -n "$(UMLS_API_KEY)" ]; then \
SNOMED_VERSION=$(SNOMED_VERSION) ./scripts/download_snomed.sh; \
else \
echo "No UMLS_API_KEY set. Using public FHIR fallback (no key required)."; \
python3 scripts/download_snomed_fhir.py --output data/snomed/extracted; \
fi
## Download SNOMED via public FHIR API (no UMLS key required)
snomed-fhir:
python3 scripts/download_snomed_fhir.py --output data/snomed/extracted
## Test FHIR connectivity only
snomed-fhir-check:
python3 scripts/download_snomed_fhir.py --dry-run
## CPIC pharmacogenomics artifact (downloads from live API)
$(CPIC_ARTIFACT):
@mkdir -p $(ARTIFACT_DIR)
cargo run --release --bin build-cpic-artifact -- \
--output $(CPIC_ARTIFACT)
## Pull artifacts from Git LFS
fetch-artifacts:
git lfs pull
## Upload artifacts to S3 (fallback when LFS quota exceeded)
upload-s3:
@test -n "$(ARTIFACT_BUCKET)" || (echo "Error: ARTIFACT_BUCKET not set" && exit 1)
aws s3 cp $(ARTIFACT_DIR)/ s3://$(ARTIFACT_BUCKET)/artifacts/ \
--recursive --exclude "*" --include "*.bin.zst"
## Download artifacts from S3 (fallback)
fetch-s3:
@test -n "$(ARTIFACT_BUCKET)" || (echo "Error: ARTIFACT_BUCKET not set" && exit 1)
@mkdir -p $(ARTIFACT_DIR)
aws s3 cp s3://$(ARTIFACT_BUCKET)/artifacts/ $(ARTIFACT_DIR)/ \
--recursive --exclude "*" --include "*.bin.zst"
## Remove built artifacts (they can be regenerated)
clean-artifacts:
rm -f $(ARTIFACT_DIR)/*.bin.zst
## Run all tests
test:
cargo test --lib --workspace
cd terraphim_pipeline && python -m pytest tests/ -v 2>/dev/null || true
# =============================================================================
# Release and Packaging Targets
# =============================================================================
## Build optimized release binaries for all workspace crates
build-release:
@echo "Building release binaries..."
cargo build --release --workspace \
--bin terraphim-demo \
--bin terraphim-api \
--bin build-umls-artifact \
--bin build-snomed-artifact \
--bin build-cpic-artifact \
--bin umls_benchmark \
--bin evaluation-runner \
--bin primekg-import
@echo ""
@echo "=== Release binaries built ==="
@ls -lh $(RELEASE_DIR)/terraphim-demo $(RELEASE_DIR)/terraphim-api 2>/dev/null || true
## Create distribution tarball with all binaries and data files
package: build-release
@echo "Creating distribution package..."
@mkdir -p $(DIST_DIR)/$(PACKAGE_NAME)
# Copy binaries
cp $(RELEASE_DIR)/terraphim-demo $(DIST_DIR)/$(PACKAGE_NAME)/
cp $(RELEASE_DIR)/terraphim-api $(DIST_DIR)/$(PACKAGE_NAME)/
cp $(RELEASE_DIR)/build-umls-artifact $(DIST_DIR)/$(PACKAGE_NAME)/
cp $(RELEASE_DIR)/build-snomed-artifact $(DIST_DIR)/$(PACKAGE_NAME)/
cp $(RELEASE_DIR)/build-cpic-artifact $(DIST_DIR)/$(PACKAGE_NAME)/
cp $(RELEASE_DIR)/umls_benchmark $(DIST_DIR)/$(PACKAGE_NAME)/
cp $(RELEASE_DIR)/evaluation-runner $(DIST_DIR)/$(PACKAGE_NAME)/
cp $(RELEASE_DIR)/primekg-import $(DIST_DIR)/$(PACKAGE_NAME)/
# Copy data files
@mkdir -p $(DIST_DIR)/$(PACKAGE_NAME)/data/artifacts
@if [ -d "$(ARTIFACT_DIR)" ]; then \
cp $(ARTIFACT_DIR)/*.bin.zst $(DIST_DIR)/$(PACKAGE_NAME)/data/artifacts/ 2>/dev/null || true; \
fi
# Copy documentation
cp README.md $(DIST_DIR)/$(PACKAGE_NAME)/
cp LICENSE $(DIST_DIR)/$(PACKAGE_NAME)/ 2>/dev/null || true
@if [ -d "docs" ]; then \
cp -r docs $(DIST_DIR)/$(PACKAGE_NAME)/; \
fi
# Copy config files
@if [ -d "config" ]; then \
cp -r config $(DIST_DIR)/$(PACKAGE_NAME)/; \
fi
# Create install script
@./scripts/package.sh $(DIST_DIR)/$(PACKAGE_NAME)
# Create tarball
cd $(DIST_DIR) && tar czf $(PACKAGE_NAME).tar.gz $(PACKAGE_NAME)
@echo ""
@echo "=== Package created ==="
@ls -lh $(DIST_DIR)/$(PACKAGE_NAME).tar.gz
## Generate SHA256 checksums for all distribution files
checksum: package
@echo "Generating checksums..."
cd $(DIST_DIR) && sha256sum *.tar.gz > checksums.sha256
@echo ""
@echo "=== Checksums ==="
@cat $(DIST_DIR)/checksums.sha256
## Clean release artifacts
clean-release:
rm -rf $(DIST_DIR)
cargo clean --release
## Install binaries to system (requires sudo)
install: build-release
@echo "Installing Terraphim MedGemma..."
sudo install -m 755 $(RELEASE_DIR)/terraphim-demo /usr/local/bin/
sudo install -m 755 $(RELEASE_DIR)/terraphim-api /usr/local/bin/
sudo install -m 755 $(RELEASE_DIR)/build-umls-artifact /usr/local/bin/
sudo install -m 755 $(RELEASE_DIR)/build-snomed-artifact /usr/local/bin/
sudo install -m 755 $(RELEASE_DIR)/build-cpic-artifact /usr/local/bin/
@echo "Installation complete!"
## Uninstall binaries from system (requires sudo)
uninstall:
@echo "Uninstalling Terraphim MedGemma..."
sudo rm -f /usr/local/bin/terraphim-demo
sudo rm -f /usr/local/bin/terraphim-api
sudo rm -f /usr/local/bin/build-umls-artifact
sudo rm -f /usr/local/bin/build-snomed-artifact
sudo rm -f /usr/local/bin/build-cpic-artifact
@echo "Uninstall complete!"