Skip to content

Commit 62b477d

Browse files
Merge pull request #150 from datakind/feat/testing_h2o_pipeline
testing h2o pipeline on synthetic 2 dataset
2 parents: d6329ab + 45888ae; commit: 62b477d

1 file changed

Lines changed: 12 additions & 4 deletions

File tree

src/webapp/databricks.py

Lines changed: 12 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -35,6 +35,7 @@
3535

3636
# The name of the deployed pipeline in Databricks. Must match directly.
3737
PDP_INFERENCE_JOB_NAME = "github_sourced_pdp_inference_pipeline"
38+
PDP_H2O_INFERENCE_JOB_NAME = "github_sourced_pdp_h2o_inference_pipeline"
3839

3940

4041
class DatabricksInferenceRunRequest(BaseModel):
@@ -192,16 +193,23 @@ def run_pdp_inference(
192193

193194
db_inst_name = databricksify_inst_name(req.inst_name)
194195

196+
if db_inst_name in ["synthetic_2", "synthetic_uni_2"]:
197+
db_job_name = PDP_H2O_INFERENCE_JOB_NAME
198+
else:
199+
db_job_name = PDP_INFERENCE_JOB_NAME
200+
195201
try:
196-
job = next(w.jobs.list(name=PDP_INFERENCE_JOB_NAME), None)
202+
job = next(w.jobs.list(name=db_job_name), None)
197203
if not job or job.job_id is None:
198204
raise ValueError(
199-
f"run_pdp_inference(): Job '{PDP_INFERENCE_JOB_NAME}' was not found or has no job_id."
205+
f"run_pdp_inference(): Job '{db_job_name}' was not found or has no job_id."
200206
)
201207
job_id = job.job_id
202-
LOGGER.info(f"Resolved job ID for '{PDP_INFERENCE_JOB_NAME}': {job_id}")
208+
LOGGER.info(f"Resolved job ID for '{db_job_name}': {job_id}")
203209
except Exception as e:
204-
LOGGER.exception(f"Job lookup failed for '{PDP_INFERENCE_JOB_NAME}'.")
210+
LOGGER.exception(
211+
f"Job lookup failed for '{db_job_name}' and '{db_inst_name}."
212+
)
205213
raise ValueError(f"run_pdp_inference(): Failed to find job: {e}")
206214

207215
try:

0 commit comments

Comments
 (0)