chris-celerdata
diff --git a/‎datahub-upgrade/src/main/java/com/linkedin/datahub/upgrade/UpgradeCli.java‎
Lines changed: 11 additions & 0 deletions b/‎datahub-upgrade/src/main/java/com/linkedin/datahub/upgrade/UpgradeCli.java‎
Lines changed: 11 additions & 0 deletions
diff --git a/‎datahub-upgrade/src/main/java/com/linkedin/datahub/upgrade/UpgradeConfigurationSelector.java‎
Lines changed: 8 additions & 0 deletions b/‎datahub-upgrade/src/main/java/com/linkedin/datahub/upgrade/UpgradeConfigurationSelector.java‎
Lines changed: 8 additions & 0 deletions
diff --git a/‎datahub-upgrade/src/main/java/com/linkedin/datahub/upgrade/cleanup/Cleanup.java‎
Lines changed: 32 additions & 0 deletions b/‎datahub-upgrade/src/main/java/com/linkedin/datahub/upgrade/cleanup/Cleanup.java‎
Lines changed: 32 additions & 0 deletions
diff --git a/‎datahub-upgrade/src/main/java/com/linkedin/datahub/upgrade/cleanup/CleanupCondition.java‎
Lines changed: 28 additions & 0 deletions b/‎datahub-upgrade/src/main/java/com/linkedin/datahub/upgrade/cleanup/CleanupCondition.java‎
Lines changed: 28 additions & 0 deletions
diff --git a/‎datahub-upgrade/src/main/java/com/linkedin/datahub/upgrade/cleanup/CleanupUpgradeConfig.java‎
Lines changed: 105 additions & 0 deletions b/‎datahub-upgrade/src/main/java/com/linkedin/datahub/upgrade/cleanup/CleanupUpgradeConfig.java‎
Lines changed: 105 additions & 0 deletions
@@ -1,5 +1,6 @@
 package com.linkedin.datahub.upgrade;
 
+import com.linkedin.datahub.upgrade.cleanup.Cleanup;
 import com.linkedin.datahub.upgrade.impl.DefaultUpgradeManager;
 import com.linkedin.datahub.upgrade.loadindices.LoadIndices;
 import com.linkedin.datahub.upgrade.removeunknownaspects.RemoveUnknownAspects;
@@ -86,6 +87,10 @@ private static final class Args {
   @Named("reindexDebug")
   private ReindexDebug reindexDebug;
 
+  @Autowired(required = false)
+  @Named("cleanup")
+  private Cleanup cleanup;
+
   @Override
   public void run(String... cmdLineArgs) {
     // Register upgrades with null checks and warnings
@@ -149,6 +154,12 @@ public void run(String... cmdLineArgs) {
       log.info("ReindexDebug upgrade not available - bean not found");
     }
 
+    if (cleanup != null) {
+      _upgradeManager.register(cleanup);
+    } else {
+      log.info("Cleanup upgrade not available - bean not found");
+    }
+
     final Args args = new Args();
     new CommandLine(args).setCaseInsensitiveEnumValuesAllowed(true).parseArgs(cmdLineArgs);
 
 
@@ -1,5 +1,7 @@
 package com.linkedin.datahub.upgrade;
 
+import com.linkedin.datahub.upgrade.cleanup.CleanupCondition;
+import com.linkedin.datahub.upgrade.cleanup.CleanupUpgradeConfig;
 import com.linkedin.datahub.upgrade.conditions.GeneralUpgradeCondition;
 import com.linkedin.datahub.upgrade.conditions.LoadIndicesCondition;
 import com.linkedin.datahub.upgrade.conditions.SqlSetupCondition;
@@ -34,4 +36,10 @@ public static class SqlSetupConfiguration {}
   @Conditional(GeneralUpgradeCondition.class)
   @Import(GeneralUpgradeConfiguration.class)
   public static class GeneralConfiguration {}
+
+  /**
+   * Configuration for Cleanup upgrade - teardown of all DataHub infrastructure resources.
+   *
+   * <p>Only active when {@link CleanupCondition} matches; in that case it pulls in {@link
+   * CleanupUpgradeConfig} via {@code @Import}. The class itself is an empty marker and declares no
+   * beans of its own.
+   */
+  @Configuration
+  @Conditional(CleanupCondition.class)
+  @Import(CleanupUpgradeConfig.class)
+  public static class CleanupConfiguration {}
 }
@@ -0,0 +1,32 @@
+package com.linkedin.datahub.upgrade.cleanup;
+
+import com.linkedin.datahub.upgrade.Upgrade;
+import com.linkedin.datahub.upgrade.UpgradeStep;
+import java.util.List;
+
+/**
+ * Upgrade that tears down infrastructure resources created by DataHub setup jobs. Intended to run
+ * as a Helm pre-delete hook so that {@code helm uninstall} leaves no DataHub-specific state in
+ * shared infrastructure (Elasticsearch, Kafka, SQL).
+ *
+ * <p>This class neither orders nor filters steps: {@link #steps()} reports them exactly in the
+ * order they were supplied to the constructor. The intended order is Elasticsearch → Kafka → SQL,
+ * so that indices are not queried while the database is being dropped; whoever assembles the list
+ * is responsible for that ordering.
+ */
+public class Cleanup implements Upgrade {
+
+  /** Immutable snapshot of the steps, in execution order. */
+  private final List<UpgradeStep> steps;
+
+  /**
+   * Creates the upgrade from an already ordered list of steps.
+   *
+   * @param steps the steps to run, in execution order; may be empty, but must not be {@code null}
+   *     and must not contain {@code null} elements
+   * @throws NullPointerException if {@code steps} or any of its elements is {@code null}
+   */
+  public Cleanup(List<UpgradeStep> steps) {
+    // Defensive copy: later changes to the caller's list must not alter what this upgrade runs,
+    // and the list handed out by steps() must not be modifiable by consumers.
+    this.steps = List.copyOf(steps);
+  }
+
+  /**
+   * Returns the identifier of this upgrade.
+   *
+   * @return the constant {@code "Cleanup"}
+   */
+  @Override
+  public String id() {
+    return "Cleanup";
+  }
+
+  /**
+   * Returns the steps of this upgrade.
+   *
+   * @return an unmodifiable list of the steps, in the order given at construction time
+   */
+  @Override
+  public List<UpgradeStep> steps() {
+    return steps;
+  }
+}
@@ -0,0 +1,28 @@
+package com.linkedin.datahub.upgrade.cleanup;
+
+import java.util.List;
+import java.util.Objects;
+import java.util.Set;
+import org.springframework.boot.ApplicationArguments;
+import org.springframework.context.annotation.Condition;
+import org.springframework.context.annotation.ConditionContext;
+import org.springframework.core.type.AnnotatedTypeMetadata;
+
+/**
+ * Spring condition that matches when the CLI arguments contain {@code Cleanup}. This ensures the
+ * cleanup-specific Spring configuration is only loaded for the cleanup upgrade path.
+ */
+public class CleanupCondition implements Condition {
+  public static final String CLEANUP_ARG = "Cleanup";
+  public static final Set<String> CLEANUP_ARGS = Set.of(CLEANUP_ARG);
+
+  @Override
+  public boolean matches(ConditionContext context, AnnotatedTypeMetadata metadata) {
+    List<String> nonOptionArgs =
+        context.getBeanFactory().getBean(ApplicationArguments.class).getNonOptionArgs();
+    if (nonOptionArgs == null) {
+      return false;
+    }
+    return nonOptionArgs.stream().filter(Objects::nonNull).anyMatch(CLEANUP_ARGS::contains);
+  }
+}
@@ -0,0 +1,105 @@
+package com.linkedin.datahub.upgrade.cleanup;
+
+import com.linkedin.datahub.upgrade.UpgradeStep;
+import com.linkedin.datahub.upgrade.config.OpenTelemetryConfig;
+import com.linkedin.datahub.upgrade.sqlsetup.SqlSetupArgs;
+import com.linkedin.datahub.upgrade.sqlsetup.config.SqlSetupConfig;
+import com.linkedin.datahub.upgrade.sqlsetup.config.SqlSetupEbeanFactory;
+import com.linkedin.gms.factory.config.ConfigurationProvider;
+import com.linkedin.gms.factory.search.BaseElasticSearchComponentsFactory;
+import com.linkedin.metadata.config.kafka.KafkaConfiguration;
+import com.linkedin.metadata.utils.EnvironmentUtils;
+import io.ebean.Database;
+import java.util.ArrayList;
+import java.util.List;
+import javax.annotation.Nonnull;
+import lombok.extern.slf4j.Slf4j;
+import org.springframework.beans.factory.annotation.Autowired;
+import org.springframework.beans.factory.annotation.Qualifier;
+import org.springframework.boot.actuate.autoconfigure.metrics.MetricsAutoConfiguration;
+import org.springframework.boot.autoconfigure.kafka.KafkaProperties;
+import org.springframework.context.annotation.Bean;
+import org.springframework.context.annotation.ComponentScan;
+import org.springframework.context.annotation.Configuration;
+import org.springframework.context.annotation.Import;
+
+/**
+ * Spring wiring for the {@link Cleanup} upgrade. Imports the metrics, telemetry and SQL setup
+ * configuration and scans the listed factory packages, then assembles the teardown steps for
+ * Elasticsearch indices, Kafka topics and the SQL database from whichever collaborators could be
+ * injected.
+ */
+@Slf4j
+@Configuration
+@Import({
+  MetricsAutoConfiguration.class,
+  OpenTelemetryConfig.class,
+  SqlSetupConfig.class,
+  SqlSetupEbeanFactory.class
+})
+@ComponentScan(
+    basePackages = {
+      "com.linkedin.gms.factory.config",
+      "com.linkedin.gms.factory.common",
+      "com.linkedin.gms.factory.entity",
+      "com.linkedin.gms.factory.entityclient",
+      "com.linkedin.gms.factory.plugins",
+      "com.linkedin.gms.factory.entityregistry",
+      "com.linkedin.gms.factory.search",
+      "com.linkedin.gms.factory.timeseries",
+      "com.linkedin.gms.factory.context",
+      "com.linkedin.gms.factory.system_telemetry"
+    })
+public class CleanupUpgradeConfig {
+
+  // Every collaborator is optional: a missing bean leaves the field null and the matching
+  // cleanup step is skipped with a warning rather than failing context startup.
+
+  @Autowired(required = false)
+  private BaseElasticSearchComponentsFactory.BaseElasticSearchComponents esComponents;
+
+  @Autowired(required = false)
+  private ConfigurationProvider configurationProvider;
+
+  @Autowired(required = false)
+  private KafkaProperties kafkaProperties;
+
+  @Autowired(required = false)
+  @Qualifier("ebeanServer")
+  private Database ebeanServer;
+
+  @Autowired(required = false)
+  @Qualifier("sqlSetupArgs")
+  private SqlSetupArgs sqlSetupArgs;
+
+  /**
+   * Builds the {@code cleanup} bean.
+   *
+   * <p>Each backend is toggled by an environment flag ({@code CLEANUP_ELASTICSEARCH_ENABLED},
+   * {@code CLEANUP_KAFKA_ENABLED}, {@code CLEANUP_SQL_ENABLED}), all defaulting to {@code true}. A
+   * step is added only when its flag is on and its collaborators were injected; when the flag is
+   * on but a collaborator is missing, a warning is logged and the step is left out.
+   *
+   * @return the cleanup upgrade holding the enabled steps in the order Elasticsearch, Kafka, SQL
+   */
+  @Bean(name = "cleanup")
+  @Nonnull
+  public Cleanup createCleanup() {
+    boolean cleanElasticsearch =
+        EnvironmentUtils.getBoolean("CLEANUP_ELASTICSEARCH_ENABLED", true);
+    boolean cleanKafka = EnvironmentUtils.getBoolean("CLEANUP_KAFKA_ENABLED", true);
+    boolean cleanSql = EnvironmentUtils.getBoolean("CLEANUP_SQL_ENABLED", true);
+
+    List<UpgradeStep> cleanupSteps = new ArrayList<>();
+
+    // Elasticsearch goes first so indices are not queried while the database is being dropped.
+    if (cleanElasticsearch) {
+      if (esComponents != null) {
+        cleanupSteps.add(new DeleteElasticsearchIndicesStep(esComponents));
+        log.info("Elasticsearch cleanup step enabled");
+      } else {
+        log.warn("Elasticsearch cleanup requested but ES components not available — skipping");
+      }
+    }
+
+    // The Kafka configuration is resolved regardless of the flag, as before.
+    KafkaConfiguration kafkaSettings;
+    if (configurationProvider != null) {
+      kafkaSettings = configurationProvider.getKafka();
+    } else {
+      kafkaSettings = null;
+    }
+    if (cleanKafka) {
+      if (kafkaSettings != null && kafkaProperties != null) {
+        cleanupSteps.add(new DeleteKafkaTopicsStep(kafkaSettings, kafkaProperties));
+        log.info("Kafka cleanup step enabled");
+      } else {
+        log.warn("Kafka cleanup requested but Kafka config not available — skipping");
+      }
+    }
+
+    // SQL is last: dropping the database is the final teardown action.
+    if (cleanSql) {
+      if (ebeanServer != null && sqlSetupArgs != null) {
+        cleanupSteps.add(new DropDatabaseStep(ebeanServer, sqlSetupArgs));
+        log.info("SQL cleanup step enabled");
+      } else {
+        log.warn("SQL cleanup requested but database not available — skipping");
+      }
+    }
+
+    return new Cleanup(cleanupSteps);
+  }
+}