apache
diff --git a/‎.github/workflows/pr_build_linux.yml‎
Lines changed: 9 additions & 3 deletions b/‎.github/workflows/pr_build_linux.yml‎
Lines changed: 9 additions & 3 deletions
diff --git a/‎.github/workflows/pr_build_macos.yml‎
Lines changed: 6 additions & 0 deletions b/‎.github/workflows/pr_build_macos.yml‎
Lines changed: 6 additions & 0 deletions
diff --git a/‎docs/source/contributor-guide/spark_expressions_support.md‎
Lines changed: 1 addition & 1 deletion b/‎docs/source/contributor-guide/spark_expressions_support.md‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎native/spark-expr/src/comet_scalar_funcs.rs‎
Lines changed: 2 additions & 1 deletion b/‎native/spark-expr/src/comet_scalar_funcs.rs‎
Lines changed: 2 additions & 1 deletion
diff --git a/‎native/spark-expr/src/datetime_funcs/mod.rs‎
Lines changed: 2 additions & 0 deletions b/‎native/spark-expr/src/datetime_funcs/mod.rs‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎native/spark-expr/src/datetime_funcs/seconds_to_timestamp.rs‎
Lines changed: 192 additions & 0 deletions b/‎native/spark-expr/src/datetime_funcs/seconds_to_timestamp.rs‎
Lines changed: 192 additions & 0 deletions
diff --git a/‎native/spark-expr/src/lib.rs‎
Lines changed: 2 additions & 1 deletion b/‎native/spark-expr/src/lib.rs‎
Lines changed: 2 additions & 1 deletion
diff --git a/‎spark/pom.xml‎
Lines changed: 22 additions & 1 deletion b/‎spark/pom.xml‎
Lines changed: 22 additions & 1 deletion
diff --git a/‎spark/src/main/scala/org/apache/comet/CometSparkSessionExtensions.scala‎
Lines changed: 4 additions & 0 deletions b/‎spark/src/main/scala/org/apache/comet/CometSparkSessionExtensions.scala‎
Lines changed: 4 additions & 0 deletions
diff --git a/‎spark/src/main/scala/org/apache/comet/serde/QueryPlanSerde.scala‎
Lines changed: 1 addition & 0 deletions b/‎spark/src/main/scala/org/apache/comet/serde/QueryPlanSerde.scala‎
Lines changed: 1 addition & 0 deletions
@@ -97,9 +97,10 @@ jobs:
           - name: "Spark 4.0, JDK 21"
             java_version: "21"
             maven_opts: "-Pspark-4.0"
-          # Spark 4.1 is intentionally absent: the lint job invokes -Psemanticdb,
-          # but semanticdb-scalac_2.13.17 is not yet published, so we cannot
-          # currently run scalafix against the spark-4.1 profile.
+          # Spark 4.1 and 4.2 are intentionally absent: the lint job invokes -Psemanticdb,
+          # but semanticdb-scalac for those Scala patch versions (2.13.17 / 2.13.18) is not
+          # yet published, so we cannot currently run scalafix against the spark-4.1 or
+          # spark-4.2 profiles.
       fail-fast: false
     steps:
       - uses: runs-on/action@742bf56072eb4845a0f94b3394673e4903c90ff0  # v2.1.0
@@ -305,6 +306,11 @@ jobs:
             java_version: "17"
             maven_opts: "-Pspark-4.1"
             scan_impl: "auto"
+
+          - name: "Spark 4.2, JDK 17"
+            java_version: "17"
+            maven_opts: "-Pspark-4.2"
+            scan_impl: "auto"
         suite:
           - name: "fuzz"
             value: |
 
@@ -144,6 +144,12 @@ jobs:
             # runtime; the scala-2.13 profile would override it back to 2.13.16 and break.
             maven_opts: "-Pspark-4.1"
 
+          - name: "Spark 4.2, JDK 17, Scala 2.13"
+            java_version: "17"
+            # The spark-4.2 profile pins Scala to 2.13.18 to match Spark 4.2.0-preview4's
+            # runtime; the scala-2.13 profile would override it back to 2.13.16 and break.
+            maven_opts: "-Pspark-4.2"
+
         suite:
           - name: "fuzz"
             value: |
 
@@ -210,7 +210,7 @@
 - [ ] second
 - [ ] timestamp_micros
 - [ ] timestamp_millis
-- [ ] timestamp_seconds
+- [x] timestamp_seconds
 - [ ] to_date
 - [ ] to_timestamp
 - [ ] to_timestamp_ltz
 
@@ -26,7 +26,7 @@ use crate::{
     spark_lpad, spark_make_decimal, spark_read_side_padding, spark_round, spark_rpad, spark_unhex,
     spark_unscaled_value, EvalMode, SparkArrayCompact, SparkArrayPositionFunc, SparkArraysOverlap,
     SparkContains, SparkDateDiff, SparkDateFromUnixDate, SparkDateTrunc, SparkMakeDate,
-    SparkSizeFunc,
+    SparkSecondsToTimestamp, SparkSizeFunc,
 };
 use arrow::datatypes::DataType;
 use datafusion::common::{DataFusionError, Result as DataFusionResult};
@@ -218,6 +218,7 @@ fn all_scalar_functions() -> Vec<Arc<ScalarUDF>> {
         Arc::new(ScalarUDF::new_from_impl(SparkDateFromUnixDate::default())),
         Arc::new(ScalarUDF::new_from_impl(SparkDateTrunc::default())),
         Arc::new(ScalarUDF::new_from_impl(SparkMakeDate::default())),
+        Arc::new(ScalarUDF::new_from_impl(SparkSecondsToTimestamp::default())),
         Arc::new(ScalarUDF::new_from_impl(SparkSizeFunc::default())),
     ]
 }
 
@@ -21,6 +21,7 @@ mod date_trunc;
 mod extract_date_part;
 mod hours;
 mod make_date;
+mod seconds_to_timestamp;
 mod timestamp_trunc;
 mod unix_timestamp;
 
@@ -32,5 +33,6 @@ pub use extract_date_part::SparkMinute;
 pub use extract_date_part::SparkSecond;
 pub use hours::SparkHoursTransform;
 pub use make_date::SparkMakeDate;
+pub use seconds_to_timestamp::SparkSecondsToTimestamp;
 pub use timestamp_trunc::TimestampTruncExpr;
 pub use unix_timestamp::SparkUnixTimestamp;
@@ -0,0 +1,192 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use arrow::array::{
+    Array, Float32Array, Float64Array, Int32Array, Int64Array, TimestampMicrosecondArray,
+};
+use arrow::compute::try_unary;
+use arrow::datatypes::{DataType, TimeUnit};
+use datafusion::common::{utils::take_function_args, DataFusionError, Result, ScalarValue};
+use datafusion::logical_expr::{
+    ColumnarValue, ScalarFunctionArgs, ScalarUDFImpl, Signature, TypeSignature, Volatility,
+};
+use std::any::Any;
+use std::sync::Arc;
+
+/// Number of microseconds in one second; the factor used to scale an input
+/// expressed in seconds into a microsecond timestamp value.
+const MICROS_PER_SECOND: i64 = 1_000_000;
+
+/// Spark-compatible `seconds_to_timestamp` (`timestamp_seconds`) function.
+///
+/// Converts seconds since the Unix epoch to a microsecond-precision timestamp.
+#[derive(Debug, PartialEq, Eq, Hash)]
+pub struct SparkSecondsToTimestamp {
+    /// Argument types accepted by the function; built in `new`.
+    signature: Signature,
+    /// Alternative names reported through `ScalarUDFImpl::aliases`.
+    aliases: Vec<String>,
+}
+
+impl SparkSecondsToTimestamp {
+    /// Creates the UDF with a signature that accepts exactly one `Int32`,
+    /// `Int64`, `Float32` or `Float64` argument, plus the `timestamp_seconds`
+    /// alias.
+    pub fn new() -> Self {
+        let accepted_inputs = [
+            DataType::Int32,
+            DataType::Int64,
+            DataType::Float32,
+            DataType::Float64,
+        ];
+        // One `Exact` single-argument variant per accepted input type.
+        let variants: Vec<TypeSignature> = accepted_inputs
+            .into_iter()
+            .map(|input| TypeSignature::Exact(vec![input]))
+            .collect();
+
+        Self {
+            signature: Signature::one_of(variants, Volatility::Immutable),
+            aliases: vec![String::from("timestamp_seconds")],
+        }
+    }
+}
+
+impl Default for SparkSecondsToTimestamp {
+    /// Equivalent to [`SparkSecondsToTimestamp::new`].
+    fn default() -> Self {
+        Self::new()
+    }
+}
+
+/// Converts fractional seconds since the Unix epoch to whole microseconds.
+///
+/// Returns `None` for NaN and positive/negative infinity. Finite values are
+/// scaled by [`MICROS_PER_SECOND`] and converted with `as i64`, which truncates
+/// toward zero and saturates at the `i64` bounds.
+fn float_seconds_to_micros(seconds: f64) -> Option<i64> {
+    seconds
+        .is_finite()
+        .then(|| (seconds * (MICROS_PER_SECOND as f64)) as i64)
+}
+
+/// Converts whole seconds since the Unix epoch to microseconds.
+///
+/// # Errors
+///
+/// Returns a `ComputeError("long overflow")` when the product does not fit in
+/// an `i64`, mirroring the message of Java's `Math.multiplyExact`.
+fn int_seconds_to_micros(seconds: i64) -> std::result::Result<i64, arrow::error::ArrowError> {
+    seconds
+        .checked_mul(MICROS_PER_SECOND)
+        .ok_or_else(|| arrow::error::ArrowError::ComputeError("long overflow".to_string()))
+}
+
+impl ScalarUDFImpl for SparkSecondsToTimestamp {
+    fn as_any(&self) -> &dyn Any {
+        self
+    }
+
+    /// Primary name of the function; `timestamp_seconds` is exposed via
+    /// [`Self::aliases`].
+    fn name(&self) -> &str {
+        "seconds_to_timestamp"
+    }
+
+    fn signature(&self) -> &Signature {
+        &self.signature
+    }
+
+    /// Always a microsecond timestamp with no time zone attached, regardless
+    /// of the argument type.
+    fn return_type(&self, _: &[DataType]) -> Result<DataType> {
+        Ok(DataType::Timestamp(TimeUnit::Microsecond, None))
+    }
+
+    /// Converts the single `seconds` argument to microseconds since the epoch.
+    ///
+    /// * `Int32` — widened to `i64` and multiplied; cannot overflow.
+    /// * `Int64` — checked multiplication; overflow is an error.
+    /// * `Float32` / `Float64` — NaN and infinities become null; other values
+    ///   are scaled and truncated (see [`float_seconds_to_micros`]).
+    ///
+    /// Null inputs produce null outputs.
+    ///
+    /// # Errors
+    ///
+    /// Fails when the argument count is not exactly one, when the input has an
+    /// unsupported type, or when an `Int64` value overflows.
+    fn invoke_with_args(&self, args: ScalarFunctionArgs) -> Result<ColumnarValue> {
+        let [seconds] = take_function_args(self.name(), args.args)?;
+
+        match seconds {
+            ColumnarValue::Array(arr) => {
+                let values = arr.as_any();
+                let result: TimestampMicrosecondArray =
+                    if let Some(ints) = values.downcast_ref::<Int32Array>() {
+                        // No overflow possible: i32 * 1_000_000 always fits in i64.
+                        try_unary(ints, |s| Ok((s as i64) * MICROS_PER_SECOND))?
+                    } else if let Some(ints) = values.downcast_ref::<Int64Array>() {
+                        // Error on overflow to match Spark's Math.multiplyExact.
+                        try_unary(ints, int_seconds_to_micros)?
+                    } else if let Some(floats) = values.downcast_ref::<Float32Array>() {
+                        // Widen to f64 first so both float widths share one conversion.
+                        floats
+                            .iter()
+                            .map(|opt| opt.and_then(|s| float_seconds_to_micros(s as f64)))
+                            .collect()
+                    } else if let Some(floats) = values.downcast_ref::<Float64Array>() {
+                        floats
+                            .iter()
+                            .map(|opt| opt.and_then(float_seconds_to_micros))
+                            .collect()
+                    } else {
+                        return Err(DataFusionError::Execution(format!(
+                            "seconds_to_timestamp expects Int32, Int64, Float32 or Float64 input, got {:?}",
+                            arr.data_type()
+                        )));
+                    };
+                Ok(ColumnarValue::Array(Arc::new(result)))
+            }
+            ColumnarValue::Scalar(scalar) => {
+                let ts_micros = match &scalar {
+                    ScalarValue::Int32(Some(s)) => Some((*s as i64) * MICROS_PER_SECOND),
+                    ScalarValue::Int64(Some(s)) => Some(
+                        int_seconds_to_micros(*s)
+                            .map_err(|e| DataFusionError::ArrowError(Box::new(e), None))?,
+                    ),
+                    ScalarValue::Float32(Some(s)) => float_seconds_to_micros(*s as f64),
+                    ScalarValue::Float64(Some(s)) => float_seconds_to_micros(*s),
+                    // Typed or untyped nulls map to a null timestamp.
+                    ScalarValue::Int32(None)
+                    | ScalarValue::Int64(None)
+                    | ScalarValue::Float32(None)
+                    | ScalarValue::Float64(None)
+                    | ScalarValue::Null => None,
+                    _ => {
+                        return Err(DataFusionError::Execution(format!(
+                            "seconds_to_timestamp expects numeric scalar input, got {:?}",
+                            scalar.data_type()
+                        )))
+                    }
+                };
+                Ok(ColumnarValue::Scalar(ScalarValue::TimestampMicrosecond(
+                    ts_micros, None,
+                )))
+            }
+        }
+    }
+
+    fn aliases(&self) -> &[String] {
+        &self.aliases
+    }
+}
@@ -74,7 +74,8 @@ pub use comet_scalar_funcs::{
 pub use csv_funcs::*;
 pub use datetime_funcs::{
     SparkDateDiff, SparkDateFromUnixDate, SparkDateTrunc, SparkHour, SparkHoursTransform,
-    SparkMakeDate, SparkMinute, SparkSecond, SparkUnixTimestamp, TimestampTruncExpr,
+    SparkMakeDate, SparkMinute, SparkSecond, SparkSecondsToTimestamp, SparkUnixTimestamp,
+    TimestampTruncExpr,
 };
 pub use error::{decimal_overflow_error, SparkError, SparkErrorWithContext, SparkResult};
 pub use hash_funcs::*;
 
@@ -300,7 +300,28 @@ under the License.
     </profile>
     <profile>
       <id>spark-4.2</id>
-      <!-- 4.2 preview profile is build-only; no Iceberg or Jetty test dependencies are wired up. -->
+      <dependencies>
+        <!-- iceberg-spark-runtime-4.2 is not yet published; reuse the 4.0 runtime -->
+        <dependency>
+          <groupId>org.apache.iceberg</groupId>
+          <artifactId>iceberg-spark-runtime-4.0_${scala.binary.version}</artifactId>
+          <version>1.10.0</version>
+          <scope>test</scope>
+        </dependency>
+        <!-- Jetty 11.x for Spark 4.2 (jakarta.servlet); matches Spark 4.2.0-preview4's jetty.version -->
+        <dependency>
+          <groupId>org.eclipse.jetty</groupId>
+          <artifactId>jetty-server</artifactId>
+          <version>11.0.26</version>
+          <scope>test</scope>
+        </dependency>
+        <dependency>
+          <groupId>org.eclipse.jetty</groupId>
+          <artifactId>jetty-servlet</artifactId>
+          <version>11.0.26</version>
+          <scope>test</scope>
+        </dependency>
+      </dependencies>
     </profile>
     <profile>
       <id>generate-docs</id>
 
@@ -169,6 +169,10 @@ object CometSparkSessionExtensions extends Logging {
     org.apache.spark.SPARK_VERSION >= "4.1"
   }
 
+  /**
+   * Whether the running Spark version string compares at or above "4.2".
+   *
+   * NOTE(review): this is a lexicographic string comparison, so a two-digit minor version such
+   * as "4.10" would compare below "4.2" -- confirm this is acceptable before such a release.
+   */
+  def isSpark42Plus: Boolean = {
+    org.apache.spark.SPARK_VERSION >= "4.2"
+  }
+
   /**
    * Whether we should override Spark memory configuration for Comet. This only returns true when
    * Comet native execution is enabled and/or Comet shuffle is enabled and Comet doesn't use
 
@@ -219,6 +219,7 @@ object QueryPlanSerde extends Logging with CometExprShim with CometTypeShim {
       classOf[Minute] -> CometMinute,
       classOf[NextDay] -> CometNextDay,
       classOf[Second] -> CometSecond,
+      classOf[SecondsToTimestamp] -> CometSecondsToTimestamp,
       classOf[TruncDate] -> CometTruncDate,
       classOf[TruncTimestamp] -> CometTruncTimestamp,
       classOf[UnixTimestamp] -> CometUnixTimestamp,