diff --git a/fuzz-testing/src/main/scala/org/apache/comet/fuzz/DataGen.scala b/fuzz-testing/src/main/scala/org/apache/comet/fuzz/DataGen.scala index aec46a9d8..0c746e7b2 100644 --- a/fuzz-testing/src/main/scala/org/apache/comet/fuzz/DataGen.scala +++ b/fuzz-testing/src/main/scala/org/apache/comet/fuzz/DataGen.scala @@ -134,8 +134,12 @@ object DataGen { }) case DataTypes.BinaryType => generateColumn(r, DataTypes.StringType, numRows) - .filterNot(_ == null) - .map(_.asInstanceOf[String].getBytes(Charset.defaultCharset())) + .map { + case x: String => + x.getBytes(Charset.defaultCharset()) + case _ => + null + } case DataTypes.DateType => Range(0, numRows).map(_ => new java.sql.Date(1716645600011L + r.nextInt())) case DataTypes.TimestampType | DataTypes.TimestampNTZType => diff --git a/fuzz-testing/src/main/scala/org/apache/comet/fuzz/Meta.scala b/fuzz-testing/src/main/scala/org/apache/comet/fuzz/Meta.scala index 335961404..e585aed69 100644 --- a/fuzz-testing/src/main/scala/org/apache/comet/fuzz/Meta.scala +++ b/fuzz-testing/src/main/scala/org/apache/comet/fuzz/Meta.scala @@ -25,19 +25,20 @@ import org.apache.spark.sql.types.DataTypes object Meta { val dataTypes: Seq[(DataType, Double)] = Seq( - (DataTypes.BooleanType, 0.2), + // (DataTypes.BooleanType, 0.2), (DataTypes.ByteType, 0.2), (DataTypes.ShortType, 0.2), (DataTypes.IntegerType, 0.2), (DataTypes.LongType, 0.2), (DataTypes.FloatType, 0.2), (DataTypes.DoubleType, 0.2), - (DataTypes.createDecimalType(10, 2), 0.2), + // (DataTypes.createDecimalType(10, 2), 0.2), (DataTypes.DateType, 0.2), (DataTypes.TimestampType, 0.2), - (DataTypes.TimestampNTZType, 0.2), - (DataTypes.StringType, 0.2), - (DataTypes.BinaryType, 0.2)) + // (DataTypes.TimestampNTZType, 0.2), + (DataTypes.StringType, 0.2) + // (DataTypes.BinaryType, 0.2) + ) val stringScalarFunc: Seq[Function] = Seq( Function("substring", 3),