You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
Describe the bug
When running a crossJoin that is executed with BroadcastNestedLoopJoin, the query fails with a NullPointerException (NPE).
Here is the stack trace:
src/main/python/cache_test.py::test_cache_broadcast_nested_loop_join[Left-String] 20/07/14 21:34:47 ERROR Executor: Exception in task 5.0 in stage 8.0 (TID 90)
java.lang.NullPointerException
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.readObject(GpuBroadcastExchangeExec.scala:90)
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.batch(GpuBroadcastExchangeExec.scala:63)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$2(GpuBroadcastNestedLoopJoinExec.scala:204)
at com.nvidia.spark.rapids.Arm.withResource(Arm.scala:26)
at com.nvidia.spark.rapids.Arm.withResource$(Arm.scala:24)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.withResource(GpuBroadcastNestedLoopJoinExec.scala:130)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$lzycompute$1(GpuBroadcastNestedLoopJoinExec.scala:203)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$2(GpuBroadcastNestedLoopJoinExec.scala:202)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$4(GpuBroadcastNestedLoopJoinExec.scala:218)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2(RDD.scala:837)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2$adapted(RDD.scala:837)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.shuffle.ShuffleWriteProcessor.write(ShuffleWriteProcessor.scala:59)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:99)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:52)
at org.apache.spark.scheduler.Task.run(Task.scala:127)
at org.apache.spark.executor.Executor$TaskRunner.$anonfun$run$3(Executor.scala:444)
at org.apache.spark.util.Utils$.tryWithSafeFinally(Utils.scala:1377)
at org.apache.spark.executor.Executor$TaskRunner.run(Executor.scala:447)
at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149)
at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624)
at java.lang.Thread.run(Thread.java:748)
20/07/14 21:34:47 ERROR Executor: Exception in task 4.0 in stage 8.0 (TID 89)
java.lang.NullPointerException
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.readObject(GpuBroadcastExchangeExec.scala:90)
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.batch(GpuBroadcastExchangeExec.scala:63)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$2(GpuBroadcastNestedLoopJoinExec.scala:204)
at com.nvidia.spark.rapids.Arm.withResource(Arm.scala:26)
at com.nvidia.spark.rapids.Arm.withResource$(Arm.scala:24)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.withResource(GpuBroadcastNestedLoopJoinExec.scala:130)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$lzycompute$1(GpuBroadcastNestedLoopJoinExec.scala:203)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$2(GpuBroadcastNestedLoopJoinExec.scala:202)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$4(GpuBroadcastNestedLoopJoinExec.scala:218)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2(RDD.scala:837)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2$adapted(RDD.scala:837)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.shuffle.ShuffleWriteProcessor.write(ShuffleWriteProcessor.scala:59)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:99)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:52)
at org.apache.spark.scheduler.Task.run(Task.scala:127)
at org.apache.spark.executor.Executor$TaskRunner.$anonfun$run$3(Executor.scala:444)
at org.apache.spark.util.Utils$.tryWithSafeFinally(Utils.scala:1377)
at org.apache.spark.executor.Executor$TaskRunner.run(Executor.scala:447)
at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149)
at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624)
at java.lang.Thread.run(Thread.java:748)
20/07/14 21:34:47 ERROR Executor: Exception in task 6.0 in stage 8.0 (TID 91)
java.lang.NullPointerException
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.readObject(GpuBroadcastExchangeExec.scala:90)
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.batch(GpuBroadcastExchangeExec.scala:63)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$2(GpuBroadcastNestedLoopJoinExec.scala:204)
at com.nvidia.spark.rapids.Arm.withResource(Arm.scala:26)
at com.nvidia.spark.rapids.Arm.withResource$(Arm.scala:24)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.withResource(GpuBroadcastNestedLoopJoinExec.scala:130)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$lzycompute$1(GpuBroadcastNestedLoopJoinExec.scala:203)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$2(GpuBroadcastNestedLoopJoinExec.scala:202)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$4(GpuBroadcastNestedLoopJoinExec.scala:218)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2(RDD.scala:837)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2$adapted(RDD.scala:837)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.shuffle.ShuffleWriteProcessor.write(ShuffleWriteProcessor.scala:59)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:99)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:52)
at org.apache.spark.scheduler.Task.run(Task.scala:127)
at org.apache.spark.executor.Executor$TaskRunner.$anonfun$run$3(Executor.scala:444)
at org.apache.spark.util.Utils$.tryWithSafeFinally(Utils.scala:1377)
at org.apache.spark.executor.Executor$TaskRunner.run(Executor.scala:447)
at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149)
at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624)
at java.lang.Thread.run(Thread.java:748)
20/07/14 21:34:47 ERROR Executor: Exception in task 9.0 in stage 8.0 (TID 94)
java.lang.NullPointerException
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.readObject(GpuBroadcastExchangeExec.scala:90)
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.batch(GpuBroadcastExchangeExec.scala:63)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$2(GpuBroadcastNestedLoopJoinExec.scala:204)
at com.nvidia.spark.rapids.Arm.withResource(Arm.scala:26)
at com.nvidia.spark.rapids.Arm.withResource$(Arm.scala:24)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.withResource(GpuBroadcastNestedLoopJoinExec.scala:130)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$lzycompute$1(GpuBroadcastNestedLoopJoinExec.scala:203)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$2(GpuBroadcastNestedLoopJoinExec.scala:202)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$4(GpuBroadcastNestedLoopJoinExec.scala:218)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2(RDD.scala:837)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2$adapted(RDD.scala:837)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.shuffle.ShuffleWriteProcessor.write(ShuffleWriteProcessor.scala:59)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:99)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:52)
at org.apache.spark.scheduler.Task.run(Task.scala:127)
at org.apache.spark.executor.Executor$TaskRunner.$anonfun$run$3(Executor.scala:444)
at org.apache.spark.util.Utils$.tryWithSafeFinally(Utils.scala:1377)
at org.apache.spark.executor.Executor$TaskRunner.run(Executor.scala:447)
at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149)
at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624)
at java.lang.Thread.run(Thread.java:748)
20/07/14 21:34:47 ERROR Executor: Exception in task 3.0 in stage 8.0 (TID 88)
java.lang.NullPointerException
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.readObject(GpuBroadcastExchangeExec.scala:90)
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.batch(GpuBroadcastExchangeExec.scala:63)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$2(GpuBroadcastNestedLoopJoinExec.scala:204)
at com.nvidia.spark.rapids.Arm.withResource(Arm.scala:26)
at com.nvidia.spark.rapids.Arm.withResource$(Arm.scala:24)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.withResource(GpuBroadcastNestedLoopJoinExec.scala:130)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$lzycompute$1(GpuBroadcastNestedLoopJoinExec.scala:203)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$2(GpuBroadcastNestedLoopJoinExec.scala:202)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$4(GpuBroadcastNestedLoopJoinExec.scala:218)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2(RDD.scala:837)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2$adapted(RDD.scala:837)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.shuffle.ShuffleWriteProcessor.write(ShuffleWriteProcessor.scala:59)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:99)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:52)
at org.apache.spark.scheduler.Task.run(Task.scala:127)
at org.apache.spark.executor.Executor$TaskRunner.$anonfun$run$3(Executor.scala:444)
at org.apache.spark.util.Utils$.tryWithSafeFinally(Utils.scala:1377)
at org.apache.spark.executor.Executor$TaskRunner.run(Executor.scala:447)
at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149)
at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624)
at java.lang.Thread.run(Thread.java:748)
20/07/14 21:34:47 ERROR Executor: Exception in task 1.0 in stage 8.0 (TID 86)
java.lang.NullPointerException
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.readObject(GpuBroadcastExchangeExec.scala:90)
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.batch(GpuBroadcastExchangeExec.scala:63)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$2(GpuBroadcastNestedLoopJoinExec.scala:204)
at com.nvidia.spark.rapids.Arm.withResource(Arm.scala:26)
at com.nvidia.spark.rapids.Arm.withResource$(Arm.scala:24)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.withResource(GpuBroadcastNestedLoopJoinExec.scala:130)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$lzycompute$1(GpuBroadcastNestedLoopJoinExec.scala:203)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$2(GpuBroadcastNestedLoopJoinExec.scala:202)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$4(GpuBroadcastNestedLoopJoinExec.scala:218)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2(RDD.scala:837)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2$adapted(RDD.scala:837)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.shuffle.ShuffleWriteProcessor.write(ShuffleWriteProcessor.scala:59)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:99)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:52)
at org.apache.spark.scheduler.Task.run(Task.scala:127)
at org.apache.spark.executor.Executor$TaskRunner.$anonfun$run$3(Executor.scala:444)
at org.apache.spark.util.Utils$.tryWithSafeFinally(Utils.scala:1377)
at org.apache.spark.executor.Executor$TaskRunner.run(Executor.scala:447)
at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149)
at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624)
at java.lang.Thread.run(Thread.java:748)
20/07/14 21:34:47 ERROR Executor: Exception in task 10.0 in stage 8.0 (TID 95)
java.lang.NullPointerException
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.readObject(GpuBroadcastExchangeExec.scala:90)
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.batch(GpuBroadcastExchangeExec.scala:63)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$2(GpuBroadcastNestedLoopJoinExec.scala:204)
at com.nvidia.spark.rapids.Arm.withResource(Arm.scala:26)
at com.nvidia.spark.rapids.Arm.withResource$(Arm.scala:24)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.withResource(GpuBroadcastNestedLoopJoinExec.scala:130)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$lzycompute$1(GpuBroadcastNestedLoopJoinExec.scala:203)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$2(GpuBroadcastNestedLoopJoinExec.scala:202)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$4(GpuBroadcastNestedLoopJoinExec.scala:218)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2(RDD.scala:837)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2$adapted(RDD.scala:837)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.shuffle.ShuffleWriteProcessor.write(ShuffleWriteProcessor.scala:59)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:99)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:52)
at org.apache.spark.scheduler.Task.run(Task.scala:127)
at org.apache.spark.executor.Executor$TaskRunner.$anonfun$run$3(Executor.scala:444)
at org.apache.spark.util.Utils$.tryWithSafeFinally(Utils.scala:1377)
at org.apache.spark.executor.Executor$TaskRunner.run(Executor.scala:447)
at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149)
at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624)
at java.lang.Thread.run(Thread.java:748)
20/07/14 21:34:47 ERROR Executor: Exception in task 11.0 in stage 8.0 (TID 96)
java.lang.NullPointerException
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.readObject(GpuBroadcastExchangeExec.scala:90)
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.batch(GpuBroadcastExchangeExec.scala:63)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$2(GpuBroadcastNestedLoopJoinExec.scala:204)
at com.nvidia.spark.rapids.Arm.withResource(Arm.scala:26)
at com.nvidia.spark.rapids.Arm.withResource$(Arm.scala:24)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.withResource(GpuBroadcastNestedLoopJoinExec.scala:130)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$lzycompute$1(GpuBroadcastNestedLoopJoinExec.scala:203)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$2(GpuBroadcastNestedLoopJoinExec.scala:202)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$4(GpuBroadcastNestedLoopJoinExec.scala:218)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2(RDD.scala:837)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2$adapted(RDD.scala:837)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.shuffle.ShuffleWriteProcessor.write(ShuffleWriteProcessor.scala:59)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:99)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:52)
at org.apache.spark.scheduler.Task.run(Task.scala:127)
at org.apache.spark.executor.Executor$TaskRunner.$anonfun$run$3(Executor.scala:444)
at org.apache.spark.util.Utils$.tryWithSafeFinally(Utils.scala:1377)
at org.apache.spark.executor.Executor$TaskRunner.run(Executor.scala:447)
at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149)
at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624)
at java.lang.Thread.run(Thread.java:748)
20/07/14 21:34:47 ERROR Executor: Exception in task 2.0 in stage 8.0 (TID 87)
java.lang.NullPointerException
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.readObject(GpuBroadcastExchangeExec.scala:90)
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.batch(GpuBroadcastExchangeExec.scala:63)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$2(GpuBroadcastNestedLoopJoinExec.scala:204)
at com.nvidia.spark.rapids.Arm.withResource(Arm.scala:26)
at com.nvidia.spark.rapids.Arm.withResource$(Arm.scala:24)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.withResource(GpuBroadcastNestedLoopJoinExec.scala:130)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$lzycompute$1(GpuBroadcastNestedLoopJoinExec.scala:203)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$2(GpuBroadcastNestedLoopJoinExec.scala:202)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$4(GpuBroadcastNestedLoopJoinExec.scala:218)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2(RDD.scala:837)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2$adapted(RDD.scala:837)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.shuffle.ShuffleWriteProcessor.write(ShuffleWriteProcessor.scala:59)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:99)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:52)
at org.apache.spark.scheduler.Task.run(Task.scala:127)
at org.apache.spark.executor.Executor$TaskRunner.$anonfun$run$3(Executor.scala:444)
at org.apache.spark.util.Utils$.tryWithSafeFinally(Utils.scala:1377)
at org.apache.spark.executor.Executor$TaskRunner.run(Executor.scala:447)
at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149)
at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624)
at java.lang.Thread.run(Thread.java:748)
20/07/14 21:34:47 ERROR Executor: Exception in task 8.0 in stage 8.0 (TID 93)
java.lang.NullPointerException
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.readObject(GpuBroadcastExchangeExec.scala:90)
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.batch(GpuBroadcastExchangeExec.scala:63)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$2(GpuBroadcastNestedLoopJoinExec.scala:204)
at com.nvidia.spark.rapids.Arm.withResource(Arm.scala:26)
at com.nvidia.spark.rapids.Arm.withResource$(Arm.scala:24)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.withResource(GpuBroadcastNestedLoopJoinExec.scala:130)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$lzycompute$1(GpuBroadcastNestedLoopJoinExec.scala:203)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$2(GpuBroadcastNestedLoopJoinExec.scala:202)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$4(GpuBroadcastNestedLoopJoinExec.scala:218)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2(RDD.scala:837)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2$adapted(RDD.scala:837)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.shuffle.ShuffleWriteProcessor.write(ShuffleWriteProcessor.scala:59)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:99)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:52)
at org.apache.spark.scheduler.Task.run(Task.scala:127)
at org.apache.spark.executor.Executor$TaskRunner.$anonfun$run$3(Executor.scala:444)
at org.apache.spark.util.Utils$.tryWithSafeFinally(Utils.scala:1377)
at org.apache.spark.executor.Executor$TaskRunner.run(Executor.scala:447)
at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149)
at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624)
at java.lang.Thread.run(Thread.java:748)
20/07/14 21:34:47 ERROR Executor: Exception in task 7.0 in stage 8.0 (TID 92)
java.lang.NullPointerException
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.readObject(GpuBroadcastExchangeExec.scala:90)
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.batch(GpuBroadcastExchangeExec.scala:63)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$2(GpuBroadcastNestedLoopJoinExec.scala:204)
at com.nvidia.spark.rapids.Arm.withResource(Arm.scala:26)
at com.nvidia.spark.rapids.Arm.withResource$(Arm.scala:24)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.withResource(GpuBroadcastNestedLoopJoinExec.scala:130)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$lzycompute$1(GpuBroadcastNestedLoopJoinExec.scala:203)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$2(GpuBroadcastNestedLoopJoinExec.scala:202)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$4(GpuBroadcastNestedLoopJoinExec.scala:218)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2(RDD.scala:837)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2$adapted(RDD.scala:837)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.shuffle.ShuffleWriteProcessor.write(ShuffleWriteProcessor.scala:59)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:99)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:52)
at org.apache.spark.scheduler.Task.run(Task.scala:127)
at org.apache.spark.executor.Executor$TaskRunner.$anonfun$run$3(Executor.scala:444)
at org.apache.spark.util.Utils$.tryWithSafeFinally(Utils.scala:1377)
at org.apache.spark.executor.Executor$TaskRunner.run(Executor.scala:447)
at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149)
at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624)
at java.lang.Thread.run(Thread.java:748)
20/07/14 21:34:47 ERROR Executor: Exception in task 0.0 in stage 8.0 (TID 85)
java.lang.NullPointerException
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.readObject(GpuBroadcastExchangeExec.scala:90)
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.batch(GpuBroadcastExchangeExec.scala:63)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$2(GpuBroadcastNestedLoopJoinExec.scala:204)
at com.nvidia.spark.rapids.Arm.withResource(Arm.scala:26)
at com.nvidia.spark.rapids.Arm.withResource$(Arm.scala:24)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.withResource(GpuBroadcastNestedLoopJoinExec.scala:130)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$lzycompute$1(GpuBroadcastNestedLoopJoinExec.scala:203)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$2(GpuBroadcastNestedLoopJoinExec.scala:202)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$4(GpuBroadcastNestedLoopJoinExec.scala:218)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2(RDD.scala:837)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2$adapted(RDD.scala:837)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.shuffle.ShuffleWriteProcessor.write(ShuffleWriteProcessor.scala:59)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:99)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:52)
at org.apache.spark.scheduler.Task.run(Task.scala:127)
at org.apache.spark.executor.Executor$TaskRunner.$anonfun$run$3(Executor.scala:444)
at org.apache.spark.util.Utils$.tryWithSafeFinally(Utils.scala:1377)
at org.apache.spark.executor.Executor$TaskRunner.run(Executor.scala:447)
at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149)
at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624)
at java.lang.Thread.run(Thread.java:748)
20/07/14 21:34:47 WARN TaskSetManager: Lost task 11.0 in stage 8.0 (TID 96, 192.168.0.121, executor driver): java.lang.NullPointerException
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.readObject(GpuBroadcastExchangeExec.scala:90)
at org.apache.spark.sql.rapids.execution.SerializeConcatHostBuffersDeserializeBatch.batch(GpuBroadcastExchangeExec.scala:63)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$2(GpuBroadcastNestedLoopJoinExec.scala:204)
at com.nvidia.spark.rapids.Arm.withResource(Arm.scala:26)
at com.nvidia.spark.rapids.Arm.withResource$(Arm.scala:24)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.withResource(GpuBroadcastNestedLoopJoinExec.scala:130)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$lzycompute$1(GpuBroadcastNestedLoopJoinExec.scala:203)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.builtTable$2(GpuBroadcastNestedLoopJoinExec.scala:202)
at org.apache.spark.sql.rapids.execution.GpuBroadcastNestedLoopJoinExec.$anonfun$doExecuteColumnar$4(GpuBroadcastNestedLoopJoinExec.scala:218)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2(RDD.scala:837)
at org.apache.spark.rdd.RDD.$anonfun$mapPartitions$2$adapted(RDD.scala:837)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:52)
at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:349)
at org.apache.spark.rdd.RDD.iterator(RDD.scala:313)
at org.apache.spark.shuffle.ShuffleWriteProcessor.write(ShuffleWriteProcessor.scala:59)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:99)
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:52)
at org.apache.spark.scheduler.Task.run(Task.scala:127)
at org.apache.spark.executor.Executor$TaskRunner.$anonfun$run$3(Executor.scala:444)
at org.apache.spark.util.Utils$.tryWithSafeFinally(Utils.scala:1377)
at org.apache.spark.executor.Executor$TaskRunner.run(Executor.scala:447)
at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149)
at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624)
at java.lang.Thread.run(Thread.java:748)
20/07/14 21:34:47 ERROR TaskSetManager: Task 11 in stage 8.0 failed 1 times; aborting job
Steps/Code to reproduce bug
Run the test src/main/python/cache_test.py::test_cache_broadcast_nested_loop_join (for example, the [Left-String] parameterization shown in the log above).
Expected behavior
The test cache_test.py#test_cache_broadcast_nested_loop_join should pass without throwing a NullPointerException.
The text was updated successfully, but these errors were encountered:
Describe the bug
When running a crossJoin that is executed with BroadcastNestedLoopJoin, the query fails with a NullPointerException (NPE).
The stack trace is shown earlier on this page.
Steps/Code to reproduce bug
Run the cache_test.py#test_cache_broadcast_nested_loop_join
Expected behavior
The cache_test.py#test_cache_broadcast_nested_loop_join should pass
The text was updated successfully, but these errors were encountered: