Remove single-buffer compression codec APIs (#5092)
* Remove single-buffer compression codec APIs

Signed-off-by: Jason Lowe <jlowe@nvidia.com>

* Fix copyrights
jlowe authored Mar 30, 2022
1 parent 4e77f85 commit 4c63d56
Showing 3 changed files with 6 additions and 107 deletions.
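
For context, this is the shape of the single-buffer path being removed: one call compressed a single contiguous table into one buffer, and one call decompressed a single buffer range. A minimal round-trip sketch using only the signatures visible in the deleted code below; the wrapper object, the import paths, and the use of the COPY codec (so output size equals input size) are illustrative assumptions, not project code:

import ai.rapids.cudf.{ContiguousTable, Cuda, DeviceMemoryBuffer}
import com.nvidia.spark.rapids.{CompressedTable, TableCompressionCodec} // package assumed for the sketch

object SingleBufferRoundTrip {
  /** Compress one table and decompress it back; illustrative wrapper, not project code. */
  def roundTrip(
      codec: TableCompressionCodec, // assume the COPY codec, so compressed size == uncompressed size
      contigTable: ContiguousTable,
      stream: Cuda.Stream): DeviceMemoryBuffer = {
    // Single-buffer compression: one call, one CompressedTable back.
    val CompressedTable(compressedSize, _, compressedBuffer) =
      codec.compress(0, contigTable, stream)
    try {
      val uncompressedLen = contigTable.getBuffer.getLength
      val output = DeviceMemoryBuffer.allocate(uncompressedLen)
      // Single-buffer decompression of the whole payload in one call.
      codec.decompressBufferAsync(
        output, 0, uncompressedLen,
        compressedBuffer, 0, compressedSize,
        stream)
      stream.sync()
      output
    } finally {
      compressedBuffer.close()
    }
  }
}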
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2021, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2022, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -25,40 +25,6 @@ class CopyCompressionCodec extends TableCompressionCodec with Arm {
   override val name: String = "COPY"
   override val codecId: Byte = CodecType.COPY
 
-  override def compress(
-      tableId: Int,
-      contigTable: ContiguousTable,
-      stream: Cuda.Stream): CompressedTable = {
-    val buffer = contigTable.getBuffer
-    closeOnExcept(DeviceMemoryBuffer.allocate(buffer.getLength)) { outputBuffer =>
-      outputBuffer.copyFromDeviceBufferAsync(0, buffer, 0, buffer.getLength, stream)
-      val meta = MetaUtils.buildTableMeta(
-        Some(tableId),
-        contigTable,
-        codecId,
-        outputBuffer.getLength)
-      stream.sync()
-      CompressedTable(buffer.getLength, meta, outputBuffer)
-    }
-  }
-
-  override def decompressBufferAsync(
-      outputBuffer: DeviceMemoryBuffer,
-      outputOffset: Long,
-      outputLength: Long,
-      inputBuffer: DeviceMemoryBuffer,
-      inputOffset: Long,
-      inputLength: Long,
-      stream: Cuda.Stream): Unit = {
-    require(outputLength == inputLength)
-    outputBuffer.copyFromDeviceBufferAsync(
-      outputOffset,
-      inputBuffer,
-      inputOffset,
-      inputLength,
-      stream)
-  }
-
   override def createBatchCompressor(
       maxBatchMemorySize: Long,
       stream: Cuda.Stream): BatchedTableCompressor =
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2021, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2022, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -27,39 +27,6 @@ class NvcompLZ4CompressionCodec(codecConfigs: TableCompressionCodecConfig)
   override val name: String = "nvcomp-LZ4"
   override val codecId: Byte = CodecType.NVCOMP_LZ4
 
-  override def compress(
-      tableId: Int,
-      contigTable: ContiguousTable,
-      stream: Cuda.Stream): CompressedTable = {
-    val tableBuffer = contigTable.getBuffer
-    val (compressedSize, oversizedBuffer) =
-      NvcompLZ4CompressionCodec.compress(tableBuffer, codecConfigs, stream)
-    closeOnExcept(oversizedBuffer) { oversizedBuffer =>
-      require(compressedSize <= oversizedBuffer.getLength, "compressed buffer overrun")
-      val tableMeta = MetaUtils.buildTableMeta(
-        Some(tableId),
-        contigTable,
-        CodecType.NVCOMP_LZ4,
-        compressedSize)
-      CompressedTable(compressedSize, tableMeta, oversizedBuffer)
-    }
-  }
-
-  override def decompressBufferAsync(
-      outputBuffer: DeviceMemoryBuffer,
-      outputOffset: Long,
-      outputLength: Long,
-      inputBuffer: DeviceMemoryBuffer,
-      inputOffset: Long,
-      inputLength: Long,
-      stream: Cuda.Stream): Unit = {
-    withResource(outputBuffer.slice(outputOffset, outputLength)) { outSlice =>
-      withResource(inputBuffer.slice(inputOffset, inputLength)) { inSlice =>
-        NvcompLZ4CompressionCodec.decompressAsync(outSlice, inSlice, stream)
-      }
-    }
-  }
-
   override def createBatchCompressor(
       maxBatchMemoryBytes: Long,
       stream: Cuda.Stream): BatchedTableCompressor = {
@@ -85,7 +52,7 @@ object NvcompLZ4CompressionCodec extends Arm {
       input: DeviceMemoryBuffer,
       codecConfigs: TableCompressionCodecConfig,
       stream: Cuda.Stream): (Long, DeviceMemoryBuffer) = {
-    val lz4Config = LZ4Compressor.configure(codecConfigs.lz4ChunkSize, input.getLength())
+    val lz4Config = LZ4Compressor.configure(codecConfigs.lz4ChunkSize, input.getLength)
     withResource(DeviceMemoryBuffer.allocate(lz4Config.getTempBytes)) { tempBuffer =>
       var compressedSize: Long = 0L
       val outputSize = lz4Config.getMaxCompressedBytes
@@ -109,12 +76,12 @@ object NvcompLZ4CompressionCodec extends Arm {
       inputBuffer: DeviceMemoryBuffer,
       stream: Cuda.Stream): Unit = {
     withResource(LZ4Decompressor.configure(inputBuffer, stream)) { decompressConf =>
-      val outputSize = decompressConf.getUncompressedBytes()
+      val outputSize = decompressConf.getUncompressedBytes
       if (outputSize != outputBuffer.getLength) {
         throw new IllegalStateException(
           s"metadata uncompressed size is $outputSize, buffer size is ${outputBuffer.getLength}")
       }
-      val tempSize = decompressConf.getTempBytes()
+      val tempSize = decompressConf.getTempBytes
       withResource(DeviceMemoryBuffer.allocate(tempSize)) { tempBuffer =>
         LZ4Decompressor.decompressAsync(inputBuffer, decompressConf, tempBuffer, outputBuffer,
           stream)
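
The low-level LZ4 helpers on the NvcompLZ4CompressionCodec companion object are kept by this change (only the redundant parentheses were dropped above). A rough round-trip sketch of driving them directly; the wrapper object and imports are illustrative assumptions, and error-path buffer cleanup is elided for brevity:

import ai.rapids.cudf.{Cuda, DeviceMemoryBuffer}
import com.nvidia.spark.rapids.{NvcompLZ4CompressionCodec, TableCompressionCodecConfig} // package assumed for the sketch

object Lz4HelperRoundTrip {
  /** Compress a device buffer and decompress it back; illustrative wrapper, not project code. */
  def roundTrip(
      input: DeviceMemoryBuffer,
      codecConfigs: TableCompressionCodecConfig,
      stream: Cuda.Stream): DeviceMemoryBuffer = {
    val (compressedSize, oversizedBuffer) =
      NvcompLZ4CompressionCodec.compress(input, codecConfigs, stream)
    try {
      // decompressAsync checks that the output buffer length matches the uncompressed
      // size recorded in the LZ4 metadata; for a round trip that is the input length.
      val output = DeviceMemoryBuffer.allocate(input.getLength)
      // The compressed buffer may be oversized, so pass an exact-length slice.
      val compressedSlice = oversizedBuffer.slice(0, compressedSize)
      try {
        NvcompLZ4CompressionCodec.decompressAsync(output, compressedSlice, stream)
        stream.sync()
        output
      } finally {
        compressedSlice.close()
      }
    } finally {
      oversizedBuffer.close()
    }
  }
}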
@@ -1,5 +1,5 @@
/*
* Copyright (c) 2020, NVIDIA CORPORATION.
* Copyright (c) 2020-2022, NVIDIA CORPORATION.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
@@ -45,40 +45,6 @@ trait TableCompressionCodec {
   /** The ID used for this codec. See the definitions in `CodecType`. */
   val codecId: Byte
 
-  /**
-   * Compress a contiguous table.
-   * @note The contiguous table is NOT closed by this operation and must be closed separately.
-   * @note The compressed buffer MAY NOT be ideally sized to the compressed data. It may be
-   *       significantly larger than the size of the compressed data. Releasing this unused
-   *       memory will require making a copy of the data to a buffer of the appropriate size.
-   * @param tableId ID to use for this table
-   * @param contigTable contiguous table to compress
-   * @param stream CUDA stream to use
-   * @return compressed table
-   */
-  def compress(tableId: Int, contigTable: ContiguousTable, stream: Cuda.Stream): CompressedTable
-
-  /**
-   * Decompress the compressed data buffer from a table compression operation asynchronously
-   * using the specified stream.
-   * @note The compressed buffer is NOT closed by this method.
-   * @param outputBuffer buffer where uncompressed data will be written
-   * @param outputOffset offset in the uncompressed buffer to start writing data
-   * @param outputLength expected length of the uncompressed data in bytes
-   * @param inputBuffer buffer containing the compressed data
-   * @param inputOffset offset in the compressed buffer where compressed data starts
-   * @param inputLength length of the compressed data in bytes
-   * @param stream CUDA stream to use
-   */
-  def decompressBufferAsync(
-      outputBuffer: DeviceMemoryBuffer,
-      outputOffset: Long,
-      outputLength: Long,
-      inputBuffer: DeviceMemoryBuffer,
-      inputOffset: Long,
-      inputLength: Long,
-      stream: Cuda.Stream): Unit
-
   /**
    * Create a batched compressor instance
    * @param maxBatchMemorySize The upper limit in bytes of temporary and output memory usage at
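
What remains after this change is the batched path. Only createBatchCompressor's signature and doc comment appear in this diff; the addContiguousTable and finish calls in the sketch below are assumed method names on BatchedTableCompressor, shown purely to illustrate the intended flow, and may not match the real API:

import ai.rapids.cudf.{ContiguousTable, Cuda}
import com.nvidia.spark.rapids.{CompressedTable, TableCompressionCodec} // package assumed for the sketch

object BatchedCompressSketch {
  /** Compress many tables through the retained batched API; method names are assumptions. */
  def compressAll(
      codec: TableCompressionCodec,
      tables: Seq[ContiguousTable],
      maxBatchMemorySize: Long,
      stream: Cuda.Stream): Array[CompressedTable] = {
    val compressor = codec.createBatchCompressor(maxBatchMemorySize, stream)
    // Hypothetical usage: queue each table, then finish the batch to get one
    // CompressedTable per input, compressed together on the given stream.
    tables.foreach(t => compressor.addContiguousTable(t))
    compressor.finish()
  }
}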