1818#include " velox/common/compression/Compression.h"
1919#include " velox/connectors/Connector.h"
2020#include " velox/connectors/hive/HiveConfig.h"
21- #include " velox/connectors/hive/HivePartitionName.h"
2221#include " velox/connectors/hive/PartitionIdGenerator.h"
2322#include " velox/connectors/hive/TableHandle.h"
2423#include " velox/dwio/common/Options.h"
@@ -517,17 +516,6 @@ class HiveDataSink : public DataSink {
517516 };
518517 static std::string stateString (State state);
519518
520- // / Creates a HiveDataSink for writing data to Hive table files.
521- // /
522- // / @param inputType The schema of input data rows to be written.
523- // / @param insertTableHandle Metadata about the table write operation,
524- // / including storage format, compression, bucketing, and partitioning
525- // / configuration.
526- // / @param connectorQueryCtx Query context with session properties, memory
527- // / pools, and spill configuration.
528- // / @param commitStrategy Strategy for committing written data (kNoCommit or
529- // / kTaskCommit).
530- // / @param hiveConfig Hive connector configuration.
531519 HiveDataSink (
532520 RowTypePtr inputType,
533521 std::shared_ptr<const HiveInsertTableHandle> insertTableHandle,
@@ -544,40 +532,6 @@ class HiveDataSink : public DataSink {
544532 uint32_t bucketCount,
545533 std::unique_ptr<core::PartitionFunction> bucketFunction);
546534
547- // / Constructor with explicit bucketing and partitioning parameters.
548- // /
549- // / @param inputType The schema of input data rows to be written.
550- // / @param insertTableHandle Metadata about the table write operation,
551- // / including storage format, compression, location, and serialization
552- // / parameters.
553- // / @param connectorQueryCtx Query context with session properties, memory
554- // / pools, and spill configuration.
555- // / @param commitStrategy Strategy for committing written data (kNoCommit or
556- // / kTaskCommit). Determines whether temporary files need to be renamed on
557- // / commit.
558- // / @param hiveConfig Hive connector configuration with settings for max
559- // / partitions, bucketing limits etc.
560- // / @param bucketCount Number of buckets for bucketed tables (0 if not
561- // / bucketed). Must be less than the configured max bucket count.
562- // / @param bucketFunction Function to compute bucket IDs from row data
563- // / (nullptr if not bucketed). Used to distribute rows across buckets.
564- // / @param partitionChannels Column indices used for partitioning (empty if
565- // / not partitioned). These columns are extracted to determine partition
566- // / directories.
567- // / @param partitionIdGenerator Generates partition IDs from partition column
568- // / values (nullptr if not partitioned). Maps each combination of partition
569- // / key values to a unique ID.
570- HiveDataSink (
571- RowTypePtr inputType,
572- std::shared_ptr<const HiveInsertTableHandle> insertTableHandle,
573- const ConnectorQueryCtx* connectorQueryCtx,
574- CommitStrategy commitStrategy,
575- const std::shared_ptr<const HiveConfig>& hiveConfig,
576- uint32_t bucketCount,
577- std::unique_ptr<core::PartitionFunction> bucketFunction,
578- const std::vector<column_index_t >& partitionChannels,
579- std::unique_ptr<PartitionIdGenerator> partitionIdGenerator);
580-
581535 void appendData (RowVectorPtr input) override ;
582536
583537 bool finish () override ;
@@ -667,7 +621,7 @@ class HiveDataSink : public DataSink {
667621 io::IoStatistics* ioStats);
668622
669623 // Compute the partition id and bucket id for each row in 'input'.
670- virtual void computePartitionAndBucketIds (const RowVectorPtr& input);
624+ void computePartitionAndBucketIds (const RowVectorPtr& input);
671625
672626 // Get the HiveWriter corresponding to the row
673627 // from partitionIds and bucketIds.
@@ -687,12 +641,6 @@ class HiveDataSink : public DataSink {
687641 // the newly created writer in 'writers_'.
688642 uint32_t appendWriter (const HiveWriterId& id);
689643
690- // Returns the Hive partition directory name for the given partition ID.
691- // Converts the partition values associated with the partition ID into a
692- // Hive-formatted directory path. Must be called only when writing to a
693- // partitioned table; the std::string return type has no "unpartitioned" value.
694- virtual std::string getPartitionName (uint32_t partitionId) const ;
695-
696644 std::unique_ptr<facebook::velox::dwio::common::Writer>
697645 maybeCreateBucketSortWriter (
698646 std::unique_ptr<facebook::velox::dwio::common::Writer> writer);
@@ -747,7 +695,6 @@ class HiveDataSink : public DataSink {
747695 const std::shared_ptr<dwio::common::WriterFactory> writerFactory_;
748696 const common::SpillConfig* const spillConfig_;
749697 const uint64_t sortWriterFinishTimeSliceLimitMs_{0 };
750- const bool partitionKeyAsLowerCase_;
751698
752699 std::vector<column_index_t > sortColumnIndices_;
753700 std::vector<CompareFlags> sortCompareFlags_;
0 commit comments