diff --git ql/src/gen/protobuf/gen-java/org/apache/hadoop/hive/ql/io/orc/OrcProto.java ql/src/gen/protobuf/gen-java/org/apache/hadoop/hive/ql/io/orc/OrcProto.java
index 7a96373..d33d66e 100644
--- ql/src/gen/protobuf/gen-java/org/apache/hadoop/hive/ql/io/orc/OrcProto.java
+++ ql/src/gen/protobuf/gen-java/org/apache/hadoop/hive/ql/io/orc/OrcProto.java
@@ -1256,6 +1256,24 @@ public Builder clearSum() {
*/
com.google.protobuf.ByteString
getMaximumBytes();
+
+ // optional sint64 sum = 3;
+ /**
+ * optional sint64 sum = 3;
+ *
+ *
+     * sum will store the total length of all strings in a stripe
+     *
+     */
+    boolean hasSum();
+    /**
+     * optional sint64 sum = 3;
+     *
+     *
+     * sum will store the total length of all strings in a stripe
+     *
+     */
+    long getSum();
  }
  /**
   * Protobuf type {@code org.apache.hadoop.hive.ql.io.orc.StringStatistics}
@@ -1318,6 +1336,11 @@ private StringStatistics(
              maximum_ = input.readBytes();
              break;
            }
+            case 24: {
+              bitField0_ |= 0x00000004;
+              sum_ = input.readSInt64();
+              break;
+            }
          }
        }
      } catch (com.google.protobuf.InvalidProtocolBufferException e) {
@@ -1444,9 +1467,34 @@ public boolean hasMaximum() {
      }
    }

+    // optional sint64 sum = 3;
+    public static final int SUM_FIELD_NUMBER = 3;
+    private long sum_;
+    /**
+     * optional sint64 sum = 3;
+     *
+     *
+     * sum will store the total length of all strings in a stripe
+     *
+     */
+    public boolean hasSum() {
+      return ((bitField0_ & 0x00000004) == 0x00000004);
+    }
+    /**
+     * optional sint64 sum = 3;
+     *
+     *
+     * sum will store the total length of all strings in a stripe
+     *
+     */
+    public long getSum() {
+      return sum_;
+    }
+
    private void initFields() {
      minimum_ = "";
      maximum_ = "";
+      sum_ = 0L;
    }
    private byte memoizedIsInitialized = -1;
    public final boolean isInitialized() {
@@ -1466,6 +1514,9 @@ public void writeTo(com.google.protobuf.CodedOutputStream output)
      if (((bitField0_ & 0x00000002) == 0x00000002)) {
        output.writeBytes(2, getMaximumBytes());
      }
+      if (((bitField0_ & 0x00000004) == 0x00000004)) {
+        output.writeSInt64(3, sum_);
+      }
      getUnknownFields().writeTo(output);
    }

@@ -1483,6 +1534,10 @@ public int getSerializedSize() {
        size += com.google.protobuf.CodedOutputStream
          .computeBytesSize(2, getMaximumBytes());
      }
+      if (((bitField0_ & 0x00000004) == 0x00000004)) {
+        size += com.google.protobuf.CodedOutputStream
+          .computeSInt64Size(3, sum_);
+      }
      size += getUnknownFields().getSerializedSize();
      memoizedSerializedSize = size;
      return size;
@@ -1603,6 +1658,8 @@ public Builder clear() {
        bitField0_ = (bitField0_ & ~0x00000001);
        maximum_ = "";
        bitField0_ = (bitField0_ & ~0x00000002);
+        sum_ = 0L;
+        bitField0_ = (bitField0_ & ~0x00000004);
        return this;
      }

@@ -1639,6 +1696,10 @@ public Builder clone() {
          to_bitField0_ |= 0x00000002;
        }
        result.maximum_ = maximum_;
+        if (((from_bitField0_ & 0x00000004) == 0x00000004)) {
+          to_bitField0_ |= 0x00000004;
+        }
+        result.sum_ = sum_;
        result.bitField0_ = to_bitField0_;
        onBuilt();
        return result;
@@ -1665,6 +1726,9 @@ public Builder mergeFrom(org.apache.hadoop.hive.ql.io.orc.OrcProto.StringStatist
          maximum_ = other.maximum_;
          onChanged();
        }
+        if (other.hasSum()) {
+          setSum(other.getSum());
+        }
        this.mergeUnknownFields(other.getUnknownFields());
        return this;
      }
@@ -1840,6 +1904,55 @@ public Builder setMaximumBytes(
        return this;
      }

+      // optional sint64 sum = 3;
+      private long sum_ ;
+      /**
+       * optional sint64 sum = 3;
+       *
+       *
+       * sum will store the total length of all strings in a stripe
+       *
+       */
+      public boolean hasSum() {
+        return ((bitField0_ & 0x00000004) == 0x00000004);
+      }
+      /**
+       * optional sint64 sum = 3;
+       *
+       *
+       * sum will store the total length of all strings in a stripe
+       *
+       */
+      public long getSum() {
+        return sum_;
+      }
+      /**
+       * optional sint64 sum = 3;
+       *
+       *
+       * sum will store the total length of all strings in a stripe
+       *
+       */
+      public Builder setSum(long value) {
+        bitField0_ |= 0x00000004;
+        sum_ = value;
+        onChanged();
+        return this;
+      }
+      /**
+       * optional sint64 sum = 3;
+       *
+       *
+       * sum will store the total length of all strings in a stripe
+       *
+       */
+      public Builder clearSum() {
+        bitField0_ = (bitField0_ & ~0x00000004);
+        sum_ = 0L;
+        onChanged();
+        return this;
+      }
+
      // @@protoc_insertion_point(builder_scope:org.apache.hadoop.hive.ql.io.orc.StringStatistics)
    }

@@ -3279,15 +3392,492 @@ public boolean hasMaximum() {
      return ((bitField0_ & 0x00000002) == 0x00000002);
    }
    /**
-     * optional sint32 maximum = 2;
+ * optional sint32 maximum = 2;
+ */
+ public int getMaximum() {
+ return maximum_;
+ }
+
+ private void initFields() {
+ minimum_ = 0;
+ maximum_ = 0;
+ }
+ private byte memoizedIsInitialized = -1;
+ public final boolean isInitialized() {
+ byte isInitialized = memoizedIsInitialized;
+ if (isInitialized != -1) return isInitialized == 1;
+
+ memoizedIsInitialized = 1;
+ return true;
+ }
+
+ public void writeTo(com.google.protobuf.CodedOutputStream output)
+ throws java.io.IOException {
+ getSerializedSize();
+ if (((bitField0_ & 0x00000001) == 0x00000001)) {
+ output.writeSInt32(1, minimum_);
+ }
+ if (((bitField0_ & 0x00000002) == 0x00000002)) {
+ output.writeSInt32(2, maximum_);
+ }
+ getUnknownFields().writeTo(output);
+ }
+
+ private int memoizedSerializedSize = -1;
+ public int getSerializedSize() {
+ int size = memoizedSerializedSize;
+ if (size != -1) return size;
+
+ size = 0;
+ if (((bitField0_ & 0x00000001) == 0x00000001)) {
+ size += com.google.protobuf.CodedOutputStream
+ .computeSInt32Size(1, minimum_);
+ }
+ if (((bitField0_ & 0x00000002) == 0x00000002)) {
+ size += com.google.protobuf.CodedOutputStream
+ .computeSInt32Size(2, maximum_);
+ }
+ size += getUnknownFields().getSerializedSize();
+ memoizedSerializedSize = size;
+ return size;
+ }
+
+ private static final long serialVersionUID = 0L;
+ @java.lang.Override
+ protected java.lang.Object writeReplace()
+ throws java.io.ObjectStreamException {
+ return super.writeReplace();
+ }
+
+ public static org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics parseFrom(
+ com.google.protobuf.ByteString data)
+ throws com.google.protobuf.InvalidProtocolBufferException {
+ return PARSER.parseFrom(data);
+ }
+ public static org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics parseFrom(
+ com.google.protobuf.ByteString data,
+ com.google.protobuf.ExtensionRegistryLite extensionRegistry)
+ throws com.google.protobuf.InvalidProtocolBufferException {
+ return PARSER.parseFrom(data, extensionRegistry);
+ }
+ public static org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics parseFrom(byte[] data)
+ throws com.google.protobuf.InvalidProtocolBufferException {
+ return PARSER.parseFrom(data);
+ }
+ public static org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics parseFrom(
+ byte[] data,
+ com.google.protobuf.ExtensionRegistryLite extensionRegistry)
+ throws com.google.protobuf.InvalidProtocolBufferException {
+ return PARSER.parseFrom(data, extensionRegistry);
+ }
+ public static org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics parseFrom(java.io.InputStream input)
+ throws java.io.IOException {
+ return PARSER.parseFrom(input);
+ }
+ public static org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics parseFrom(
+ java.io.InputStream input,
+ com.google.protobuf.ExtensionRegistryLite extensionRegistry)
+ throws java.io.IOException {
+ return PARSER.parseFrom(input, extensionRegistry);
+ }
+ public static org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics parseDelimitedFrom(java.io.InputStream input)
+ throws java.io.IOException {
+ return PARSER.parseDelimitedFrom(input);
+ }
+ public static org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics parseDelimitedFrom(
+ java.io.InputStream input,
+ com.google.protobuf.ExtensionRegistryLite extensionRegistry)
+ throws java.io.IOException {
+ return PARSER.parseDelimitedFrom(input, extensionRegistry);
+ }
+ public static org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics parseFrom(
+ com.google.protobuf.CodedInputStream input)
+ throws java.io.IOException {
+ return PARSER.parseFrom(input);
+ }
+ public static org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics parseFrom(
+ com.google.protobuf.CodedInputStream input,
+ com.google.protobuf.ExtensionRegistryLite extensionRegistry)
+ throws java.io.IOException {
+ return PARSER.parseFrom(input, extensionRegistry);
+ }
+
+ public static Builder newBuilder() { return Builder.create(); }
+ public Builder newBuilderForType() { return newBuilder(); }
+ public static Builder newBuilder(org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics prototype) {
+ return newBuilder().mergeFrom(prototype);
+ }
+ public Builder toBuilder() { return newBuilder(this); }
+
+ @java.lang.Override
+ protected Builder newBuilderForType(
+ com.google.protobuf.GeneratedMessage.BuilderParent parent) {
+ Builder builder = new Builder(parent);
+ return builder;
+ }
+ /**
+ * Protobuf type {@code org.apache.hadoop.hive.ql.io.orc.DateStatistics}
+ */
+ public static final class Builder extends
+        com.google.protobuf.GeneratedMessage.Builder<Builder>
+       implements org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatisticsOrBuilder {
+      public static final com.google.protobuf.Descriptors.Descriptor
+          getDescriptor() {
+        return org.apache.hadoop.hive.ql.io.orc.OrcProto.internal_static_org_apache_hadoop_hive_ql_io_orc_DateStatistics_descriptor;
+      }
+
+      protected com.google.protobuf.GeneratedMessage.FieldAccessorTable
+          internalGetFieldAccessorTable() {
+        return org.apache.hadoop.hive.ql.io.orc.OrcProto.internal_static_org_apache_hadoop_hive_ql_io_orc_DateStatistics_fieldAccessorTable
+            .ensureFieldAccessorsInitialized(
+                org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics.class, org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics.Builder.class);
+      }
+
+      // Construct using org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics.newBuilder()
+      private Builder() {
+        maybeForceBuilderInitialization();
+      }
+
+      private Builder(
+          com.google.protobuf.GeneratedMessage.BuilderParent parent) {
+        super(parent);
+        maybeForceBuilderInitialization();
+      }
+      private void maybeForceBuilderInitialization() {
+        if (com.google.protobuf.GeneratedMessage.alwaysUseFieldBuilders) {
+        }
+      }
+      private static Builder create() {
+        return new Builder();
+      }
+
+      public Builder clear() {
+        super.clear();
+        minimum_ = 0;
+        bitField0_ = (bitField0_ & ~0x00000001);
+        maximum_ = 0;
+        bitField0_ = (bitField0_ & ~0x00000002);
+        return this;
+      }
+
+      public Builder clone() {
+        return create().mergeFrom(buildPartial());
+      }
+
+      public com.google.protobuf.Descriptors.Descriptor
+          getDescriptorForType() {
+        return org.apache.hadoop.hive.ql.io.orc.OrcProto.internal_static_org_apache_hadoop_hive_ql_io_orc_DateStatistics_descriptor;
+      }
+
+      public org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics getDefaultInstanceForType() {
+        return org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics.getDefaultInstance();
+      }
+
+      public org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics build() {
+        org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics result = buildPartial();
+        if (!result.isInitialized()) {
+          throw newUninitializedMessageException(result);
+        }
+        return result;
+      }
+
+      public org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics buildPartial() {
+        org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics result = new org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics(this);
+        int from_bitField0_ = bitField0_;
+        int to_bitField0_ = 0;
+        if (((from_bitField0_ & 0x00000001) == 0x00000001)) {
+          to_bitField0_ |= 0x00000001;
+        }
+        result.minimum_ = minimum_;
+        if (((from_bitField0_ & 0x00000002) == 0x00000002)) {
+          to_bitField0_ |= 0x00000002;
+        }
+        result.maximum_ = maximum_;
+        result.bitField0_ = to_bitField0_;
+        onBuilt();
+        return result;
+      }
+
+      public Builder mergeFrom(com.google.protobuf.Message other) {
+        if (other instanceof org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics) {
+          return mergeFrom((org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics)other);
+        } else {
+          super.mergeFrom(other);
+          return this;
+        }
+      }
+
+      public Builder mergeFrom(org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics other) {
+        if (other == org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics.getDefaultInstance()) return this;
+        if (other.hasMinimum()) {
+          setMinimum(other.getMinimum());
+        }
+        if (other.hasMaximum()) {
+          setMaximum(other.getMaximum());
+        }
+        this.mergeUnknownFields(other.getUnknownFields());
+        return this;
+      }
+
+      public final boolean isInitialized() {
+        return true;
+      }
+
+      public Builder mergeFrom(
+          com.google.protobuf.CodedInputStream input,
+          com.google.protobuf.ExtensionRegistryLite extensionRegistry)
+          throws java.io.IOException {
+        org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics parsedMessage = null;
+        try {
+          parsedMessage = PARSER.parsePartialFrom(input, extensionRegistry);
+        } catch (com.google.protobuf.InvalidProtocolBufferException e) {
+          parsedMessage = (org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics) e.getUnfinishedMessage();
+          throw e;
+        } finally {
+          if (parsedMessage != null) {
+            mergeFrom(parsedMessage);
+          }
+        }
+        return this;
+      }
+      private int bitField0_;
+
+      // optional sint32 minimum = 1;
+      private int minimum_ ;
+      /**
+       * optional sint32 minimum = 1;
+       *
+       *
+       * min,max values saved as days since epoch
+       *
+       */
+      public boolean hasMinimum() {
+        return ((bitField0_ & 0x00000001) == 0x00000001);
+      }
+      /**
+       * optional sint32 minimum = 1;
+       *
+       *
+       * min,max values saved as days since epoch
+       *
+       */
+      public int getMinimum() {
+        return minimum_;
+      }
+      /**
+       * optional sint32 minimum = 1;
+       *
+       *
+       * min,max values saved as days since epoch
+       *
+       */
+      public Builder setMinimum(int value) {
+        bitField0_ |= 0x00000001;
+        minimum_ = value;
+        onChanged();
+        return this;
+      }
+      /**
+       * optional sint32 minimum = 1;
+       *
+       *
+       * min,max values saved as days since epoch
+       *
+       */
+      public Builder clearMinimum() {
+        bitField0_ = (bitField0_ & ~0x00000001);
+        minimum_ = 0;
+        onChanged();
+        return this;
+      }
+
+      // optional sint32 maximum = 2;
+      private int maximum_ ;
+      /**
+       * optional sint32 maximum = 2;
+ */
+ public boolean hasMaximum() {
+ return ((bitField0_ & 0x00000002) == 0x00000002);
+ }
+ /**
+ * optional sint32 maximum = 2;
+ */
+ public int getMaximum() {
+ return maximum_;
+ }
+ /**
+ * optional sint32 maximum = 2;
+ */
+ public Builder setMaximum(int value) {
+ bitField0_ |= 0x00000002;
+ maximum_ = value;
+ onChanged();
+ return this;
+ }
+ /**
+ * optional sint32 maximum = 2;
+ */
+ public Builder clearMaximum() {
+ bitField0_ = (bitField0_ & ~0x00000002);
+ maximum_ = 0;
+ onChanged();
+ return this;
+ }
+
+ // @@protoc_insertion_point(builder_scope:org.apache.hadoop.hive.ql.io.orc.DateStatistics)
+ }
+
+ static {
+ defaultInstance = new DateStatistics(true);
+ defaultInstance.initFields();
+ }
+
+ // @@protoc_insertion_point(class_scope:org.apache.hadoop.hive.ql.io.orc.DateStatistics)
+ }
+
+ public interface BinaryStatisticsOrBuilder
+ extends com.google.protobuf.MessageOrBuilder {
+
+ // optional sint64 sum = 1;
+ /**
+ * optional sint64 sum = 1;
+ *
+     *
+     * sum will store the total binary blob length in a stripe
+     *
+     */
+    boolean hasSum();
+    /**
+     * optional sint64 sum = 1;
+     *
+     *
+     * sum will store the total binary blob length in a stripe
+     *
+     */
+    long getSum();
+  }
+  /**
+   * Protobuf type {@code org.apache.hadoop.hive.ql.io.orc.BinaryStatistics}
+   */
+  public static final class BinaryStatistics extends
+      com.google.protobuf.GeneratedMessage
+      implements BinaryStatisticsOrBuilder {
+    // Use BinaryStatistics.newBuilder() to construct.
+    private BinaryStatistics(com.google.protobuf.GeneratedMessage.Builder<?> builder) {
+      super(builder);
+      this.unknownFields = builder.getUnknownFields();
+    }
+    private BinaryStatistics(boolean noInit) { this.unknownFields = com.google.protobuf.UnknownFieldSet.getDefaultInstance(); }
+
+    private static final BinaryStatistics defaultInstance;
+    public static BinaryStatistics getDefaultInstance() {
+      return defaultInstance;
+    }
+
+    public BinaryStatistics getDefaultInstanceForType() {
+      return defaultInstance;
+    }
+
+    private final com.google.protobuf.UnknownFieldSet unknownFields;
+    @java.lang.Override
+    public final com.google.protobuf.UnknownFieldSet
+        getUnknownFields() {
+      return this.unknownFields;
+    }
+    private BinaryStatistics(
+        com.google.protobuf.CodedInputStream input,
+        com.google.protobuf.ExtensionRegistryLite extensionRegistry)
+        throws com.google.protobuf.InvalidProtocolBufferException {
+      initFields();
+      int mutable_bitField0_ = 0;
+      com.google.protobuf.UnknownFieldSet.Builder unknownFields =
+          com.google.protobuf.UnknownFieldSet.newBuilder();
+      try {
+        boolean done = false;
+        while (!done) {
+          int tag = input.readTag();
+          switch (tag) {
+            case 0:
+              done = true;
+              break;
+            default: {
+              if (!parseUnknownField(input, unknownFields,
+                                     extensionRegistry, tag)) {
+                done = true;
+              }
+              break;
+            }
+            case 8: {
+              bitField0_ |= 0x00000001;
+              sum_ = input.readSInt64();
+              break;
+            }
+          }
+        }
+      } catch (com.google.protobuf.InvalidProtocolBufferException e) {
+        throw e.setUnfinishedMessage(this);
+      } catch (java.io.IOException e) {
+        throw new com.google.protobuf.InvalidProtocolBufferException(
+            e.getMessage()).setUnfinishedMessage(this);
+      } finally {
+        this.unknownFields = unknownFields.build();
+        makeExtensionsImmutable();
+      }
+    }
+    public static final com.google.protobuf.Descriptors.Descriptor
+        getDescriptor() {
+      return org.apache.hadoop.hive.ql.io.orc.OrcProto.internal_static_org_apache_hadoop_hive_ql_io_orc_BinaryStatistics_descriptor;
+    }
+
+    protected com.google.protobuf.GeneratedMessage.FieldAccessorTable
+        internalGetFieldAccessorTable() {
+      return org.apache.hadoop.hive.ql.io.orc.OrcProto.internal_static_org_apache_hadoop_hive_ql_io_orc_BinaryStatistics_fieldAccessorTable
+          .ensureFieldAccessorsInitialized(
+              org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics.class, org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics.Builder.class);
+    }
+
+    public static com.google.protobuf.Parser<BinaryStatistics> PARSER =
+        new com.google.protobuf.AbstractParser<BinaryStatistics>() {
+      public BinaryStatistics parsePartialFrom(
+          com.google.protobuf.CodedInputStream input,
+          com.google.protobuf.ExtensionRegistryLite extensionRegistry)
+          throws com.google.protobuf.InvalidProtocolBufferException {
+        return new BinaryStatistics(input, extensionRegistry);
+      }
+    };
+
+    @java.lang.Override
+    public com.google.protobuf.Parser<BinaryStatistics> getParserForType() {
+      return PARSER;
+    }
+
+    private int bitField0_;
+    // optional sint64 sum = 1;
+    public static final int SUM_FIELD_NUMBER = 1;
+    private long sum_;
+    /**
+     * optional sint64 sum = 1;
+     *
+     *
+     * sum will store the total binary blob length in a stripe
+     *
+     */
+    public boolean hasSum() {
+      return ((bitField0_ & 0x00000001) == 0x00000001);
+    }
+    /**
+     * optional sint64 sum = 1;
+     *
+     *
+     * sum will store the total binary blob length in a stripe
+     *
      */
-    public int getMaximum() {
-      return maximum_;
+    public long getSum() {
+      return sum_;
    }

    private void initFields() {
-      minimum_ = 0;
-      maximum_ = 0;
+      sum_ = 0L;
    }
    private byte memoizedIsInitialized = -1;
    public final boolean isInitialized() {
@@ -3302,10 +3892,7 @@ public void writeTo(com.google.protobuf.CodedOutputStream output)
        throws java.io.IOException {
      getSerializedSize();
      if (((bitField0_ & 0x00000001) == 0x00000001)) {
-        output.writeSInt32(1, minimum_);
-      }
-      if (((bitField0_ & 0x00000002) == 0x00000002)) {
-        output.writeSInt32(2, maximum_);
+        output.writeSInt64(1, sum_);
      }
      getUnknownFields().writeTo(output);
    }
@@ -3318,11 +3905,7 @@ public int getSerializedSize() {
      size = 0;
      if (((bitField0_ & 0x00000001) == 0x00000001)) {
        size += com.google.protobuf.CodedOutputStream
-          .computeSInt32Size(1, minimum_);
-      }
-      if (((bitField0_ & 0x00000002) == 0x00000002)) {
-        size += com.google.protobuf.CodedOutputStream
-          .computeSInt32Size(2, maximum_);
+          .computeSInt64Size(1, sum_);
      }
      size += getUnknownFields().getSerializedSize();
      memoizedSerializedSize = size;
@@ -3336,53 +3919,53 @@ public int getSerializedSize() {
      return super.writeReplace();
    }

-    public static org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics parseFrom(
+    public static org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics parseFrom(
        com.google.protobuf.ByteString data)
        throws com.google.protobuf.InvalidProtocolBufferException {
      return PARSER.parseFrom(data);
    }
-    public static org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics parseFrom(
+    public static org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics parseFrom(
        com.google.protobuf.ByteString data,
        com.google.protobuf.ExtensionRegistryLite extensionRegistry)
        throws com.google.protobuf.InvalidProtocolBufferException {
      return PARSER.parseFrom(data, extensionRegistry);
    }
-    public static org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics parseFrom(byte[] data)
+    public static org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics parseFrom(byte[] data)
        throws com.google.protobuf.InvalidProtocolBufferException {
      return PARSER.parseFrom(data);
    }
-    public static org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics parseFrom(
+    public static org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics parseFrom(
        byte[] data,
        com.google.protobuf.ExtensionRegistryLite extensionRegistry)
        throws com.google.protobuf.InvalidProtocolBufferException {
      return PARSER.parseFrom(data, extensionRegistry);
    }
-    public static org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics parseFrom(java.io.InputStream input)
+    public static org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics parseFrom(java.io.InputStream input)
        throws java.io.IOException {
      return PARSER.parseFrom(input);
    }
-    public static org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics parseFrom(
+    public static org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics parseFrom(
        java.io.InputStream input,
        com.google.protobuf.ExtensionRegistryLite extensionRegistry)
        throws java.io.IOException {
      return PARSER.parseFrom(input, extensionRegistry);
    }
-    public static org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics parseDelimitedFrom(java.io.InputStream input)
+    public static org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics parseDelimitedFrom(java.io.InputStream input)
        throws java.io.IOException {
      return PARSER.parseDelimitedFrom(input);
    }
-    public static org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics parseDelimitedFrom(
+    public static org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics parseDelimitedFrom(
        java.io.InputStream input,
        com.google.protobuf.ExtensionRegistryLite extensionRegistry)
        throws java.io.IOException {
      return PARSER.parseDelimitedFrom(input, extensionRegistry);
    }
-    public static org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics parseFrom(
+    public static org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics parseFrom(
        com.google.protobuf.CodedInputStream input)
        throws java.io.IOException {
      return PARSER.parseFrom(input);
    }
-    public static org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics parseFrom(
+    public static org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics parseFrom(
        com.google.protobuf.CodedInputStream input,
        com.google.protobuf.ExtensionRegistryLite extensionRegistry)
        throws java.io.IOException {
@@ -3391,7 +3974,7 @@ public int getSerializedSize() {

    public static Builder newBuilder() { return Builder.create(); }
    public Builder newBuilderForType() { return newBuilder(); }
-    public static Builder newBuilder(org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics prototype) {
+    public static Builder newBuilder(org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics prototype) {
      return newBuilder().mergeFrom(prototype);
    }
    public Builder toBuilder() { return newBuilder(this); }
@@ -3403,24 +3986,24 @@ protected Builder newBuilderForType(
      return builder;
    }
    /**
-     * Protobuf type {@code org.apache.hadoop.hive.ql.io.orc.DateStatistics}
+     * Protobuf type {@code org.apache.hadoop.hive.ql.io.orc.BinaryStatistics}
     */
    public static final class Builder extends
        com.google.protobuf.GeneratedMessage.Builder<Builder>
-       implements org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatisticsOrBuilder {
+       implements org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatisticsOrBuilder {
    /**
-     * optional sint32 minimum = 1;
+ * optional sint64 sum = 1;
*
*
- * min,max values saved as days since epoch
+ * sum will store the total binary blob length in a stripe
*
*/
- public boolean hasMinimum() {
+ public boolean hasSum() {
return ((bitField0_ & 0x00000001) == 0x00000001);
}
/**
- * optional sint32 minimum = 1;
+ * optional sint64 sum = 1;
*
*
- * min,max values saved as days since epoch
+ * sum will store the total binary blob length in a stripe
*
*/
- public int getMinimum() {
- return minimum_;
+ public long getSum() {
+ return sum_;
}
/**
- * optional sint32 minimum = 1;
+ * optional sint64 sum = 1;
*
*
- * min,max values saved as days since epoch
+ * sum will store the total binary blob length in a stripe
*
*/
- public Builder setMinimum(int value) {
+ public Builder setSum(long value) {
bitField0_ |= 0x00000001;
- minimum_ = value;
+ sum_ = value;
onChanged();
return this;
}
/**
- * optional sint32 minimum = 1;
+ * optional sint64 sum = 1;
*
*
- * min,max values saved as days since epoch
+ * sum will store the total binary blob length in a stripe
*
*/
- public Builder clearMinimum() {
+ public Builder clearSum() {
bitField0_ = (bitField0_ & ~0x00000001);
- minimum_ = 0;
- onChanged();
- return this;
- }
-
- // optional sint32 maximum = 2;
- private int maximum_ ;
- /**
- * optional sint32 maximum = 2;
- */
- public boolean hasMaximum() {
- return ((bitField0_ & 0x00000002) == 0x00000002);
- }
- /**
- * optional sint32 maximum = 2;
- */
- public int getMaximum() {
- return maximum_;
- }
- /**
- * optional sint32 maximum = 2;
- */
- public Builder setMaximum(int value) {
- bitField0_ |= 0x00000002;
- maximum_ = value;
- onChanged();
- return this;
- }
- /**
- * optional sint32 maximum = 2;
- */
- public Builder clearMaximum() {
- bitField0_ = (bitField0_ & ~0x00000002);
- maximum_ = 0;
+ sum_ = 0L;
onChanged();
return this;
}
- // @@protoc_insertion_point(builder_scope:org.apache.hadoop.hive.ql.io.orc.DateStatistics)
+ // @@protoc_insertion_point(builder_scope:org.apache.hadoop.hive.ql.io.orc.BinaryStatistics)
}
static {
- defaultInstance = new DateStatistics(true);
+ defaultInstance = new BinaryStatistics(true);
defaultInstance.initFields();
}
- // @@protoc_insertion_point(class_scope:org.apache.hadoop.hive.ql.io.orc.DateStatistics)
+ // @@protoc_insertion_point(class_scope:org.apache.hadoop.hive.ql.io.orc.BinaryStatistics)
}
public interface ColumnStatisticsOrBuilder
@@ -3718,6 +4259,20 @@ public Builder clearMaximum() {
* optional .org.apache.hadoop.hive.ql.io.orc.DateStatistics dateStatistics = 7;
*/
org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatisticsOrBuilder getDateStatisticsOrBuilder();
+
+ // optional .org.apache.hadoop.hive.ql.io.orc.BinaryStatistics binaryStatistics = 8;
+ /**
+ * optional .org.apache.hadoop.hive.ql.io.orc.BinaryStatistics binaryStatistics = 8;
+ */
+ boolean hasBinaryStatistics();
+ /**
+ * optional .org.apache.hadoop.hive.ql.io.orc.BinaryStatistics binaryStatistics = 8;
+ */
+ org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics getBinaryStatistics();
+ /**
+ * optional .org.apache.hadoop.hive.ql.io.orc.BinaryStatistics binaryStatistics = 8;
+ */
+ org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatisticsOrBuilder getBinaryStatisticsOrBuilder();
}
/**
* Protobuf type {@code org.apache.hadoop.hive.ql.io.orc.ColumnStatistics}
@@ -3853,6 +4408,19 @@ private ColumnStatistics(
bitField0_ |= 0x00000040;
break;
}
+ case 66: {
+ org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics.Builder subBuilder = null;
+ if (((bitField0_ & 0x00000080) == 0x00000080)) {
+ subBuilder = binaryStatistics_.toBuilder();
+ }
+ binaryStatistics_ = input.readMessage(org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics.PARSER, extensionRegistry);
+ if (subBuilder != null) {
+ subBuilder.mergeFrom(binaryStatistics_);
+ binaryStatistics_ = subBuilder.buildPartial();
+ }
+ bitField0_ |= 0x00000080;
+ break;
+ }
}
}
} catch (com.google.protobuf.InvalidProtocolBufferException e) {
@@ -4041,6 +4609,28 @@ public boolean hasDateStatistics() {
return dateStatistics_;
}
+ // optional .org.apache.hadoop.hive.ql.io.orc.BinaryStatistics binaryStatistics = 8;
+ public static final int BINARYSTATISTICS_FIELD_NUMBER = 8;
+ private org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics binaryStatistics_;
+ /**
+ * optional .org.apache.hadoop.hive.ql.io.orc.BinaryStatistics binaryStatistics = 8;
+ */
+ public boolean hasBinaryStatistics() {
+ return ((bitField0_ & 0x00000080) == 0x00000080);
+ }
+ /**
+ * optional .org.apache.hadoop.hive.ql.io.orc.BinaryStatistics binaryStatistics = 8;
+ */
+ public org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics getBinaryStatistics() {
+ return binaryStatistics_;
+ }
+ /**
+ * optional .org.apache.hadoop.hive.ql.io.orc.BinaryStatistics binaryStatistics = 8;
+ */
+ public org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatisticsOrBuilder getBinaryStatisticsOrBuilder() {
+ return binaryStatistics_;
+ }
+
private void initFields() {
numberOfValues_ = 0L;
intStatistics_ = org.apache.hadoop.hive.ql.io.orc.OrcProto.IntegerStatistics.getDefaultInstance();
@@ -4049,6 +4639,7 @@ private void initFields() {
bucketStatistics_ = org.apache.hadoop.hive.ql.io.orc.OrcProto.BucketStatistics.getDefaultInstance();
decimalStatistics_ = org.apache.hadoop.hive.ql.io.orc.OrcProto.DecimalStatistics.getDefaultInstance();
dateStatistics_ = org.apache.hadoop.hive.ql.io.orc.OrcProto.DateStatistics.getDefaultInstance();
+ binaryStatistics_ = org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics.getDefaultInstance();
}
private byte memoizedIsInitialized = -1;
public final boolean isInitialized() {
@@ -4083,6 +4674,9 @@ public void writeTo(com.google.protobuf.CodedOutputStream output)
if (((bitField0_ & 0x00000040) == 0x00000040)) {
output.writeMessage(7, dateStatistics_);
}
+ if (((bitField0_ & 0x00000080) == 0x00000080)) {
+ output.writeMessage(8, binaryStatistics_);
+ }
getUnknownFields().writeTo(output);
}
@@ -4120,6 +4714,10 @@ public int getSerializedSize() {
size += com.google.protobuf.CodedOutputStream
.computeMessageSize(7, dateStatistics_);
}
+ if (((bitField0_ & 0x00000080) == 0x00000080)) {
+ size += com.google.protobuf.CodedOutputStream
+ .computeMessageSize(8, binaryStatistics_);
+ }
size += getUnknownFields().getSerializedSize();
memoizedSerializedSize = size;
return size;
@@ -4234,6 +4832,7 @@ private void maybeForceBuilderInitialization() {
getBucketStatisticsFieldBuilder();
getDecimalStatisticsFieldBuilder();
getDateStatisticsFieldBuilder();
+ getBinaryStatisticsFieldBuilder();
}
}
private static Builder create() {
@@ -4280,6 +4879,12 @@ public Builder clear() {
dateStatisticsBuilder_.clear();
}
bitField0_ = (bitField0_ & ~0x00000040);
+ if (binaryStatisticsBuilder_ == null) {
+ binaryStatistics_ = org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics.getDefaultInstance();
+ } else {
+ binaryStatisticsBuilder_.clear();
+ }
+ bitField0_ = (bitField0_ & ~0x00000080);
return this;
}
@@ -4360,6 +4965,14 @@ public Builder clone() {
} else {
result.dateStatistics_ = dateStatisticsBuilder_.build();
}
+ if (((from_bitField0_ & 0x00000080) == 0x00000080)) {
+ to_bitField0_ |= 0x00000080;
+ }
+ if (binaryStatisticsBuilder_ == null) {
+ result.binaryStatistics_ = binaryStatistics_;
+ } else {
+ result.binaryStatistics_ = binaryStatisticsBuilder_.build();
+ }
result.bitField0_ = to_bitField0_;
onBuilt();
return result;
@@ -4397,6 +5010,9 @@ public Builder mergeFrom(org.apache.hadoop.hive.ql.io.orc.OrcProto.ColumnStatist
if (other.hasDateStatistics()) {
mergeDateStatistics(other.getDateStatistics());
}
+ if (other.hasBinaryStatistics()) {
+ mergeBinaryStatistics(other.getBinaryStatistics());
+ }
this.mergeUnknownFields(other.getUnknownFields());
return this;
}
@@ -5159,6 +5775,123 @@ public Builder clearDateStatistics() {
return dateStatisticsBuilder_;
}
+ // optional .org.apache.hadoop.hive.ql.io.orc.BinaryStatistics binaryStatistics = 8;
+ private org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics binaryStatistics_ = org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics.getDefaultInstance();
+ private com.google.protobuf.SingleFieldBuilder<
+ org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics, org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics.Builder, org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatisticsOrBuilder> binaryStatisticsBuilder_;
+ /**
+ * optional .org.apache.hadoop.hive.ql.io.orc.BinaryStatistics binaryStatistics = 8;
+ */
+ public boolean hasBinaryStatistics() {
+ return ((bitField0_ & 0x00000080) == 0x00000080);
+ }
+ /**
+ * optional .org.apache.hadoop.hive.ql.io.orc.BinaryStatistics binaryStatistics = 8;
+ */
+ public org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics getBinaryStatistics() {
+ if (binaryStatisticsBuilder_ == null) {
+ return binaryStatistics_;
+ } else {
+ return binaryStatisticsBuilder_.getMessage();
+ }
+ }
+ /**
+ * optional .org.apache.hadoop.hive.ql.io.orc.BinaryStatistics binaryStatistics = 8;
+ */
+ public Builder setBinaryStatistics(org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics value) {
+ if (binaryStatisticsBuilder_ == null) {
+ if (value == null) {
+ throw new NullPointerException();
+ }
+ binaryStatistics_ = value;
+ onChanged();
+ } else {
+ binaryStatisticsBuilder_.setMessage(value);
+ }
+ bitField0_ |= 0x00000080;
+ return this;
+ }
+ /**
+ * optional .org.apache.hadoop.hive.ql.io.orc.BinaryStatistics binaryStatistics = 8;
+ */
+ public Builder setBinaryStatistics(
+ org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics.Builder builderForValue) {
+ if (binaryStatisticsBuilder_ == null) {
+ binaryStatistics_ = builderForValue.build();
+ onChanged();
+ } else {
+ binaryStatisticsBuilder_.setMessage(builderForValue.build());
+ }
+ bitField0_ |= 0x00000080;
+ return this;
+ }
+ /**
+ * optional .org.apache.hadoop.hive.ql.io.orc.BinaryStatistics binaryStatistics = 8;
+ */
+ public Builder mergeBinaryStatistics(org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics value) {
+ if (binaryStatisticsBuilder_ == null) {
+ if (((bitField0_ & 0x00000080) == 0x00000080) &&
+ binaryStatistics_ != org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics.getDefaultInstance()) {
+ binaryStatistics_ =
+ org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics.newBuilder(binaryStatistics_).mergeFrom(value).buildPartial();
+ } else {
+ binaryStatistics_ = value;
+ }
+ onChanged();
+ } else {
+ binaryStatisticsBuilder_.mergeFrom(value);
+ }
+ bitField0_ |= 0x00000080;
+ return this;
+ }
+ /**
+ * optional .org.apache.hadoop.hive.ql.io.orc.BinaryStatistics binaryStatistics = 8;
+ */
+ public Builder clearBinaryStatistics() {
+ if (binaryStatisticsBuilder_ == null) {
+ binaryStatistics_ = org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics.getDefaultInstance();
+ onChanged();
+ } else {
+ binaryStatisticsBuilder_.clear();
+ }
+ bitField0_ = (bitField0_ & ~0x00000080);
+ return this;
+ }
+ /**
+ * optional .org.apache.hadoop.hive.ql.io.orc.BinaryStatistics binaryStatistics = 8;
+ */
+ public org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics.Builder getBinaryStatisticsBuilder() {
+ bitField0_ |= 0x00000080;
+ onChanged();
+ return getBinaryStatisticsFieldBuilder().getBuilder();
+ }
+ /**
+ * optional .org.apache.hadoop.hive.ql.io.orc.BinaryStatistics binaryStatistics = 8;
+ */
+ public org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatisticsOrBuilder getBinaryStatisticsOrBuilder() {
+ if (binaryStatisticsBuilder_ != null) {
+ return binaryStatisticsBuilder_.getMessageOrBuilder();
+ } else {
+ return binaryStatistics_;
+ }
+ }
+ /**
+ * optional .org.apache.hadoop.hive.ql.io.orc.BinaryStatistics binaryStatistics = 8;
+ */
+ private com.google.protobuf.SingleFieldBuilder<
+ org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics, org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics.Builder, org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatisticsOrBuilder>
+ getBinaryStatisticsFieldBuilder() {
+ if (binaryStatisticsBuilder_ == null) {
+ binaryStatisticsBuilder_ = new com.google.protobuf.SingleFieldBuilder<
+ org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics, org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatistics.Builder, org.apache.hadoop.hive.ql.io.orc.OrcProto.BinaryStatisticsOrBuilder>(
+ binaryStatistics_,
+ getParentForChildren(),
+ isClean());
+ binaryStatistics_ = null;
+ }
+ return binaryStatisticsBuilder_;
+ }
+
// @@protoc_insertion_point(builder_scope:org.apache.hadoop.hive.ql.io.orc.ColumnStatistics)
}
@@ -14321,6 +15054,11 @@ public Builder setMagicBytes(
com.google.protobuf.GeneratedMessage.FieldAccessorTable
internal_static_org_apache_hadoop_hive_ql_io_orc_DateStatistics_fieldAccessorTable;
private static com.google.protobuf.Descriptors.Descriptor
+ internal_static_org_apache_hadoop_hive_ql_io_orc_BinaryStatistics_descriptor;
+ private static
+ com.google.protobuf.GeneratedMessage.FieldAccessorTable
+ internal_static_org_apache_hadoop_hive_ql_io_orc_BinaryStatistics_fieldAccessorTable;
+ private static com.google.protobuf.Descriptors.Descriptor
internal_static_org_apache_hadoop_hive_ql_io_orc_ColumnStatistics_descriptor;
private static
com.google.protobuf.GeneratedMessage.FieldAccessorTable
@@ -14388,71 +15126,74 @@ public Builder setMagicBytes(
"e.ql.io.orc\"B\n\021IntegerStatistics\022\017\n\007mini" +
"mum\030\001 \001(\022\022\017\n\007maximum\030\002 \001(\022\022\013\n\003sum\030\003 \001(\022\"" +
"A\n\020DoubleStatistics\022\017\n\007minimum\030\001 \001(\001\022\017\n\007" +
- "maximum\030\002 \001(\001\022\013\n\003sum\030\003 \001(\001\"4\n\020StringStat" +
+ "maximum\030\002 \001(\001\022\013\n\003sum\030\003 \001(\001\"A\n\020StringStat" +
"istics\022\017\n\007minimum\030\001 \001(\t\022\017\n\007maximum\030\002 \001(\t" +
- "\"%\n\020BucketStatistics\022\021\n\005count\030\001 \003(\004B\002\020\001\"" +
- "B\n\021DecimalStatistics\022\017\n\007minimum\030\001 \001(\t\022\017\n" +
- "\007maximum\030\002 \001(\t\022\013\n\003sum\030\003 \001(\t\"2\n\016DateStati" +
- "stics\022\017\n\007minimum\030\001 \001(\021\022\017\n\007maximum\030\002 \001(\021\"",
- "\372\003\n\020ColumnStatistics\022\026\n\016numberOfValues\030\001" +
- " \001(\004\022J\n\rintStatistics\030\002 \001(\01323.org.apache" +
- ".hadoop.hive.ql.io.orc.IntegerStatistics" +
- "\022L\n\020doubleStatistics\030\003 \001(\01322.org.apache." +
- "hadoop.hive.ql.io.orc.DoubleStatistics\022L" +
- "\n\020stringStatistics\030\004 \001(\01322.org.apache.ha" +
- "doop.hive.ql.io.orc.StringStatistics\022L\n\020" +
- "bucketStatistics\030\005 \001(\01322.org.apache.hado" +
- "op.hive.ql.io.orc.BucketStatistics\022N\n\021de" +
- "cimalStatistics\030\006 \001(\01323.org.apache.hadoo",
- "p.hive.ql.io.orc.DecimalStatistics\022H\n\016da" +
- "teStatistics\030\007 \001(\01320.org.apache.hadoop.h" +
- "ive.ql.io.orc.DateStatistics\"n\n\rRowIndex" +
- "Entry\022\025\n\tpositions\030\001 \003(\004B\002\020\001\022F\n\nstatisti" +
- "cs\030\002 \001(\01322.org.apache.hadoop.hive.ql.io." +
- "orc.ColumnStatistics\"J\n\010RowIndex\022>\n\005entr" +
- "y\030\001 \003(\0132/.org.apache.hadoop.hive.ql.io.o" +
- "rc.RowIndexEntry\"\331\001\n\006Stream\022;\n\004kind\030\001 \002(" +
- "\0162-.org.apache.hadoop.hive.ql.io.orc.Str" +
- "eam.Kind\022\016\n\006column\030\002 \001(\r\022\016\n\006length\030\003 \001(\004",
- "\"r\n\004Kind\022\013\n\007PRESENT\020\000\022\010\n\004DATA\020\001\022\n\n\006LENGT" +
- "H\020\002\022\023\n\017DICTIONARY_DATA\020\003\022\024\n\020DICTIONARY_C" +
- "OUNT\020\004\022\r\n\tSECONDARY\020\005\022\r\n\tROW_INDEX\020\006\"\263\001\n" +
- "\016ColumnEncoding\022C\n\004kind\030\001 \002(\01625.org.apac" +
- "he.hadoop.hive.ql.io.orc.ColumnEncoding." +
- "Kind\022\026\n\016dictionarySize\030\002 \001(\r\"D\n\004Kind\022\n\n\006" +
- "DIRECT\020\000\022\016\n\nDICTIONARY\020\001\022\r\n\tDIRECT_V2\020\002\022" +
- "\021\n\rDICTIONARY_V2\020\003\"\214\001\n\014StripeFooter\0229\n\007s" +
- "treams\030\001 \003(\0132(.org.apache.hadoop.hive.ql" +
- ".io.orc.Stream\022A\n\007columns\030\002 \003(\01320.org.ap",
- "ache.hadoop.hive.ql.io.orc.ColumnEncodin" +
- "g\"\314\002\n\004Type\0229\n\004kind\030\001 \002(\0162+.org.apache.ha" +
- "doop.hive.ql.io.orc.Type.Kind\022\024\n\010subtype" +
- "s\030\002 \003(\rB\002\020\001\022\022\n\nfieldNames\030\003 \003(\t\022\025\n\rmaxim" +
- "umLength\030\004 \001(\r\"\307\001\n\004Kind\022\013\n\007BOOLEAN\020\000\022\010\n\004" +
- "BYTE\020\001\022\t\n\005SHORT\020\002\022\007\n\003INT\020\003\022\010\n\004LONG\020\004\022\t\n\005" +
- "FLOAT\020\005\022\n\n\006DOUBLE\020\006\022\n\n\006STRING\020\007\022\n\n\006BINAR" +
- "Y\020\010\022\r\n\tTIMESTAMP\020\t\022\010\n\004LIST\020\n\022\007\n\003MAP\020\013\022\n\n" +
- "\006STRUCT\020\014\022\t\n\005UNION\020\r\022\013\n\007DECIMAL\020\016\022\010\n\004DAT" +
- "E\020\017\022\013\n\007VARCHAR\020\020\"x\n\021StripeInformation\022\016\n",
- "\006offset\030\001 \001(\004\022\023\n\013indexLength\030\002 \001(\004\022\022\n\nda" +
- "taLength\030\003 \001(\004\022\024\n\014footerLength\030\004 \001(\004\022\024\n\014" +
- "numberOfRows\030\005 \001(\004\"/\n\020UserMetadataItem\022\014" +
- "\n\004name\030\001 \002(\t\022\r\n\005value\030\002 \002(\014\"\356\002\n\006Footer\022\024" +
- "\n\014headerLength\030\001 \001(\004\022\025\n\rcontentLength\030\002 " +
- "\001(\004\022D\n\007stripes\030\003 \003(\01323.org.apache.hadoop" +
- ".hive.ql.io.orc.StripeInformation\0225\n\005typ" +
- "es\030\004 \003(\0132&.org.apache.hadoop.hive.ql.io." +
- "orc.Type\022D\n\010metadata\030\005 \003(\01322.org.apache." +
- "hadoop.hive.ql.io.orc.UserMetadataItem\022\024",
- "\n\014numberOfRows\030\006 \001(\004\022F\n\nstatistics\030\007 \003(\013" +
- "22.org.apache.hadoop.hive.ql.io.orc.Colu" +
- "mnStatistics\022\026\n\016rowIndexStride\030\010 \001(\r\"\255\001\n" +
- "\nPostScript\022\024\n\014footerLength\030\001 \001(\004\022F\n\013com" +
- "pression\030\002 \001(\01621.org.apache.hadoop.hive." +
- "ql.io.orc.CompressionKind\022\034\n\024compression" +
- "BlockSize\030\003 \001(\004\022\023\n\007version\030\004 \003(\rB\002\020\001\022\016\n\005" +
- "magic\030\300> \001(\t*:\n\017CompressionKind\022\010\n\004NONE\020" +
- "\000\022\010\n\004ZLIB\020\001\022\n\n\006SNAPPY\020\002\022\007\n\003LZO\020\003"
+ "\022\013\n\003sum\030\003 \001(\022\"%\n\020BucketStatistics\022\021\n\005cou" +
+ "nt\030\001 \003(\004B\002\020\001\"B\n\021DecimalStatistics\022\017\n\007min" +
+ "imum\030\001 \001(\t\022\017\n\007maximum\030\002 \001(\t\022\013\n\003sum\030\003 \001(\t" +
+ "\"2\n\016DateStatistics\022\017\n\007minimum\030\001 \001(\021\022\017\n\007m",
+ "aximum\030\002 \001(\021\"\037\n\020BinaryStatistics\022\013\n\003sum\030" +
+ "\001 \001(\022\"\310\004\n\020ColumnStatistics\022\026\n\016numberOfVa" +
+ "lues\030\001 \001(\004\022J\n\rintStatistics\030\002 \001(\01323.org." +
+ "apache.hadoop.hive.ql.io.orc.IntegerStat" +
+ "istics\022L\n\020doubleStatistics\030\003 \001(\01322.org.a" +
+ "pache.hadoop.hive.ql.io.orc.DoubleStatis" +
+ "tics\022L\n\020stringStatistics\030\004 \001(\01322.org.apa" +
+ "che.hadoop.hive.ql.io.orc.StringStatisti" +
+ "cs\022L\n\020bucketStatistics\030\005 \001(\01322.org.apach" +
+ "e.hadoop.hive.ql.io.orc.BucketStatistics",
+ "\022N\n\021decimalStatistics\030\006 \001(\01323.org.apache" +
+ ".hadoop.hive.ql.io.orc.DecimalStatistics" +
+ "\022H\n\016dateStatistics\030\007 \001(\01320.org.apache.ha" +
+ "doop.hive.ql.io.orc.DateStatistics\022L\n\020bi" +
+ "naryStatistics\030\010 \001(\01322.org.apache.hadoop" +
+ ".hive.ql.io.orc.BinaryStatistics\"n\n\rRowI" +
+ "ndexEntry\022\025\n\tpositions\030\001 \003(\004B\002\020\001\022F\n\nstat" +
+ "istics\030\002 \001(\01322.org.apache.hadoop.hive.ql" +
+ ".io.orc.ColumnStatistics\"J\n\010RowIndex\022>\n\005" +
+ "entry\030\001 \003(\0132/.org.apache.hadoop.hive.ql.",
+ "io.orc.RowIndexEntry\"\331\001\n\006Stream\022;\n\004kind\030" +
+ "\001 \002(\0162-.org.apache.hadoop.hive.ql.io.orc" +
+ ".Stream.Kind\022\016\n\006column\030\002 \001(\r\022\016\n\006length\030\003" +
+ " \001(\004\"r\n\004Kind\022\013\n\007PRESENT\020\000\022\010\n\004DATA\020\001\022\n\n\006L" +
+ "ENGTH\020\002\022\023\n\017DICTIONARY_DATA\020\003\022\024\n\020DICTIONA" +
+ "RY_COUNT\020\004\022\r\n\tSECONDARY\020\005\022\r\n\tROW_INDEX\020\006" +
+ "\"\263\001\n\016ColumnEncoding\022C\n\004kind\030\001 \002(\01625.org." +
+ "apache.hadoop.hive.ql.io.orc.ColumnEncod" +
+ "ing.Kind\022\026\n\016dictionarySize\030\002 \001(\r\"D\n\004Kind" +
+ "\022\n\n\006DIRECT\020\000\022\016\n\nDICTIONARY\020\001\022\r\n\tDIRECT_V",
+ "2\020\002\022\021\n\rDICTIONARY_V2\020\003\"\214\001\n\014StripeFooter\022" +
+ "9\n\007streams\030\001 \003(\0132(.org.apache.hadoop.hiv" +
+ "e.ql.io.orc.Stream\022A\n\007columns\030\002 \003(\01320.or" +
+ "g.apache.hadoop.hive.ql.io.orc.ColumnEnc" +
+ "oding\"\314\002\n\004Type\0229\n\004kind\030\001 \002(\0162+.org.apach" +
+ "e.hadoop.hive.ql.io.orc.Type.Kind\022\024\n\010sub" +
+ "types\030\002 \003(\rB\002\020\001\022\022\n\nfieldNames\030\003 \003(\t\022\025\n\rm" +
+ "aximumLength\030\004 \001(\r\"\307\001\n\004Kind\022\013\n\007BOOLEAN\020\000" +
+ "\022\010\n\004BYTE\020\001\022\t\n\005SHORT\020\002\022\007\n\003INT\020\003\022\010\n\004LONG\020\004" +
+ "\022\t\n\005FLOAT\020\005\022\n\n\006DOUBLE\020\006\022\n\n\006STRING\020\007\022\n\n\006B",
+ "INARY\020\010\022\r\n\tTIMESTAMP\020\t\022\010\n\004LIST\020\n\022\007\n\003MAP\020" +
+ "\013\022\n\n\006STRUCT\020\014\022\t\n\005UNION\020\r\022\013\n\007DECIMAL\020\016\022\010\n" +
+ "\004DATE\020\017\022\013\n\007VARCHAR\020\020\"x\n\021StripeInformatio" +
+ "n\022\016\n\006offset\030\001 \001(\004\022\023\n\013indexLength\030\002 \001(\004\022\022" +
+ "\n\ndataLength\030\003 \001(\004\022\024\n\014footerLength\030\004 \001(\004" +
+ "\022\024\n\014numberOfRows\030\005 \001(\004\"/\n\020UserMetadataIt" +
+ "em\022\014\n\004name\030\001 \002(\t\022\r\n\005value\030\002 \002(\014\"\356\002\n\006Foot" +
+ "er\022\024\n\014headerLength\030\001 \001(\004\022\025\n\rcontentLengt" +
+ "h\030\002 \001(\004\022D\n\007stripes\030\003 \003(\01323.org.apache.ha" +
+ "doop.hive.ql.io.orc.StripeInformation\0225\n",
+ "\005types\030\004 \003(\0132&.org.apache.hadoop.hive.ql" +
+ ".io.orc.Type\022D\n\010metadata\030\005 \003(\01322.org.apa" +
+ "che.hadoop.hive.ql.io.orc.UserMetadataIt" +
+ "em\022\024\n\014numberOfRows\030\006 \001(\004\022F\n\nstatistics\030\007" +
+ " \003(\01322.org.apache.hadoop.hive.ql.io.orc." +
+ "ColumnStatistics\022\026\n\016rowIndexStride\030\010 \001(\r" +
+ "\"\255\001\n\nPostScript\022\024\n\014footerLength\030\001 \001(\004\022F\n" +
+ "\013compression\030\002 \001(\01621.org.apache.hadoop.h" +
+ "ive.ql.io.orc.CompressionKind\022\034\n\024compres" +
+ "sionBlockSize\030\003 \001(\004\022\023\n\007version\030\004 \003(\rB\002\020\001",
+ "\022\016\n\005magic\030\300> \001(\t*:\n\017CompressionKind\022\010\n\004N" +
+ "ONE\020\000\022\010\n\004ZLIB\020\001\022\n\n\006SNAPPY\020\002\022\007\n\003LZO\020\003"
};
com.google.protobuf.Descriptors.FileDescriptor.InternalDescriptorAssigner assigner =
new com.google.protobuf.Descriptors.FileDescriptor.InternalDescriptorAssigner() {
@@ -14476,7 +15217,7 @@ public Builder setMagicBytes(
internal_static_org_apache_hadoop_hive_ql_io_orc_StringStatistics_fieldAccessorTable = new
com.google.protobuf.GeneratedMessage.FieldAccessorTable(
internal_static_org_apache_hadoop_hive_ql_io_orc_StringStatistics_descriptor,
- new java.lang.String[] { "Minimum", "Maximum", });
+ new java.lang.String[] { "Minimum", "Maximum", "Sum", });
internal_static_org_apache_hadoop_hive_ql_io_orc_BucketStatistics_descriptor =
getDescriptor().getMessageTypes().get(3);
internal_static_org_apache_hadoop_hive_ql_io_orc_BucketStatistics_fieldAccessorTable = new
@@ -14495,68 +15236,74 @@ public Builder setMagicBytes(
com.google.protobuf.GeneratedMessage.FieldAccessorTable(
internal_static_org_apache_hadoop_hive_ql_io_orc_DateStatistics_descriptor,
new java.lang.String[] { "Minimum", "Maximum", });
- internal_static_org_apache_hadoop_hive_ql_io_orc_ColumnStatistics_descriptor =
+ internal_static_org_apache_hadoop_hive_ql_io_orc_BinaryStatistics_descriptor =
getDescriptor().getMessageTypes().get(6);
+ internal_static_org_apache_hadoop_hive_ql_io_orc_BinaryStatistics_fieldAccessorTable = new
+ com.google.protobuf.GeneratedMessage.FieldAccessorTable(
+ internal_static_org_apache_hadoop_hive_ql_io_orc_BinaryStatistics_descriptor,
+ new java.lang.String[] { "Sum", });
+ internal_static_org_apache_hadoop_hive_ql_io_orc_ColumnStatistics_descriptor =
+ getDescriptor().getMessageTypes().get(7);
internal_static_org_apache_hadoop_hive_ql_io_orc_ColumnStatistics_fieldAccessorTable = new
com.google.protobuf.GeneratedMessage.FieldAccessorTable(
internal_static_org_apache_hadoop_hive_ql_io_orc_ColumnStatistics_descriptor,
- new java.lang.String[] { "NumberOfValues", "IntStatistics", "DoubleStatistics", "StringStatistics", "BucketStatistics", "DecimalStatistics", "DateStatistics", });
+ new java.lang.String[] { "NumberOfValues", "IntStatistics", "DoubleStatistics", "StringStatistics", "BucketStatistics", "DecimalStatistics", "DateStatistics", "BinaryStatistics", });
internal_static_org_apache_hadoop_hive_ql_io_orc_RowIndexEntry_descriptor =
- getDescriptor().getMessageTypes().get(7);
+ getDescriptor().getMessageTypes().get(8);
internal_static_org_apache_hadoop_hive_ql_io_orc_RowIndexEntry_fieldAccessorTable = new
com.google.protobuf.GeneratedMessage.FieldAccessorTable(
internal_static_org_apache_hadoop_hive_ql_io_orc_RowIndexEntry_descriptor,
new java.lang.String[] { "Positions", "Statistics", });
internal_static_org_apache_hadoop_hive_ql_io_orc_RowIndex_descriptor =
- getDescriptor().getMessageTypes().get(8);
+ getDescriptor().getMessageTypes().get(9);
internal_static_org_apache_hadoop_hive_ql_io_orc_RowIndex_fieldAccessorTable = new
com.google.protobuf.GeneratedMessage.FieldAccessorTable(
internal_static_org_apache_hadoop_hive_ql_io_orc_RowIndex_descriptor,
new java.lang.String[] { "Entry", });
internal_static_org_apache_hadoop_hive_ql_io_orc_Stream_descriptor =
- getDescriptor().getMessageTypes().get(9);
+ getDescriptor().getMessageTypes().get(10);
internal_static_org_apache_hadoop_hive_ql_io_orc_Stream_fieldAccessorTable = new
com.google.protobuf.GeneratedMessage.FieldAccessorTable(
internal_static_org_apache_hadoop_hive_ql_io_orc_Stream_descriptor,
new java.lang.String[] { "Kind", "Column", "Length", });
internal_static_org_apache_hadoop_hive_ql_io_orc_ColumnEncoding_descriptor =
- getDescriptor().getMessageTypes().get(10);
+ getDescriptor().getMessageTypes().get(11);
internal_static_org_apache_hadoop_hive_ql_io_orc_ColumnEncoding_fieldAccessorTable = new
com.google.protobuf.GeneratedMessage.FieldAccessorTable(
internal_static_org_apache_hadoop_hive_ql_io_orc_ColumnEncoding_descriptor,
new java.lang.String[] { "Kind", "DictionarySize", });
internal_static_org_apache_hadoop_hive_ql_io_orc_StripeFooter_descriptor =
- getDescriptor().getMessageTypes().get(11);
+ getDescriptor().getMessageTypes().get(12);
internal_static_org_apache_hadoop_hive_ql_io_orc_StripeFooter_fieldAccessorTable = new
com.google.protobuf.GeneratedMessage.FieldAccessorTable(
internal_static_org_apache_hadoop_hive_ql_io_orc_StripeFooter_descriptor,
new java.lang.String[] { "Streams", "Columns", });
internal_static_org_apache_hadoop_hive_ql_io_orc_Type_descriptor =
- getDescriptor().getMessageTypes().get(12);
+ getDescriptor().getMessageTypes().get(13);
internal_static_org_apache_hadoop_hive_ql_io_orc_Type_fieldAccessorTable = new
com.google.protobuf.GeneratedMessage.FieldAccessorTable(
internal_static_org_apache_hadoop_hive_ql_io_orc_Type_descriptor,
new java.lang.String[] { "Kind", "Subtypes", "FieldNames", "MaximumLength", });
internal_static_org_apache_hadoop_hive_ql_io_orc_StripeInformation_descriptor =
- getDescriptor().getMessageTypes().get(13);
+ getDescriptor().getMessageTypes().get(14);
internal_static_org_apache_hadoop_hive_ql_io_orc_StripeInformation_fieldAccessorTable = new
com.google.protobuf.GeneratedMessage.FieldAccessorTable(
internal_static_org_apache_hadoop_hive_ql_io_orc_StripeInformation_descriptor,
new java.lang.String[] { "Offset", "IndexLength", "DataLength", "FooterLength", "NumberOfRows", });
internal_static_org_apache_hadoop_hive_ql_io_orc_UserMetadataItem_descriptor =
- getDescriptor().getMessageTypes().get(14);
+ getDescriptor().getMessageTypes().get(15);
internal_static_org_apache_hadoop_hive_ql_io_orc_UserMetadataItem_fieldAccessorTable = new
com.google.protobuf.GeneratedMessage.FieldAccessorTable(
internal_static_org_apache_hadoop_hive_ql_io_orc_UserMetadataItem_descriptor,
new java.lang.String[] { "Name", "Value", });
internal_static_org_apache_hadoop_hive_ql_io_orc_Footer_descriptor =
- getDescriptor().getMessageTypes().get(15);
+ getDescriptor().getMessageTypes().get(16);
internal_static_org_apache_hadoop_hive_ql_io_orc_Footer_fieldAccessorTable = new
com.google.protobuf.GeneratedMessage.FieldAccessorTable(
internal_static_org_apache_hadoop_hive_ql_io_orc_Footer_descriptor,
new java.lang.String[] { "HeaderLength", "ContentLength", "Stripes", "Types", "Metadata", "NumberOfRows", "Statistics", "RowIndexStride", });
internal_static_org_apache_hadoop_hive_ql_io_orc_PostScript_descriptor =
- getDescriptor().getMessageTypes().get(16);
+ getDescriptor().getMessageTypes().get(17);
internal_static_org_apache_hadoop_hive_ql_io_orc_PostScript_fieldAccessorTable = new
com.google.protobuf.GeneratedMessage.FieldAccessorTable(
internal_static_org_apache_hadoop_hive_ql_io_orc_PostScript_descriptor,
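Taken together, the regenerated code above reflects three schema additions in orc_proto.proto: StringStatistics gains an optional sint64 sum = 3, a new BinaryStatistics message carries a single optional sint64 sum = 1, and ColumnStatistics references it through optional BinaryStatistics binaryStatistics = 8 (which is why every descriptor index after DateStatistics shifts by one in the getMessageTypes().get(N) calls above). A minimal sketch of how the regenerated builder API is used; the numeric values are invented for illustration:

    OrcProto.BinaryStatistics.Builder bin = OrcProto.BinaryStatistics.newBuilder()
        .setSum(67890L);                          // total binary blob length in a stripe
    OrcProto.ColumnStatistics stats = OrcProto.ColumnStatistics.newBuilder()
        .setNumberOfValues(1000L)                 // example count only
        .setBinaryStatistics(bin)
        .build();
    // Optional fields should be presence-checked before use:
    if (stats.hasBinaryStatistics() && stats.getBinaryStatistics().hasSum()) {
      long totalBytes = stats.getBinaryStatistics().getSum();  // 67890
    }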
diff --git ql/src/java/org/apache/hadoop/hive/ql/exec/FileSinkOperator.java ql/src/java/org/apache/hadoop/hive/ql/exec/FileSinkOperator.java
index bcee201..73388c1 100644
--- ql/src/java/org/apache/hadoop/hive/ql/exec/FileSinkOperator.java
+++ ql/src/java/org/apache/hadoop/hive/ql/exec/FileSinkOperator.java
@@ -38,8 +38,8 @@
import org.apache.hadoop.hive.ql.io.HiveFileFormatUtils;
import org.apache.hadoop.hive.ql.io.HiveKey;
import org.apache.hadoop.hive.ql.io.HiveOutputFormat;
-import org.apache.hadoop.hive.ql.io.HivePassThroughOutputFormat;
import org.apache.hadoop.hive.ql.io.HivePartitioner;
+import org.apache.hadoop.hive.ql.io.HivePassThroughOutputFormat;
import org.apache.hadoop.hive.ql.metadata.HiveException;
import org.apache.hadoop.hive.ql.plan.DynamicPartitionCtx;
import org.apache.hadoop.hive.ql.plan.ExprNodeDesc;
@@ -89,6 +89,7 @@
protected transient ListBucketingCtx lbCtx;
protected transient boolean isSkewedStoredAsSubDirectories;
private transient boolean statsCollectRawDataSize;
+ private transient boolean statsFromRecordWriter = false;
private static final transient String[] FATAL_ERR_MSG = {
@@ -106,6 +107,10 @@
void close(boolean abort) throws IOException;
}
+ public static interface StatsProvidingRecordWriter extends RecordWriter {
+ SerDeStats getStats();
+ }
+
public class FSPaths implements Cloneable {
Path tmpPath;
Path taskOutputTempPath;
@@ -516,6 +521,9 @@ private void createBucketFiles(FSPaths fsp) throws HiveException {
fsp.outWriters[filesIdx] = HiveFileFormatUtils.getHiveRecordWriter(
jc, conf.getTableInfo(), outputClass, conf, fsp.outPaths[filesIdx],
reporter);
+      // If the record writer provides stats, get them from there instead of from the serde
+ statsFromRecordWriter =
+ fsp.outWriters[filesIdx] instanceof StatsProvidingRecordWriter;
// increment the CREATED_FILES counter
if (reporter != null) {
reporter.incrCounter(ProgressCounter.CREATED_FILES, 1);
@@ -619,7 +627,7 @@ public void processOp(Object row, int tag) throws HiveException {
}
rowOutWriters = fpaths.outWriters;
- if (conf.isGatherStats()) {
+ if (conf.isGatherStats() && !statsFromRecordWriter) {
if (statsCollectRawDataSize) {
SerDeStats stats = serializer.getSerDeStats();
if (stats != null) {
@@ -634,8 +642,10 @@ public void processOp(Object row, int tag) throws HiveException {
row_count.set(row_count.get() + 1);
}
+ RecordWriter rowOutWriter = null;
+
if (!multiFileSpray) {
- rowOutWriters[0].write(recordValue);
+ rowOutWriter = rowOutWriters[0];
} else {
int keyHashCode = 0;
for (int i = 0; i < partitionEval.length; i++) {
@@ -646,8 +656,9 @@ public void processOp(Object row, int tag) throws HiveException {
key.setHashCode(keyHashCode);
int bucketNum = prtner.getBucket(key, null, totalFiles);
int idx = bucketMap.get(bucketNum);
- rowOutWriters[idx].write(recordValue);
+ rowOutWriter = rowOutWriters[idx];
}
+ rowOutWriter.write(recordValue);
} catch (IOException e) {
throw new HiveException(e);
} catch (SerDeException e) {
@@ -864,6 +875,26 @@ public void closeOp(boolean abort) throws HiveException {
if (!abort) {
for (FSPaths fsp : valToPaths.values()) {
fsp.closeWriters(abort);
+      // Before closing the operator, check whether statistics gathering was
+      // requested and is provided by the record writer. This differs from the
+      // statistics gathering done in processOp(): there, SerDe statistics are
+      // gathered and accumulated in a hashmap for every row added, which adds
+      // overhead to the actual row processing. If the record writer already
+      // gathers the statistics, it can simply return the accumulated totals,
+      // which are aggregated here across writers in the multi-file spray case.
+ if (conf.isGatherStats() && statsFromRecordWriter) {
+ for (int idx = 0; idx < fsp.outWriters.length; idx++) {
+ RecordWriter outWriter = fsp.outWriters[idx];
+ if (outWriter != null) {
+ SerDeStats stats = ((StatsProvidingRecordWriter) outWriter).getStats();
+ if (stats != null) {
+ fsp.stat.addToStat(StatsSetupConst.RAW_DATA_SIZE, stats.getRawDataSize());
+ fsp.stat.addToStat(StatsSetupConst.ROW_COUNT, stats.getRowCount());
+ }
+ }
+ }
+ }
+
if (isNativeTable) {
fsp.commit(fs);
}
@@ -934,7 +965,7 @@ public void checkOutputSpecs(FileSystem ignored, JobConf job) throws IOException
hiveOutputFormat = ReflectionUtils.newInstance(conf.getTableInfo().getOutputFileFormatClass(),job);
}
else {
- hiveOutputFormat = conf.getTableInfo().getOutputFileFormatClass().newInstance();
+ hiveOutputFormat = conf.getTableInfo().getOutputFileFormatClass().newInstance();
}
}
else {
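The FileSinkOperator change is the core of the patch: when a writer implements the new StatsProvidingRecordWriter interface, the per-row SerDe statistics path in processOp() is skipped, and the accumulated totals are read back once per writer in closeOp(). A hypothetical writer satisfying that contract might look like the following sketch (the class name and the raw-size approximation are invented for illustration):

    import java.io.IOException;
    import org.apache.hadoop.hive.ql.exec.FileSinkOperator;
    import org.apache.hadoop.hive.serde2.SerDeStats;
    import org.apache.hadoop.io.Writable;

    public class StatsCountingWriter
        implements FileSinkOperator.StatsProvidingRecordWriter {
      private long rowCount = 0;
      private long rawDataSize = 0;

      @Override
      public void write(Writable row) throws IOException {
        rowCount++;
        rawDataSize += row.toString().length(); // crude size estimate for the sketch
        // ... append the row to the underlying file ...
      }

      @Override
      public void close(boolean abort) throws IOException {
        // ... flush and close the underlying file ...
      }

      @Override
      public SerDeStats getStats() {
        // Return the totals gathered while writing; called once after close.
        SerDeStats stats = new SerDeStats();
        stats.setRowCount(rowCount);
        stats.setRawDataSize(rawDataSize);
        return stats;
      }
    }

Because getStats() is only consulted after closeWriters(), a writer can defer all of its bookkeeping to the close path if that is cheaper than per-row accounting.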
diff --git ql/src/java/org/apache/hadoop/hive/ql/io/orc/BinaryColumnStatistics.java ql/src/java/org/apache/hadoop/hive/ql/io/orc/BinaryColumnStatistics.java
new file mode 100644
index 0000000..23030a3
--- /dev/null
+++ ql/src/java/org/apache/hadoop/hive/ql/io/orc/BinaryColumnStatistics.java
@@ -0,0 +1,25 @@
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+package org.apache.hadoop.hive.ql.io.orc;
+
+/**
+ * Statistics for binary columns.
+ */
+public interface BinaryColumnStatistics extends ColumnStatistics {
+ long getSum();
+}
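BinaryColumnStatistics deliberately exposes only a sum: unlike strings or numbers, binary blobs have no useful min/max ordering, so the total length is the one aggregate worth tracking for size estimation. On the read side, a consumer would downcast the generic column statistics, roughly as in this hedged sketch (it assumes an ORC Reader instance named reader, for example one obtained from OrcFile.createReader):

    ColumnStatistics[] colStats = reader.getStatistics();
    for (ColumnStatistics cs : colStats) {
      if (cs instanceof BinaryColumnStatistics) {
        // total bytes of all binary values, as recorded by the writer
        long totalBytes = ((BinaryColumnStatistics) cs).getSum();
      }
    }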
diff --git ql/src/java/org/apache/hadoop/hive/ql/io/orc/ColumnStatisticsImpl.java ql/src/java/org/apache/hadoop/hive/ql/io/orc/ColumnStatisticsImpl.java
index 6268617..42d897c 100644
--- ql/src/java/org/apache/hadoop/hive/ql/io/orc/ColumnStatisticsImpl.java
+++ ql/src/java/org/apache/hadoop/hive/ql/io/orc/ColumnStatisticsImpl.java
@@ -21,6 +21,7 @@
import org.apache.hadoop.hive.serde2.io.DateWritable;
import org.apache.hadoop.hive.serde2.objectinspector.ObjectInspector;
import org.apache.hadoop.hive.serde2.objectinspector.PrimitiveObjectInspector;
+import org.apache.hadoop.io.BytesWritable;
class ColumnStatisticsImpl implements ColumnStatistics {
@@ -332,10 +333,11 @@ public String toString() {
}
}
- private static final class StringStatisticsImpl extends ColumnStatisticsImpl
+ protected static final class StringStatisticsImpl extends ColumnStatisticsImpl
implements StringColumnStatistics {
private String minimum = null;
private String maximum = null;
+ private long sum = 0;
StringStatisticsImpl() {
}
@@ -349,6 +351,9 @@ public String toString() {
if (str.hasMinimum()) {
minimum = str.getMinimum();
}
+      if (str.hasSum()) {
+        sum = str.getSum();
+      }
}
@Override
@@ -356,6 +361,7 @@ void reset() {
super.reset();
minimum = null;
maximum = null;
+ sum = 0;
}
@Override
@@ -368,6 +374,7 @@ void updateString(String value) {
} else if (maximum.compareTo(value) < 0) {
maximum = value;
}
+ sum += value.length();
}
@Override
@@ -384,6 +391,7 @@ void merge(ColumnStatisticsImpl other) {
maximum = str.maximum;
}
}
+ sum += str.sum;
}
@Override
@@ -394,6 +402,7 @@ void merge(ColumnStatisticsImpl other) {
if (getNumberOfValues() != 0) {
str.setMinimum(minimum);
str.setMaximum(maximum);
+ str.setSum(sum);
}
result.setStringStatistics(str);
return result;
@@ -410,6 +419,11 @@ public String getMaximum() {
}
@Override
+ public long getSum() {
+ return sum;
+ }
+
+ @Override
public String toString() {
StringBuilder buf = new StringBuilder(super.toString());
if (getNumberOfValues() != 0) {
@@ -417,6 +431,67 @@ public String toString() {
buf.append(minimum);
buf.append(" max: ");
buf.append(maximum);
+ buf.append(" sum: ");
+ buf.append(sum);
+ }
+ return buf.toString();
+ }
+ }
+
+ protected static final class BinaryStatisticsImpl extends ColumnStatisticsImpl implements
+ BinaryColumnStatistics {
+
+ private long sum = 0;
+
+ BinaryStatisticsImpl() {
+ }
+
+ BinaryStatisticsImpl(OrcProto.ColumnStatistics stats) {
+ super(stats);
+ OrcProto.BinaryStatistics binStats = stats.getBinaryStatistics();
+ if (binStats.hasSum()) {
+ sum = binStats.getSum();
+ }
+ }
+
+ @Override
+ void reset() {
+ super.reset();
+ sum = 0;
+ }
+
+ @Override
+ void updateBinary(BytesWritable value) {
+ sum += value.getLength();
+ }
+
+ @Override
+ void merge(ColumnStatisticsImpl other) {
+ super.merge(other);
+ BinaryStatisticsImpl bin = (BinaryStatisticsImpl) other;
+ sum += bin.sum;
+ }
+
+ @Override
+ public long getSum() {
+ return sum;
+ }
+
+ @Override
+ OrcProto.ColumnStatistics.Builder serialize() {
+ OrcProto.ColumnStatistics.Builder result = super.serialize();
+ OrcProto.BinaryStatistics.Builder bin = OrcProto.BinaryStatistics.newBuilder();
+ bin.setSum(sum);
+ result.setBinaryStatistics(bin);
+ return result;
+ }
+
+ @Override
+ public String toString() {
+ StringBuilder buf = new StringBuilder(super.toString());
+ if (getNumberOfValues() != 0) {
+ buf.append(" sum: ");
+ buf.append(sum);
}
return buf.toString();
}
@@ -666,6 +741,10 @@ void updateString(String value) {
throw new UnsupportedOperationException("Can't update string");
}
+ void updateBinary(BytesWritable value) {
+ throw new UnsupportedOperationException("Can't update binary");
+ }
+
void updateDecimal(HiveDecimal value) {
throw new UnsupportedOperationException("Can't update decimal");
}
@@ -720,6 +799,8 @@ static ColumnStatisticsImpl create(ObjectInspector inspector) {
return new DecimalStatisticsImpl();
case DATE:
return new DateStatisticsImpl();
+ case BINARY:
+ return new BinaryStatisticsImpl();
default:
return new ColumnStatisticsImpl();
}
@@ -741,6 +822,8 @@ static ColumnStatisticsImpl deserialize(OrcProto.ColumnStatistics stats) {
return new DecimalStatisticsImpl(stats);
} else if (stats.hasDateStatistics()) {
return new DateStatisticsImpl(stats);
+    } else if (stats.hasBinaryStatistics()) {
+      return new BinaryStatisticsImpl(stats);
} else {
return new ColumnStatisticsImpl(stats);
}
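The new BinaryStatisticsImpl follows the same lifecycle as its siblings: updateBinary() accumulates the length of each value, merge() adds per-stripe sums into file-level totals, and serialize()/deserialize() round-trip the result through the new protobuf message. A hedged sketch of that round trip (binaryInspector is an assumed ObjectInspector for a BINARY column, and the update/serialize methods are package-private, so this only compiles inside org.apache.hadoop.hive.ql.io.orc):

    // inside package org.apache.hadoop.hive.ql.io.orc
    ColumnStatisticsImpl stats = ColumnStatisticsImpl.create(binaryInspector);
    stats.updateBinary(new BytesWritable(new byte[] {1, 2, 3}));  // sum += 3
    stats.updateBinary(new BytesWritable(new byte[] {4, 5}));     // sum += 5
    OrcProto.ColumnStatistics pb = stats.serialize().build();     // binaryStatistics.sum = 8
    ColumnStatisticsImpl restored = ColumnStatisticsImpl.deserialize(pb);
    long sum = ((BinaryColumnStatistics) restored).getSum();      // 8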
diff --git ql/src/java/org/apache/hadoop/hive/ql/io/orc/OrcOutputFormat.java ql/src/java/org/apache/hadoop/hive/ql/io/orc/OrcOutputFormat.java
index c80fb02..0454b91 100644
--- ql/src/java/org/apache/hadoop/hive/ql/io/orc/OrcOutputFormat.java
+++ ql/src/java/org/apache/hadoop/hive/ql/io/orc/OrcOutputFormat.java
@@ -17,12 +17,16 @@
*/
package org.apache.hadoop.hive.ql.io.orc;
-import org.apache.hadoop.conf.Configuration;
+import java.io.IOException;
+import java.util.ArrayList;
+import java.util.Properties;
+
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.hive.ql.exec.FileSinkOperator;
import org.apache.hadoop.hive.ql.io.HiveOutputFormat;
import org.apache.hadoop.hive.ql.io.orc.OrcSerde.OrcSerdeRow;
+import org.apache.hadoop.hive.serde2.SerDeStats;
import org.apache.hadoop.hive.serde2.objectinspector.ObjectInspector;
import org.apache.hadoop.hive.serde2.objectinspector.ObjectInspectorFactory;
import org.apache.hadoop.io.NullWritable;
@@ -33,10 +37,6 @@
import org.apache.hadoop.mapred.Reporter;
import org.apache.hadoop.util.Progressable;
-import java.io.IOException;
-import java.util.ArrayList;
-import java.util.Properties;
-
/**
* A Hive OutputFormat for ORC files.
*/
@@ -45,14 +45,17 @@
private static class OrcRecordWriter
implements RecordWriter<NullWritable, OrcSerdeRow>,