diff --git a/common/src/java/org/apache/hadoop/hive/common/jsonexplain/tez/Attr.java b/common/src/java/org/apache/hadoop/hive/common/jsonexplain/tez/Attr.java deleted file mode 100644 index 5d355d2..0000000 --- a/common/src/java/org/apache/hadoop/hive/common/jsonexplain/tez/Attr.java +++ /dev/null @@ -1,39 +0,0 @@ -/** - * Licensed to the Apache Software Foundation (ASF) under one - * or more contributor license agreements. See the NOTICE file - * distributed with this work for additional information - * regarding copyright ownership. The ASF licenses this file - * to you under the Apache License, Version 2.0 (the - * "License"); you may not use this file except in compliance - * with the License. You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ - -package org.apache.hadoop.hive.common.jsonexplain.tez; - -public final class Attr implements Comparable { - public final String name; - public final String value; - - public Attr(String name, String value) { - super(); - this.name = name; - this.value = value; - } - - @Override - public int compareTo(Attr o) { - return this.name.compareToIgnoreCase(o.name); - } - - public String toString() { - return this.name + this.value; - } -} diff --git a/common/src/java/org/apache/hadoop/hive/common/jsonexplain/tez/Op.java b/common/src/java/org/apache/hadoop/hive/common/jsonexplain/tez/Op.java index d0c1037..61c714d 100644 --- a/common/src/java/org/apache/hadoop/hive/common/jsonexplain/tez/Op.java +++ b/common/src/java/org/apache/hadoop/hive/common/jsonexplain/tez/Op.java @@ -19,7 +19,6 @@ package org.apache.hadoop.hive.common.jsonexplain.tez; import java.util.ArrayList; -import java.util.Collections; import java.util.LinkedHashMap; import java.util.List; import java.util.Map; @@ -34,7 +33,7 @@ public final String operatorId; public Op parent; public final List children; - public final List attrs; + public final Map attrs; // the jsonObject for this operator public final JSONObject opObject; // the vertex that this operator belongs to @@ -43,8 +42,9 @@ // ReduceOutputOperator public final String outputVertexName; - public Op(String name, String id, String outputVertexName, List children, List attrs, - JSONObject opObject, Vertex vertex, TezJsonParser tezJsonParser) throws JSONException { + public Op(String name, String id, String outputVertexName, List children, + Map attrs, JSONObject opObject, Vertex vertex, TezJsonParser tezJsonParser) + throws JSONException { super(); this.name = name; this.operatorId = id; @@ -62,14 +62,14 @@ private void inlineJoinOp() throws Exception { JSONObject mapjoinObj = opObject.getJSONObject("Map Join Operator"); // get the map for posToVertex JSONObject verticeObj = mapjoinObj.getJSONObject("input vertices:"); - Map posToVertex = new LinkedHashMap<>(); + Map posToVertex = new LinkedHashMap<>(); for (String pos : JSONObject.getNames(verticeObj)) { String vertexName = verticeObj.getString(pos); - posToVertex.put(pos, vertexName); // update the connection Connection c = null; for (Connection connection : vertex.parentConnections) { if (connection.from.name.equals(vertexName)) { + posToVertex.put(pos, connection.from); c = connection; break; } @@ -79,22 +79,30 @@ private void inlineJoinOp() throws Exception { } } // update the attrs - removeAttr("input vertices:"); - // update the keys to use vertex name + this.attrs.remove("input vertices:"); + // update the keys to use operator name JSONObject keys = mapjoinObj.getJSONObject("keys:"); if (keys.length() != 0) { JSONObject newKeys = new JSONObject(new LinkedHashMap<>()); for (String key : JSONObject.getNames(keys)) { - String vertexName = posToVertex.get(key); - if (vertexName != null) { - newKeys.put(vertexName, keys.get(key)); + Vertex vertex = posToVertex.get(key); + if (vertex != null) { + if (vertex.rootOps.size() > 1) { + throw new Exception("There are more than one root operators in a single vertex " + + vertex.name + " when hive explain user is trying to identify the operator id."); + } + newKeys.put(vertex.rootOps.get(0).operatorId, keys.get(key)); } else { - newKeys.put(this.vertex.name, keys.get(key)); + if (parent == null) { + throw new Exception( + "Can not find the source operator on one of the branches of join."); + } + newKeys.put(this.parent.operatorId, keys.get(key)); } } // update the attrs - removeAttr("keys:"); - this.attrs.add(new Attr("keys:", newKeys.toString())); + this.attrs.remove("keys:"); + this.attrs.put("keys:", newKeys.toString()); } } // inline merge join operator in a self-join @@ -107,12 +115,17 @@ private void inlineJoinOp() throws Exception { } } - private String getNameWithOpId() { + private String getNameWithOpIdStats() { + StringBuffer sb = new StringBuffer(); + sb.append(TezJsonParserUtils.renameReduceOutputOperator(name, vertex)); if (operatorId != null) { - return this.name + " [" + operatorId + "]"; - } else { - return this.name; + sb.append(" [" + operatorId + "]"); + } + if (!TezJsonParserUtils.OperatorNoStats.contains(name) && attrs.containsKey("Statistics:")) { + sb.append(" (" + attrs.get("Statistics:") + ")"); } + attrs.remove("Statistics:"); + return sb.toString(); } /** @@ -123,19 +136,19 @@ private String getNameWithOpId() { * operator so that we can decide the corresponding indent. * @throws Exception */ - public void print(Printer printer, List indentFlag, boolean branchOfJoinOp) + public void print(Printer printer, int indentFlag, boolean branchOfJoinOp) throws Exception { // print name if (parser.printSet.contains(this)) { printer.println(TezJsonParser.prefixString(indentFlag) + " Please refer to the previous " - + this.getNameWithOpId()); + + this.getNameWithOpIdStats()); return; } parser.printSet.add(this); if (!branchOfJoinOp) { - printer.println(TezJsonParser.prefixString(indentFlag) + this.getNameWithOpId()); + printer.println(TezJsonParser.prefixString(indentFlag) + this.getNameWithOpIdStats()); } else { - printer.println(TezJsonParser.prefixString(indentFlag, "|<-") + this.getNameWithOpId()); + printer.println(TezJsonParser.prefixString(indentFlag, "<-") + this.getNameWithOpIdStats()); } branchOfJoinOp = false; // if this operator is a Map Join Operator or a Merge Join Operator @@ -156,71 +169,28 @@ public void print(Printer printer, List indentFlag, boolean branchOfJoi } } // print attr - List attFlag = new ArrayList<>(); - attFlag.addAll(indentFlag); - // should print | if (1) it is branchOfJoinOp or (2) it is the last op and - // has following non-inlined vertex - if (branchOfJoinOp || (this.parent == null && !noninlined.isEmpty())) { - attFlag.add(true); - } else { - attFlag.add(false); - } - Collections.sort(attrs); - for (Attr attr : attrs) { - printer.println(TezJsonParser.prefixString(attFlag) + attr.toString()); + indentFlag++; + if (!attrs.isEmpty()) { + printer + .println(TezJsonParser.prefixString(indentFlag) + TezJsonParserUtils.attrsToString(attrs)); } // print inline vertex if (parser.inlineMap.containsKey(this)) { for (int index = 0; index < parser.inlineMap.get(this).size(); index++) { Connection connection = parser.inlineMap.get(this).get(index); - List vertexFlag = new ArrayList<>(); - vertexFlag.addAll(indentFlag); - if (branchOfJoinOp) { - vertexFlag.add(true); - } - // if there is an inline vertex but the operator itself is not on a join - // branch, - // then it means it is from a vertex created by an operator tree, - // e.g., fetch operator, etc. - else { - vertexFlag.add(false); - } - connection.from.print(printer, vertexFlag, connection.type, this.vertex); + connection.from.print(printer, indentFlag, connection.type, this.vertex); } } // print parent op, i.e., where data comes from if (this.parent != null) { - List parentFlag = new ArrayList<>(); - parentFlag.addAll(indentFlag); - parentFlag.add(false); - this.parent.print(printer, parentFlag, branchOfJoinOp); + this.parent.print(printer, indentFlag, branchOfJoinOp); } // print next vertex else { for (int index = 0; index < noninlined.size(); index++) { Vertex v = noninlined.get(index).from; - List vertexFlag = new ArrayList<>(); - vertexFlag.addAll(indentFlag); - if (index != noninlined.size() - 1) { - vertexFlag.add(true); - } else { - vertexFlag.add(false); - } - v.print(printer, vertexFlag, noninlined.get(index).type, this.vertex); - } - } - } - - public void removeAttr(String name) { - int removeIndex = -1; - for (int index = 0; index < attrs.size(); index++) { - if (attrs.get(index).name.equals(name)) { - removeIndex = index; - break; + v.print(printer, indentFlag, noninlined.get(index).type, this.vertex); } } - if (removeIndex != -1) { - attrs.remove(removeIndex); - } } } diff --git a/common/src/java/org/apache/hadoop/hive/common/jsonexplain/tez/Stage.java b/common/src/java/org/apache/hadoop/hive/common/jsonexplain/tez/Stage.java index 455d59f..b3631d0 100644 --- a/common/src/java/org/apache/hadoop/hive/common/jsonexplain/tez/Stage.java +++ b/common/src/java/org/apache/hadoop/hive/common/jsonexplain/tez/Stage.java @@ -20,7 +20,6 @@ import java.util.ArrayList; import java.util.Arrays; -import java.util.Collections; import java.util.LinkedHashMap; import java.util.List; import java.util.Map; @@ -43,7 +42,7 @@ // downstream stages. public final List childStages = new ArrayList<>(); public final Map vertexs =new LinkedHashMap<>(); - public final List attrs = new ArrayList<>(); + public final Map attrs = new TreeMap<>(); Map> tezStageDependency; // some stage may contain only a single operator, e.g., create table operator, // fetch operator. @@ -112,6 +111,7 @@ public void extractVertex(JSONObject object) throws Exception { // for union vertex, we reverse the dependency relationship if (!"CONTAINS".equals(type)) { v.addDependency(new Connection(type, parentVertex)); + parentVertex.setType(type); parentVertex.children.add(v); } else { parentVertex.addDependency(new Connection(type, v)); @@ -133,6 +133,7 @@ public void extractVertex(JSONObject object) throws Exception { String type = obj.getString("type"); if (!"CONTAINS".equals(type)) { v.addDependency(new Connection(type, parentVertex)); + parentVertex.setType(type); parentVertex.children.add(v); } else { parentVertex.addDependency(new Connection(type, v)); @@ -162,7 +163,9 @@ public void extractVertex(JSONObject object) throws Exception { if (name.contains("Operator")) { this.op = extractOp(name, object.getJSONObject(name)); } else { - attrs.add(new Attr(name, object.get(name).toString())); + if (!object.get(name).toString().isEmpty()) { + attrs.put(name, object.get(name).toString()); + } } } } @@ -178,14 +181,14 @@ public void extractVertex(JSONObject object) throws Exception { * etc */ Op extractOp(String opName, JSONObject opObj) throws Exception { - List attrs = new ArrayList<>(); + Map attrs = new TreeMap<>(); Vertex v = null; if (opObj.length() > 0) { String[] names = JSONObject.getNames(opObj); for (String name : names) { Object o = opObj.get(name); - if (isPrintable(o)) { - attrs.add(new Attr(name, o.toString())); + if (isPrintable(o) && !o.toString().isEmpty()) { + attrs.put(name, o.toString()); } else if (o instanceof JSONObject) { JSONObject attrObj = (JSONObject) o; if (attrObj.length() > 0) { @@ -196,7 +199,9 @@ Op extractOp(String opName, JSONObject opObj) throws Exception { v.extractOpTree(); } else { for (String attrName : JSONObject.getNames(attrObj)) { - attrs.add(new Attr(attrName, attrObj.get(attrName).toString())); + if (!attrObj.get(attrName).toString().isEmpty()) { + attrs.put(attrName, attrObj.get(attrName).toString()); + } } } } @@ -224,7 +229,7 @@ private boolean isPrintable(Object val) { return false; } - public void print(Printer printer, List indentFlag) throws Exception { + public void print(Printer printer, int indentFlag) throws Exception { // print stagename if (parser.printSet.contains(this)) { printer.println(TezJsonParser.prefixString(indentFlag) + " Please refer to the previous " @@ -234,27 +239,23 @@ public void print(Printer printer, List indentFlag) throws Exception { parser.printSet.add(this); printer.println(TezJsonParser.prefixString(indentFlag) + externalName); // print vertexes - List nextIndentFlag = new ArrayList<>(); - nextIndentFlag.addAll(indentFlag); - nextIndentFlag.add(false); + indentFlag++; for (Vertex candidate : this.vertexs.values()) { if (!parser.isInline(candidate) && candidate.children.isEmpty()) { - candidate.print(printer, nextIndentFlag, null, null); + candidate.print(printer, indentFlag, null, null); } } if (!attrs.isEmpty()) { - Collections.sort(attrs); - for (Attr attr : attrs) { - printer.println(TezJsonParser.prefixString(nextIndentFlag) + attr.toString()); - } + printer.println(TezJsonParser.prefixString(indentFlag) + + TezJsonParserUtils.attrsToString(attrs)); } if (op != null) { - op.print(printer, nextIndentFlag, false); + op.print(printer, indentFlag, false); } - nextIndentFlag.add(false); + indentFlag++; // print dependent stages for (Stage stage : this.parentStages) { - stage.print(printer, nextIndentFlag); + stage.print(printer, indentFlag); } } } diff --git a/common/src/java/org/apache/hadoop/hive/common/jsonexplain/tez/TezJsonParser.java b/common/src/java/org/apache/hadoop/hive/common/jsonexplain/tez/TezJsonParser.java index b193fef..9228315 100644 --- a/common/src/java/org/apache/hadoop/hive/common/jsonexplain/tez/TezJsonParser.java +++ b/common/src/java/org/apache/hadoop/hive/common/jsonexplain/tez/TezJsonParser.java @@ -75,13 +75,10 @@ public void extractStagesAndPlans(JSONObject inputObject) throws Exception { * help to generate correct indent * @return */ - public static String prefixString(List indentFlag) { + public static String prefixString(int indentFlag) { StringBuilder sb = new StringBuilder(); - for (int index = 0; index < indentFlag.size(); index++) { - if (indentFlag.get(index)) - sb.append("| "); - else - sb.append(" "); + for (int index = 0; index < indentFlag; index++) { + sb.append(" "); } return sb.toString(); } @@ -92,13 +89,10 @@ public static String prefixString(List indentFlag) { * help to generate correct indent with a specific tail * @return */ - public static String prefixString(List indentFlag, String tail) { + public static String prefixString(int indentFlag, String tail) { StringBuilder sb = new StringBuilder(); - for (int index = 0; index < indentFlag.size(); index++) { - if (indentFlag.get(index)) - sb.append("| "); - else - sb.append(" "); + for (int index = 0; index < indentFlag; index++) { + sb.append(" "); } int len = sb.length(); return sb.replace(len - tail.length(), len, tail).toString(); @@ -136,11 +130,10 @@ public void print(JSONObject inputObject, PrintStream outputStream) throws Excep printer.println(); } } - List indentFlag = new ArrayList<>(); // print out all the stages that have no childStages. for (Stage candidate : this.stages.values()) { if (candidate.childStages.isEmpty()) { - candidate.print(printer, indentFlag); + candidate.print(printer, 0); } } outputStream.println(printer.toString()); diff --git a/common/src/java/org/apache/hadoop/hive/common/jsonexplain/tez/TezJsonParserUtils.java b/common/src/java/org/apache/hadoop/hive/common/jsonexplain/tez/TezJsonParserUtils.java new file mode 100644 index 0000000..20ec4ec --- /dev/null +++ b/common/src/java/org/apache/hadoop/hive/common/jsonexplain/tez/TezJsonParserUtils.java @@ -0,0 +1,53 @@ +/** + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.hadoop.hive.common.jsonexplain.tez; + +import java.util.Arrays; +import java.util.List; +import java.util.Map; +import java.util.Map.Entry; + + +public class TezJsonParserUtils { + + public static List OperatorNoStats = Arrays.asList(new String[] { "File Output Operator", + "Reduce Output Operator" }); + + public static String renameReduceOutputOperator(String operatorName, Vertex vertex) { + if (operatorName.equals("Reduce Output Operator") && vertex.type != null) { + return vertex.type.name(); + } else { + return operatorName; + } + } + + public static String attrsToString(Map attrs) { + StringBuffer sb = new StringBuffer(); + boolean first = true; + for (Entry entry : attrs.entrySet()) { + if (first) { + first = false; + } else { + sb.append(","); + } + sb.append(entry.getKey() + entry.getValue()); + } + return sb.toString(); + } +} diff --git a/common/src/java/org/apache/hadoop/hive/common/jsonexplain/tez/Vertex.java b/common/src/java/org/apache/hadoop/hive/common/jsonexplain/tez/Vertex.java index be01b8b..2bf4516 100644 --- a/common/src/java/org/apache/hadoop/hive/common/jsonexplain/tez/Vertex.java +++ b/common/src/java/org/apache/hadoop/hive/common/jsonexplain/tez/Vertex.java @@ -21,6 +21,8 @@ import java.io.IOException; import java.util.ArrayList; import java.util.List; +import java.util.Map; +import java.util.TreeMap; import org.codehaus.jackson.JsonParseException; import org.codehaus.jackson.map.JsonMappingException; @@ -53,6 +55,12 @@ // execution mode public String executionMode = ""; + public static enum Type { + BROADCAST, SHUFFLE, OTHER + }; + // type for broadcast or shuffle only. + public Type type; + public Vertex(String name, JSONObject vertexObject, TezJsonParser tezJsonParser) { super(); this.name = name; @@ -134,7 +142,7 @@ Op extractOp(JSONObject operator) throws JSONException, JsonParseException, Json } else { String opName = names[0]; JSONObject attrObj = (JSONObject) operator.get(opName); - List attrs = new ArrayList<>(); + Map attrs = new TreeMap<>(); List children = new ArrayList<>(); String id = null; String outputVertexName = null; @@ -162,7 +170,9 @@ Op extractOp(JSONObject operator) throws JSONException, JsonParseException, Json } else if (attrName.equals("outputname:")) { outputVertexName = attrObj.get(attrName).toString(); } else { - attrs.add(new Attr(attrName, attrObj.get(attrName).toString())); + if (!attrObj.get(attrName).toString().isEmpty()) { + attrs.put(attrName, attrObj.get(attrName).toString()); + } } } } @@ -178,22 +188,22 @@ Op extractOp(JSONObject operator) throws JSONException, JsonParseException, Json } } - public void print(Printer printer, List indentFlag, String type, Vertex callingVertex) + public void print(Printer printer, int indentFlag, String type, Vertex callingVertex) throws JSONException, Exception { // print vertexname if (parser.printSet.contains(this) && !hasMultiReduceOp) { if (type != null) { - printer.println(TezJsonParser.prefixString(indentFlag, "|<-") + printer.println(TezJsonParser.prefixString(indentFlag, "<-") + " Please refer to the previous " + this.name + " [" + type + "]"); } else { - printer.println(TezJsonParser.prefixString(indentFlag, "|<-") + printer.println(TezJsonParser.prefixString(indentFlag, "<-") + " Please refer to the previous " + this.name); } return; } parser.printSet.add(this); if (type != null) { - printer.println(TezJsonParser.prefixString(indentFlag, "|<-") + this.name + " [" + type + "]" + printer.println(TezJsonParser.prefixString(indentFlag, "<-") + this.name + " [" + type + "]" + this.executionMode); } else if (this.name != null) { printer.println(TezJsonParser.prefixString(indentFlag) + this.name + this.executionMode); @@ -224,16 +234,10 @@ public void print(Printer printer, List indentFlag, String type, Vertex } if (this.union) { // print dependent vertexs + indentFlag++; for (int index = 0; index < this.parentConnections.size(); index++) { Connection connection = this.parentConnections.get(index); - List unionFlag = new ArrayList<>(); - unionFlag.addAll(indentFlag); - if (index != this.parentConnections.size() - 1) { - unionFlag.add(true); - } else { - unionFlag.add(false); - } - connection.from.print(printer, unionFlag, connection.type, this); + connection.from.print(printer, indentFlag, connection.type, this); } } } @@ -254,6 +258,19 @@ public void checkMultiReduceOperator() { this.hasMultiReduceOp = true; } + public void setType(String type) { + switch (type) { + case "BROADCAST_EDGE": + this.type = Type.BROADCAST; + break; + case "SIMPLE_EDGE": + this.type = Type.SHUFFLE; + break; + default: + this.type = Type.OTHER; + } + } + //The following code should be gone after HIVE-11075 using topological order @Override public int compareTo(Vertex o) { diff --git a/ql/src/java/org/apache/hadoop/hive/ql/exec/ExplainTask.java b/ql/src/java/org/apache/hadoop/hive/ql/exec/ExplainTask.java index f48db6a..4116141 100644 --- a/ql/src/java/org/apache/hadoop/hive/ql/exec/ExplainTask.java +++ b/ql/src/java/org/apache/hadoop/hive/ql/exec/ExplainTask.java @@ -763,7 +763,7 @@ private JSONObject outputPlan(Object work, PrintStream out, out.println(header); } JSONObject jsonOut = outputPlan(val, out, extended, jsonOutput, ind); - if (jsonOutput) { + if (jsonOutput && jsonOut != null && jsonOut.length() != 0) { if (!skipHeader) { json.put(header, jsonOut); } else { diff --git a/ql/src/java/org/apache/hadoop/hive/ql/plan/AbstractOperatorDesc.java b/ql/src/java/org/apache/hadoop/hive/ql/plan/AbstractOperatorDesc.java index bc67e5a..adec5c7 100644 --- a/ql/src/java/org/apache/hadoop/hive/ql/plan/AbstractOperatorDesc.java +++ b/ql/src/java/org/apache/hadoop/hive/ql/plan/AbstractOperatorDesc.java @@ -33,11 +33,16 @@ protected long memNeeded = 0; @Override - @Explain(skipHeader = true, displayName = "Statistics", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(skipHeader = true, displayName = "Statistics") public Statistics getStatistics() { return statistics; } + @Explain(skipHeader = true, displayName = "Statistics", explainLevels = { Level.USER }) + public String getUserLevelStatistics() { + return statistics.toUserLevelExplainString(); + } + @Override public void setStatistics(Statistics statistics) { this.statistics = statistics; diff --git a/ql/src/java/org/apache/hadoop/hive/ql/plan/CreateTableDesc.java b/ql/src/java/org/apache/hadoop/hive/ql/plan/CreateTableDesc.java index 3f38f74..66d3b7d 100644 --- a/ql/src/java/org/apache/hadoop/hive/ql/plan/CreateTableDesc.java +++ b/ql/src/java/org/apache/hadoop/hive/ql/plan/CreateTableDesc.java @@ -143,12 +143,12 @@ public CreateTableDesc(String tableName, boolean isExternal, boolean isTemporary return copy == null ? null : new ArrayList(copy); } - @Explain(displayName = "columns", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "columns") public List getColsString() { return Utilities.getFieldSchemaString(getCols()); } - @Explain(displayName = "partition columns", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "partition columns") public List getPartColsString() { return Utilities.getFieldSchemaString(getPartCols()); } @@ -191,7 +191,7 @@ public void setPartCols(ArrayList partCols) { this.partCols = partCols; } - @Explain(displayName = "bucket columns", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "bucket columns") public List getBucketCols() { return bucketCols; } @@ -200,7 +200,7 @@ public void setBucketCols(ArrayList bucketCols) { this.bucketCols = bucketCols; } - @Explain(displayName = "# buckets", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "# buckets") public Integer getNumBucketsExplain() { if (numBuckets == -1) { return null; @@ -271,7 +271,7 @@ public void setComment(String comment) { this.comment = comment; } - @Explain(displayName = "input format", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "input format") public String getInputFormat() { return inputFormat; } @@ -280,7 +280,7 @@ public void setInputFormat(String inputFormat) { this.inputFormat = inputFormat; } - @Explain(displayName = "output format", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "output format") public String getOutputFormat() { return outputFormat; } @@ -289,7 +289,7 @@ public void setOutputFormat(String outputFormat) { this.outputFormat = outputFormat; } - @Explain(displayName = "storage handler", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "storage handler") public String getStorageHandler() { return storageHandler; } diff --git a/ql/src/java/org/apache/hadoop/hive/ql/plan/CreateTableLikeDesc.java b/ql/src/java/org/apache/hadoop/hive/ql/plan/CreateTableLikeDesc.java index f051712..37b7f0e 100644 --- a/ql/src/java/org/apache/hadoop/hive/ql/plan/CreateTableLikeDesc.java +++ b/ql/src/java/org/apache/hadoop/hive/ql/plan/CreateTableLikeDesc.java @@ -82,7 +82,7 @@ public void setTableName(String tableName) { this.tableName = tableName; } - @Explain(displayName = "default input format", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "default input format") public String getDefaultInputFormat() { return defaultInputFormat; } @@ -91,7 +91,7 @@ public void setInputFormat(String inputFormat) { this.defaultInputFormat = inputFormat; } - @Explain(displayName = "default output format", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "default output format") public String getDefaultOutputFormat() { return defaultOutputFormat; } @@ -150,7 +150,7 @@ public void setDefaultSerdeProps(Map serdeProps) { this.defaultSerdeProps = serdeProps; } - @Explain(displayName = "like", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "like") public String getLikeTableName() { return likeTableName; } diff --git a/ql/src/java/org/apache/hadoop/hive/ql/plan/FileSinkDesc.java b/ql/src/java/org/apache/hadoop/hive/ql/plan/FileSinkDesc.java index 40a8477..cc462be 100644 --- a/ql/src/java/org/apache/hadoop/hive/ql/plan/FileSinkDesc.java +++ b/ql/src/java/org/apache/hadoop/hive/ql/plan/FileSinkDesc.java @@ -181,7 +181,7 @@ public void setTableInfo(final TableDesc tableInfo) { this.tableInfo = tableInfo; } - @Explain(displayName = "compressed", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "compressed") public boolean getCompressed() { return compressed; } diff --git a/ql/src/java/org/apache/hadoop/hive/ql/plan/FilterDesc.java b/ql/src/java/org/apache/hadoop/hive/ql/plan/FilterDesc.java index d04cb78..abb2025 100644 --- a/ql/src/java/org/apache/hadoop/hive/ql/plan/FilterDesc.java +++ b/ql/src/java/org/apache/hadoop/hive/ql/plan/FilterDesc.java @@ -18,7 +18,9 @@ package org.apache.hadoop.hive.ql.plan; +import java.util.Arrays; import java.util.List; + import org.apache.hadoop.hive.ql.plan.Explain.Level; @@ -105,11 +107,14 @@ public FilterDesc( this.sampleDescr = sampleDescr; } - @Explain(displayName = "predicate", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "predicate") public String getPredicateString() { - StringBuilder sb = new StringBuilder(); - PlanUtils.addExprToStringBuffer(predicate, sb); - return sb.toString(); + return PlanUtils.getExprListString(Arrays.asList(predicate)); + } + + @Explain(displayName = "predicate", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + public String getUserLevelExplainPredicateString() { + return PlanUtils.getExprListString(Arrays.asList(predicate), true); } public org.apache.hadoop.hive.ql.plan.ExprNodeDesc getPredicate() { diff --git a/ql/src/java/org/apache/hadoop/hive/ql/plan/GroupByDesc.java b/ql/src/java/org/apache/hadoop/hive/ql/plan/GroupByDesc.java index 0f2855e..99791e5 100644 --- a/ql/src/java/org/apache/hadoop/hive/ql/plan/GroupByDesc.java +++ b/ql/src/java/org/apache/hadoop/hive/ql/plan/GroupByDesc.java @@ -158,11 +158,16 @@ public void setMode(final Mode mode) { this.mode = mode; } - @Explain(displayName = "keys", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "keys") public String getKeyString() { return PlanUtils.getExprListString(keys); } + @Explain(displayName = "keys", explainLevels = { Level.USER }) + public String getUserLevelExplainKeyString() { + return PlanUtils.getExprListString(keys, true); + } + public ArrayList getKeys() { return keys; } @@ -171,11 +176,16 @@ public void setKeys(final ArrayList keys) { this.keys = keys; } - @Explain(displayName = "outputColumnNames", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "outputColumnNames") public ArrayList getOutputColumnNames() { return outputColumnNames; } + @Explain(displayName = "Output", explainLevels = { Level.USER }) + public ArrayList getUserLevelExplainOutputColumnNames() { + return outputColumnNames; + } + @Explain(displayName = "pruneGroupingSetId", displayOnlyOnTrue = true) public boolean pruneGroupingSetId() { return groupingSetPosition >= 0 && diff --git a/ql/src/java/org/apache/hadoop/hive/ql/plan/HashTableSinkDesc.java b/ql/src/java/org/apache/hadoop/hive/ql/plan/HashTableSinkDesc.java index 7c8eee2..0b1e95d 100644 --- a/ql/src/java/org/apache/hadoop/hive/ql/plan/HashTableSinkDesc.java +++ b/ql/src/java/org/apache/hadoop/hive/ql/plan/HashTableSinkDesc.java @@ -303,7 +303,7 @@ public void setRetainList(Map> retainList) { /** * @return the keys in string form */ - @Explain(displayName = "keys", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "keys") public Map getKeysString() { Map keyMap = new LinkedHashMap(); for (Map.Entry> k: getKeys().entrySet()) { @@ -312,6 +312,15 @@ public void setRetainList(Map> retainList) { return keyMap; } + @Explain(displayName = "keys", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + public Map getUserLevelExplainKeysString() { + Map keyMap = new LinkedHashMap(); + for (Map.Entry> k: getKeys().entrySet()) { + keyMap.put(k.getKey(), PlanUtils.getExprListString(k.getValue(), true)); + } + return keyMap; + } + /** * @return the keys */ diff --git a/ql/src/java/org/apache/hadoop/hive/ql/plan/JoinDesc.java b/ql/src/java/org/apache/hadoop/hive/ql/plan/JoinDesc.java index eb83fd6..4ed2a0d 100644 --- a/ql/src/java/org/apache/hadoop/hive/ql/plan/JoinDesc.java +++ b/ql/src/java/org/apache/hadoop/hive/ql/plan/JoinDesc.java @@ -211,7 +211,7 @@ public void setReversedExprs(Map reversedExprs) { /** * @return the keys in string form */ - @Explain(displayName = "keys", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "keys") public Map getKeysString() { if (joinKeys == null) { return null; @@ -224,6 +224,19 @@ public void setReversedExprs(Map reversedExprs) { return keyMap; } + @Explain(displayName = "keys", explainLevels = { Level.USER }) + public Map getUserLevelExplainKeysString() { + if (joinKeys == null) { + return null; + } + + Map keyMap = new LinkedHashMap(); + for (byte i = 0; i < joinKeys.length; i++) { + keyMap.put(i, PlanUtils.getExprListString(Arrays.asList(joinKeys[i]), true)); + } + return keyMap; + } + public void setExprs(final Map> exprs) { this.exprs = exprs; } @@ -235,7 +248,7 @@ public void setExprs(final Map> exprs) { * * @return Map from alias to filters on the alias. */ - @Explain(displayName = "filter predicates", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "filter predicates") public Map getFiltersStringMap() { if (getFilters() == null || getFilters().size() == 0) { return null; @@ -281,10 +294,15 @@ public void setFilters(Map> filters) { this.filters = filters; } - @Explain(displayName = "outputColumnNames", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "outputColumnNames") public List getOutputColumnNames() { return outputColumnNames; } + + @Explain(displayName = "Output", explainLevels = { Level.USER }) + public List getUserLevelExplainOutputColumnNames() { + return outputColumnNames; + } public void setOutputColumnNames( List outputColumnNames) { @@ -299,7 +317,7 @@ public void setNoOuterJoin(final boolean noOuterJoin) { this.noOuterJoin = noOuterJoin; } - @Explain(displayName = "condition map", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "condition map") public List getCondsList() { if (conds == null) { return null; diff --git a/ql/src/java/org/apache/hadoop/hive/ql/plan/LateralViewJoinDesc.java b/ql/src/java/org/apache/hadoop/hive/ql/plan/LateralViewJoinDesc.java index 12f01e5..d19cb3d 100644 --- a/ql/src/java/org/apache/hadoop/hive/ql/plan/LateralViewJoinDesc.java +++ b/ql/src/java/org/apache/hadoop/hive/ql/plan/LateralViewJoinDesc.java @@ -46,11 +46,16 @@ public void setOutputInternalColNames(ArrayList outputInternalColNames) this.outputInternalColNames = outputInternalColNames; } - @Explain(displayName = "outputColumnNames", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "outputColumnNames") public ArrayList getOutputInternalColNames() { return outputInternalColNames; } + @Explain(displayName = "Output", explainLevels = { Level.USER }) + public ArrayList getUserLevelExplainOutputInternalColNames() { + return outputInternalColNames; + } + public int getNumSelColumns() { return numSelColumns; } diff --git a/ql/src/java/org/apache/hadoop/hive/ql/plan/LoadTableDesc.java b/ql/src/java/org/apache/hadoop/hive/ql/plan/LoadTableDesc.java index 427aac1..771a919 100644 --- a/ql/src/java/org/apache/hadoop/hive/ql/plan/LoadTableDesc.java +++ b/ql/src/java/org/apache/hadoop/hive/ql/plan/LoadTableDesc.java @@ -121,7 +121,7 @@ public void setTable(final org.apache.hadoop.hive.ql.plan.TableDesc table) { this.table = table; } - @Explain(displayName = "partition", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "partition") public Map getPartitionSpec() { return partitionSpec; } diff --git a/ql/src/java/org/apache/hadoop/hive/ql/plan/MapJoinDesc.java b/ql/src/java/org/apache/hadoop/hive/ql/plan/MapJoinDesc.java index 4b93e7c..ec35860 100644 --- a/ql/src/java/org/apache/hadoop/hive/ql/plan/MapJoinDesc.java +++ b/ql/src/java/org/apache/hadoop/hive/ql/plan/MapJoinDesc.java @@ -29,8 +29,6 @@ import java.util.Set; import org.apache.hadoop.hive.ql.plan.Explain.Level; -import org.apache.hadoop.hive.ql.exec.ReduceSinkOperator; - /** * Map Join operator Descriptor implementation. * @@ -217,7 +215,7 @@ public void setDumpFilePrefix(String dumpFilePrefix) { * @return the keys in string form */ @Override - @Explain(displayName = "keys", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "keys") public Map getKeysString() { Map keyMap = new LinkedHashMap(); for (Map.Entry> k: getKeys().entrySet()) { @@ -226,6 +224,16 @@ public void setDumpFilePrefix(String dumpFilePrefix) { return keyMap; } + @Override + @Explain(displayName = "keys", explainLevels = { Level.USER }) + public Map getUserLevelExplainKeysString() { + Map keyMap = new LinkedHashMap(); + for (Map.Entry> k: getKeys().entrySet()) { + keyMap.put(k.getKey(), PlanUtils.getExprListString(k.getValue(), true)); + } + return keyMap; + } + /** * @return the keys */ diff --git a/ql/src/java/org/apache/hadoop/hive/ql/plan/PlanUtils.java b/ql/src/java/org/apache/hadoop/hive/ql/plan/PlanUtils.java index 5bea6fb..04d26f3 100644 --- a/ql/src/java/org/apache/hadoop/hive/ql/plan/PlanUtils.java +++ b/ql/src/java/org/apache/hadoop/hive/ql/plan/PlanUtils.java @@ -926,7 +926,11 @@ public static ReadEntity addInput(Set inputs, ReadEntity newInput) { return null; } - public static String getExprListString(Collection exprs) { + public static String getExprListString(Collection exprs) { + return getExprListString(exprs, false); + } + + public static String getExprListString(Collection exprs, boolean userLevelExplain) { StringBuilder sb = new StringBuilder(); boolean first = true; for (ExprNodeDesc expr: exprs) { @@ -935,18 +939,20 @@ public static String getExprListString(Collection exprs } else { first = false; } - addExprToStringBuffer(expr, sb); + addExprToStringBuffer(expr, sb, userLevelExplain); } return sb.length() == 0 ? null : sb.toString(); } - public static void addExprToStringBuffer(ExprNodeDesc expr, Appendable sb) { + public static void addExprToStringBuffer(ExprNodeDesc expr, Appendable sb, boolean userLevelExplain) { try { sb.append(expr.getExprString()); - sb.append(" (type: "); - sb.append(expr.getTypeString()); - sb.append(")"); + if (!userLevelExplain) { + sb.append(" (type: "); + sb.append(expr.getTypeString()); + sb.append(")"); + } } catch (IOException e) { throw new RuntimeException(e); } diff --git a/ql/src/java/org/apache/hadoop/hive/ql/plan/ReduceSinkDesc.java b/ql/src/java/org/apache/hadoop/hive/ql/plan/ReduceSinkDesc.java index 2f69b7f..41d9ffe 100644 --- a/ql/src/java/org/apache/hadoop/hive/ql/plan/ReduceSinkDesc.java +++ b/ql/src/java/org/apache/hadoop/hive/ql/plan/ReduceSinkDesc.java @@ -213,7 +213,7 @@ public void setOutputValueColumnNames( this.outputValueColumnNames = outputValueColumnNames; } - @Explain(displayName = "key expressions", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "key expressions") public String getKeyColString() { return PlanUtils.getExprListString(keyCols); } @@ -234,7 +234,7 @@ public void setNumDistributionKeys(int numKeys) { this.numDistributionKeys = numKeys; } - @Explain(displayName = "value expressions", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "value expressions") public String getValueColsString() { return PlanUtils.getExprListString(valueCols); } @@ -247,11 +247,16 @@ public void setValueCols(final java.util.ArrayList valueCols) { this.valueCols = valueCols; } - @Explain(displayName = "Map-reduce partition columns", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "Map-reduce partition columns") public String getParitionColsString() { return PlanUtils.getExprListString(partitionCols); } + @Explain(displayName = "PartitionCols", explainLevels = { Level.USER }) + public String getUserLevelExplainParitionColsString() { + return PlanUtils.getExprListString(partitionCols, true); + } + public java.util.ArrayList getPartitionCols() { return partitionCols; } @@ -356,7 +361,7 @@ public void setValueSerializeInfo(TableDesc valueSerializeInfo) { * of the same length as key columns, that consists of only "+" * (ascending order) and "-" (descending order). */ - @Explain(displayName = "sort order", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "sort order") public String getOrder() { return keySerializeInfo.getProperties().getProperty( org.apache.hadoop.hive.serde.serdeConstants.SERIALIZATION_SORT_ORDER); diff --git a/ql/src/java/org/apache/hadoop/hive/ql/plan/SelectDesc.java b/ql/src/java/org/apache/hadoop/hive/ql/plan/SelectDesc.java index e7bbab4..67a8327 100644 --- a/ql/src/java/org/apache/hadoop/hive/ql/plan/SelectDesc.java +++ b/ql/src/java/org/apache/hadoop/hive/ql/plan/SelectDesc.java @@ -82,11 +82,16 @@ public void setColList( this.colList = colList; } - @Explain(displayName = "outputColumnNames", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "outputColumnNames") public List getOutputColumnNames() { return outputColumnNames; } + @Explain(displayName = "Output", explainLevels = { Level.USER }) + public List getUserLevelExplainOutputColumnNames() { + return outputColumnNames; + } + public void setOutputColumnNames( List outputColumnNames) { this.outputColumnNames = outputColumnNames; diff --git a/ql/src/java/org/apache/hadoop/hive/ql/plan/Statistics.java b/ql/src/java/org/apache/hadoop/hive/ql/plan/Statistics.java index 4e52bac..029043f 100644 --- a/ql/src/java/org/apache/hadoop/hive/ql/plan/Statistics.java +++ b/ql/src/java/org/apache/hadoop/hive/ql/plan/Statistics.java @@ -102,7 +102,7 @@ public void setColumnStatsState(State columnStatsState) { } @Override - @Explain(displayName = "Statistics", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "Statistics") public String toString() { StringBuilder sb = new StringBuilder(); sb.append("Num rows: "); @@ -116,6 +116,21 @@ public String toString() { return sb.toString(); } + @Explain(displayName = "Statistics", explainLevels = { Level.USER }) + public String toUserLevelExplainString() { + StringBuilder sb = new StringBuilder(); + sb.append("rows="); + sb.append(numRows); + sb.append(" width="); + // just to be safe about numRows + if (numRows != 0) { + sb.append(dataSize / numRows); + } else { + sb.append("-1"); + } + return sb.toString(); + } + public String extendedToString() { StringBuilder sb = new StringBuilder(); sb.append(" numRows: "); diff --git a/ql/src/java/org/apache/hadoop/hive/ql/plan/TableDesc.java b/ql/src/java/org/apache/hadoop/hive/ql/plan/TableDesc.java index 2fdb0a1..1da8e91 100644 --- a/ql/src/java/org/apache/hadoop/hive/ql/plan/TableDesc.java +++ b/ql/src/java/org/apache/hadoop/hive/ql/plan/TableDesc.java @@ -140,7 +140,7 @@ public void setJobProperties(Map jobProperties) { /** * @return the serdeClassName */ - @Explain(displayName = "serde", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "serde") public String getSerdeClassName() { return properties.getProperty(serdeConstants.SERIALIZATION_LIB); } @@ -151,12 +151,12 @@ public String getTableName() { .getProperty(hive_metastoreConstants.META_TABLE_NAME); } - @Explain(displayName = "input format", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "input format") public String getInputFileFormatClassName() { return getInputFileFormatClass().getName(); } - @Explain(displayName = "output format", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "output format") public String getOutputFileFormatClassName() { return getOutputFileFormatClass().getName(); } diff --git a/ql/src/java/org/apache/hadoop/hive/ql/plan/TableScanDesc.java b/ql/src/java/org/apache/hadoop/hive/ql/plan/TableScanDesc.java index 098aa89..59d20ef 100644 --- a/ql/src/java/org/apache/hadoop/hive/ql/plan/TableScanDesc.java +++ b/ql/src/java/org/apache/hadoop/hive/ql/plan/TableScanDesc.java @@ -20,6 +20,7 @@ import java.io.Serializable; import java.util.ArrayList; +import java.util.Arrays; import java.util.BitSet; import java.util.List; import java.util.Map; @@ -131,21 +132,38 @@ public Object clone() { return new TableScanDesc(getAlias(), vcs, this.tableMetadata); } - @Explain(displayName = "alias", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "alias") public String getAlias() { return alias; } + + @Explain(explainLevels = { Level.USER }) + public String getTbl() { + StringBuffer sb = new StringBuffer(); + sb.append(this.tableMetadata.getCompleteName()); + sb.append("," + alias); + if (isAcidTable()) { + sb.append(", ACID table"); + } + sb.append(",Tbl:"); + sb.append(this.statistics.getBasicStatsState()); + sb.append(",Col:"); + sb.append(this.statistics.getColumnStatsState()); + return sb.toString(); + } - @Explain(displayName = "ACID table", explainLevels = { Level.USER }, displayOnlyOnTrue = true) public boolean isAcidTable() { return SemanticAnalyzer.isAcidTable(this.tableMetadata); } + @Explain(displayName = "Output", explainLevels = { Level.USER }) + public List getOutputColumnNames() { + return this.neededColumns; + } + @Explain(displayName = "filterExpr") public String getFilterExprString() { - StringBuilder sb = new StringBuilder(); - PlanUtils.addExprToStringBuffer(filterExpr, sb); - return sb.toString(); + return PlanUtils.getExprListString(Arrays.asList(filterExpr)); } public ExprNodeGenericFuncDesc getFilterExpr() { diff --git a/ql/src/java/org/apache/hadoop/hive/ql/plan/ptf/PTFQueryInputDef.java b/ql/src/java/org/apache/hadoop/hive/ql/plan/ptf/PTFQueryInputDef.java index ae55741..f830eaa 100644 --- a/ql/src/java/org/apache/hadoop/hive/ql/plan/ptf/PTFQueryInputDef.java +++ b/ql/src/java/org/apache/hadoop/hive/ql/plan/ptf/PTFQueryInputDef.java @@ -22,12 +22,12 @@ import org.apache.hadoop.hive.ql.plan.Explain; import org.apache.hadoop.hive.ql.plan.Explain.Level; -@Explain(displayName = "Input definition", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) +@Explain(displayName = "Input definition") public class PTFQueryInputDef extends PTFInputDef { private String destination; private PTFQueryInputType type; - @Explain(displayName = "destination", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "destination") public String getDestination() { return destination; } @@ -44,7 +44,7 @@ public void setType(PTFQueryInputType type) { this.type = type; } - @Explain(displayName = "type", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "type") public String getTypeExplain() { return type.name(); } diff --git a/ql/src/java/org/apache/hadoop/hive/ql/plan/ptf/PartitionedTableFunctionDef.java b/ql/src/java/org/apache/hadoop/hive/ql/plan/ptf/PartitionedTableFunctionDef.java index 46f106c..2a8b1c0 100644 --- a/ql/src/java/org/apache/hadoop/hive/ql/plan/ptf/PartitionedTableFunctionDef.java +++ b/ql/src/java/org/apache/hadoop/hive/ql/plan/ptf/PartitionedTableFunctionDef.java @@ -145,7 +145,7 @@ public void setArgs(List args) { this.args = args; } - @Explain(displayName = "arguments", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "arguments") public String getArgsExplain() { if (args == null) { return null; @@ -189,7 +189,7 @@ public void setResolverClassName(String resolverClassName) { this.resolverClassName = resolverClassName; } - @Explain(displayName = "referenced columns", explainLevels = { Level.USER, Level.DEFAULT, Level.EXTENDED }) + @Explain(displayName = "referenced columns") public List getReferencedColumns() { return referencedColumns; } diff --git a/ql/src/test/results/clientpositive/perf/query12.q.out b/ql/src/test/results/clientpositive/perf/query12.q.out index 648d64d..2e4f2dd 100644 --- a/ql/src/test/results/clientpositive/perf/query12.q.out +++ b/ql/src/test/results/clientpositive/perf/query12.q.out @@ -12,118 +12,63 @@ Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Reducer 6 <- Reducer 5 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 6 - File Output Operator [FS_26] - compressed:false - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_25] - Number of rows:100 - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_24] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 34938 Data size: 50180683 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_23] - key expressions:_col1 (type: string), _col2 (type: string), _col4 (type: string), _col0 (type: string), _col6 (type: decimal(38,23)) - sort order:+++++ - Statistics:Num rows: 34938 Data size: 50180683 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: decimal(7,2)), _col5 (type: decimal(17,2)) - Select Operator [SEL_21] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - Statistics:Num rows: 34938 Data size: 50180683 Basic stats: COMPLETE Column stats: NONE - PTF Operator [PTF_20] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col3","partition by:":"_col3"}] - Statistics:Num rows: 34938 Data size: 50180683 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_19] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 34938 Data size: 50180683 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col3 (type: string) - Map-reduce partition columns:_col3 (type: string) - sort order:+ - Statistics:Num rows: 34938 Data size: 50180683 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col4 (type: decimal(7,2)), _col5 (type: decimal(17,2)) - Group By Operator [GBY_17] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: string), KEY._col3 (type: string), KEY._col4 (type: decimal(7,2)) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 34938 Data size: 50180683 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_16] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: decimal(7,2)) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: decimal(7,2)) - sort order:+++++ - Statistics:Num rows: 69877 Data size: 100362804 Basic stats: COMPLETE Column stats: NONE - value expressions:_col5 (type: decimal(17,2)) - Group By Operator [GBY_15] - aggregations:["sum(_col23)"] - keys:_col38 (type: string), _col41 (type: string), _col49 (type: string), _col47 (type: string), _col42 (type: decimal(7,2)) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 69877 Data size: 100362804 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_14] - outputColumnNames:["_col38","_col41","_col49","_col47","_col42","_col23"] - Statistics:Num rows: 69877 Data size: 100362804 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_32] - predicate:((_col3 = _col37) and (_col0 = _col62)) (type: boolean) - Statistics:Num rows: 69877 Data size: 100362804 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_37] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"d_date_sk (type: int)"} - | outputColumnNames:["_col0","_col3","_col23","_col37","_col38","_col41","_col42","_col47","_col49","_col62"] - | Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - | Reduce Output Operator [RS_11] - | key expressions:d_date_sk (type: int) - | Map-reduce partition columns:d_date_sk (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_35] - | predicate:(d_date_sk is not null and d_date BETWEEN '2001-01-12' AND '2001-02-11') (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_2] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_9] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: int), _col23 (type: decimal(7,2)), _col37 (type: int), _col38 (type: string), _col41 (type: string), _col42 (type: decimal(7,2)), _col47 (type: string), _col49 (type: string) - Merge Join Operator [MERGEJOIN_36] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"ws_item_sk (type: int)","1":"i_item_sk (type: int)"} - | outputColumnNames:["_col0","_col3","_col23","_col37","_col38","_col41","_col42","_col47","_col49"] - | Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_4] - | key expressions:ws_item_sk (type: int) - | Map-reduce partition columns:ws_item_sk (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:ws_sold_date_sk (type: int), ws_ext_sales_price (type: decimal(7,2)) - | Filter Operator [FIL_33] - | predicate:(ws_item_sk is not null and ws_sold_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:web_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_6] - key expressions:i_item_sk (type: int) - Map-reduce partition columns:i_item_sk (type: int) - sort order:+ - Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - value expressions:i_item_id (type: string), i_item_desc (type: string), i_current_price (type: decimal(7,2)), i_class (type: string), i_category (type: string) - Filter Operator [FIL_34] - predicate:(i_item_sk is not null and (i_category) IN ('Jewelry', 'Sports', 'Books')) (type: boolean) - Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_1] - alias:item - Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 6 + File Output Operator [FS_26] + Limit [LIM_25] (rows=100 width=1436) + Number of rows:100 + Select Operator [SEL_24] (rows=34938 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_23] + Select Operator [SEL_21] (rows=34938 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + PTF Operator [PTF_20] (rows=34938 width=1436) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col3","partition by:":"_col3"}] + Select Operator [SEL_19] (rows=34938 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col3 + Group By Operator [GBY_17] (rows=34938 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4 + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0, _col1, _col2, _col3, _col4 + Group By Operator [GBY_15] (rows=69877 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["sum(_col23)"],keys:_col38, _col41, _col49, _col47, _col42 + Select Operator [SEL_14] (rows=69877 width=1436) + Output:["_col38","_col41","_col49","_col47","_col42","_col23"] + Filter Operator [FIL_32] (rows=69877 width=1436) + predicate:((_col3 = _col37) and (_col0 = _col62)) + Merge Join Operator [MERGEJOIN_37] (rows=279510 width=1436) + Output:["_col0","_col3","_col23","_col37","_col38","_col41","_col42","_col47","_col49","_col62"],keys:{"0":"_col0","1":"d_date_sk"} + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_11] + PartitionCols:d_date_sk + Filter Operator [FIL_35] (rows=36524 width=1119) + predicate:(d_date_sk is not null and d_date BETWEEN '2001-01-12' AND '2001-02-11') + TableScan [TS_2] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_36] (rows=254100 width=1436) + Output:["_col0","_col3","_col23","_col37","_col38","_col41","_col42","_col47","_col49"],keys:{"0":"ws_item_sk","1":"i_item_sk"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:ws_item_sk + Filter Operator [FIL_33] (rows=1 width=0) + predicate:(ws_item_sk is not null and ws_sold_date_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@web_sales,web_sales,Tbl:PARTIAL,Col:NONE,Output:["ws_sold_date_sk","ws_item_sk","ws_ext_sales_price"] + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_6] + PartitionCols:i_item_sk + Filter Operator [FIL_34] (rows=231000 width=1436) + predicate:(i_item_sk is not null and (i_category) IN ('Jewelry', 'Sports', 'Books')) + TableScan [TS_1] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id","i_item_desc","i_current_price","i_class","i_category"] diff --git a/ql/src/test/results/clientpositive/perf/query13.q.out b/ql/src/test/results/clientpositive/perf/query13.q.out index 6113d18..ec780af 100644 --- a/ql/src/test/results/clientpositive/perf/query13.q.out +++ b/ql/src/test/results/clientpositive/perf/query13.q.out @@ -117,184 +117,99 @@ Reducer 6 <- Map 12 (SIMPLE_EDGE), Reducer 5 (SIMPLE_EDGE) Reducer 7 <- Reducer 6 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 7 - File Output Operator [FS_42] - compressed:false - Statistics:Num rows: 1 Data size: 344 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_40] - | aggregations:["avg(VALUE._col0)","avg(VALUE._col1)","avg(VALUE._col2)","sum(VALUE._col3)"] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 344 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_39] - sort order: - Statistics:Num rows: 1 Data size: 112 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: struct), _col1 (type: struct), _col2 (type: struct), _col3 (type: decimal(17,2)) - Group By Operator [GBY_38] - aggregations:["avg(_col5)","avg(_col7)","avg(_col8)","sum(_col8)"] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 1 Data size: 112 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_73] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col5","_col7","_col8"] - | Statistics:Num rows: 18150000 Data size: 18420070657 Basic stats: COMPLETE Column stats: NONE - |<-Map 12 [SIMPLE_EDGE] - | Reduce Output Operator [RS_35] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_33] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_68] - | predicate:(d_date_sk is not null and (d_year = 2001)) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_31] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_34] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 16500000 Data size: 16745518417 Basic stats: COMPLETE Column stats: NONE - value expressions:_col5 (type: int), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)) - Select Operator [SEL_30] - outputColumnNames:["_col0","_col5","_col7","_col8"] - Statistics:Num rows: 16500000 Data size: 16745518417 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_29] - predicate:(((_col17) IN ('KY', 'GA', 'NM') and _col9 BETWEEN 100 AND 200) or ((_col17) IN ('MT', 'OR', 'IN') and _col9 BETWEEN 150 AND 300) or ((_col17) IN ('WI', 'MO', 'WV') and _col9 BETWEEN 50 AND 250)) (type: boolean) - Statistics:Num rows: 16500000 Data size: 16745518417 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_72] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col5","_col7","_col8","_col9","_col17"] - | Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_27] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_25] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_67] - | predicate:((((ca_state) IN ('KY', 'GA', 'NM') or (ca_state) IN ('MT', 'OR', 'IN') or (ca_state) IN ('WI', 'MO', 'WV')) and (ca_country = 'United States')) and ca_address_sk is not null) (type: boolean) - | Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_23] - | alias:customer_address - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_26] - key expressions:_col3 (type: int) - Map-reduce partition columns:_col3 (type: int) - sort order:+ - Statistics:Num rows: 4491 Data size: 1626526 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col5 (type: int), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)), _col9 (type: decimal(7,2)) - Select Operator [SEL_22] - outputColumnNames:["_col0","_col3","_col5","_col7","_col8","_col9"] - Statistics:Num rows: 4491 Data size: 1626526 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_21] - predicate:(((_col12 = 'M') and (_col13 = '4 yr Degree') and _col6 BETWEEN 100.0 AND 150.0 and (_col15 = 3)) or ((_col12 = 'D') and (_col13 = 'Primary') and _col6 BETWEEN 50.0 AND 100.0 and (_col15 = 1)) or ((_col12 = 'U') and (_col13 = 'Advanced Degree') and _col6 BETWEEN 150.0 AND 200.0 and (_col15 = 1))) (type: boolean) - Statistics:Num rows: 4491 Data size: 1626526 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_71] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col3","_col5","_col6","_col7","_col8","_col9","_col12","_col13","_col15"] - | Statistics:Num rows: 23958 Data size: 8676981 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int) - | Select Operator [SEL_11] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_66] - | predicate:(((hd_dep_count = 3) or (hd_dep_count = 1)) and hd_demo_sk is not null) (type: boolean) - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:household_demographics - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 21780 Data size: 7888165 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col3 (type: int), _col5 (type: int), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)), _col9 (type: decimal(7,2)), _col12 (type: string), _col13 (type: string) - Merge Join Operator [MERGEJOIN_70] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2","_col3","_col5","_col6","_col7","_col8","_col9","_col12","_col13"] - | Statistics:Num rows: 21780 Data size: 7888165 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_16] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_65] - | predicate:((((cd_marital_status = 'M') or (cd_marital_status = 'D') or (cd_marital_status = 'U')) and ((cd_education_status = '4 yr Degree') or (cd_education_status = 'Primary') or (cd_education_status = 'Advanced Degree'))) and cd_demo_sk is not null) (type: boolean) - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:customer_demographics - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_15] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 1874 Data size: 3581903 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col2 (type: int), _col3 (type: int), _col5 (type: int), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)), _col9 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_69] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col4 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col1","_col2","_col3","_col5","_col6","_col7","_col8","_col9"] - | Statistics:Num rows: 1874 Data size: 3581903 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_12] - | key expressions:_col4 (type: int) - | Map-reduce partition columns:_col4 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col5 (type: int), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)), _col9 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_63] - | predicate:(((((((ss_net_profit BETWEEN 100 AND 200 or ss_net_profit BETWEEN 150 AND 300 or ss_net_profit BETWEEN 50 AND 250) and ss_store_sk is not null) and (ss_sales_price BETWEEN 100.0 AND 150.0 or ss_sales_price BETWEEN 50.0 AND 100.0 or ss_sales_price BETWEEN 150.0 AND 200.0)) and ss_cdemo_sk is not null) and ss_hdemo_sk is not null) and ss_addr_sk is not null) and ss_sold_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_13] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_64] - predicate:s_store_sk is not null (type: boolean) - Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:store - Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 7 + File Output Operator [FS_42] + Group By Operator [GBY_40] (rows=1 width=344) + Output:["_col0","_col1","_col2","_col3"],aggregations:["avg(VALUE._col0)","avg(VALUE._col1)","avg(VALUE._col2)","sum(VALUE._col3)"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_39] + Group By Operator [GBY_38] (rows=1 width=112) + Output:["_col0","_col1","_col2","_col3"],aggregations:["avg(_col5)","avg(_col7)","avg(_col8)","sum(_col8)"] + Merge Join Operator [MERGEJOIN_73] (rows=18150000 width=1014) + Output:["_col5","_col7","_col8"],keys:{"0":"_col0","1":"_col0"} + <-Map 12 [SIMPLE_EDGE] + SHUFFLE [RS_35] + PartitionCols:_col0 + Select Operator [SEL_33] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_68] (rows=36524 width=1119) + predicate:(d_date_sk is not null and (d_year = 2001)) + TableScan [TS_31] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_34] + PartitionCols:_col0 + Select Operator [SEL_30] (rows=16500000 width=1014) + Output:["_col0","_col5","_col7","_col8"] + Filter Operator [FIL_29] (rows=16500000 width=1014) + predicate:(((_col17) IN ('KY', 'GA', 'NM') and _col9 BETWEEN 100 AND 200) or ((_col17) IN ('MT', 'OR', 'IN') and _col9 BETWEEN 150 AND 300) or ((_col17) IN ('WI', 'MO', 'WV') and _col9 BETWEEN 50 AND 250)) + Merge Join Operator [MERGEJOIN_72] (rows=22000000 width=1014) + Output:["_col0","_col5","_col7","_col8","_col9","_col17"],keys:{"0":"_col3","1":"_col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_27] + PartitionCols:_col0 + Select Operator [SEL_25] (rows=20000000 width=1014) + Output:["_col0","_col1"] + Filter Operator [FIL_67] (rows=20000000 width=1014) + predicate:((((ca_state) IN ('KY', 'GA', 'NM') or (ca_state) IN ('MT', 'OR', 'IN') or (ca_state) IN ('WI', 'MO', 'WV')) and (ca_country = 'United States')) and ca_address_sk is not null) + TableScan [TS_23] (rows=40000000 width=1014) + default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_state","ca_country"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_26] + PartitionCols:_col3 + Select Operator [SEL_22] (rows=4491 width=362) + Output:["_col0","_col3","_col5","_col7","_col8","_col9"] + Filter Operator [FIL_21] (rows=4491 width=362) + predicate:(((_col12 = 'M') and (_col13 = '4 yr Degree') and _col6 BETWEEN 100.0 AND 150.0 and (_col15 = 3)) or ((_col12 = 'D') and (_col13 = 'Primary') and _col6 BETWEEN 50.0 AND 100.0 and (_col15 = 1)) or ((_col12 = 'U') and (_col13 = 'Advanced Degree') and _col6 BETWEEN 150.0 AND 200.0 and (_col15 = 1))) + Merge Join Operator [MERGEJOIN_71] (rows=23958 width=362) + Output:["_col0","_col3","_col5","_col6","_col7","_col8","_col9","_col12","_col13","_col15"],keys:{"0":"_col2","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=7200 width=107) + Output:["_col0","_col1"] + Filter Operator [FIL_66] (rows=7200 width=107) + predicate:(((hd_dep_count = 3) or (hd_dep_count = 1)) and hd_demo_sk is not null) + TableScan [TS_9] (rows=7200 width=107) + default@household_demographics,household_demographics,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_dep_count"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_70] (rows=21780 width=362) + Output:["_col0","_col2","_col3","_col5","_col6","_col7","_col8","_col9","_col12","_col13"],keys:{"0":"_col1","1":"_col0"} + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=19800 width=362) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_65] (rows=19800 width=362) + predicate:((((cd_marital_status = 'M') or (cd_marital_status = 'D') or (cd_marital_status = 'U')) and ((cd_education_status = '4 yr Degree') or (cd_education_status = 'Primary') or (cd_education_status = 'Advanced Degree'))) and cd_demo_sk is not null) + TableScan [TS_6] (rows=19800 width=362) + default@customer_demographics,customer_demographics,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_marital_status","cd_education_status"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_69] (rows=1874 width=1911) + Output:["_col0","_col1","_col2","_col3","_col5","_col6","_col7","_col8","_col9"],keys:{"0":"_col4","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col4 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] + Filter Operator [FIL_63] (rows=1 width=0) + predicate:(((((((ss_net_profit BETWEEN 100 AND 200 or ss_net_profit BETWEEN 150 AND 300 or ss_net_profit BETWEEN 50 AND 250) and ss_store_sk is not null) and (ss_sales_price BETWEEN 100.0 AND 150.0 or ss_sales_price BETWEEN 50.0 AND 100.0 or ss_sales_price BETWEEN 150.0 AND 200.0)) and ss_cdemo_sk is not null) and ss_hdemo_sk is not null) and ss_addr_sk is not null) and ss_sold_date_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_cdemo_sk","ss_hdemo_sk","ss_addr_sk","ss_store_sk","ss_quantity","ss_sales_price","ss_ext_sales_price","ss_ext_wholesale_cost","ss_net_profit"] + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=1704 width=1910) + Output:["_col0"] + Filter Operator [FIL_64] (rows=1704 width=1910) + predicate:s_store_sk is not null + TableScan [TS_3] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk"] diff --git a/ql/src/test/results/clientpositive/perf/query15.q.out b/ql/src/test/results/clientpositive/perf/query15.q.out index c237828..d20d28c 100644 --- a/ql/src/test/results/clientpositive/perf/query15.q.out +++ b/ql/src/test/results/clientpositive/perf/query15.q.out @@ -12,142 +12,76 @@ Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Reducer 6 <- Reducer 5 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 6 - File Output Operator [FS_31] - compressed:false - Statistics:Num rows: 100 Data size: 86000 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_30] - Number of rows:100 - Statistics:Num rows: 100 Data size: 86000 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_29] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 53240002 Data size: 45787477895 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_28] - key expressions:_col0 (type: string) - sort order:+ - Statistics:Num rows: 53240002 Data size: 45787477895 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: decimal(17,2)) - Group By Operator [GBY_26] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 53240002 Data size: 45787477895 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_25] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 106480005 Data size: 91574956652 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: decimal(17,2)) - Group By Operator [GBY_24] - aggregations:["sum(_col2)"] - keys:_col7 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 106480005 Data size: 91574956652 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_23] - outputColumnNames:["_col7","_col2"] - Statistics:Num rows: 106480005 Data size: 91574956652 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_47] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col2","_col7"] - | Statistics:Num rows: 106480005 Data size: 91574956652 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_21] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_19] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_44] - | predicate:(((d_qoy = 2) and (d_year = 2000)) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_17] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_20] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: decimal(7,2)), _col7 (type: string) - Select Operator [SEL_16] - outputColumnNames:["_col0","_col2","_col7"] - Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_15] - predicate:((substr(_col7, 1, 5)) IN ('85669', '86197', '88274', '83405', '86475', '85392', '85460', '80348', '81792') or (_col6) IN ('CA', 'WA', 'GA') or (_col2 > 500)) (type: boolean) - Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_46] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col4 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2","_col6","_col7"] - | Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - | Reduce Output Operator [RS_13] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_43] - | predicate:ca_address_sk is not null (type: boolean) - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:customer_address - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_12] - key expressions:_col4 (type: int) - Map-reduce partition columns:_col4 (type: int) - sort order:+ - Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col2 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_45] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2","_col4"] - | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_9] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col2 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_41] - | predicate:(cs_bill_customer_sk is not null and cs_sold_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:catalog_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_42] - predicate:(c_customer_sk is not null and c_current_addr_sk is not null) (type: boolean) - Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:customer - Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 6 + File Output Operator [FS_31] + Limit [LIM_30] (rows=100 width=860) + Number of rows:100 + Select Operator [SEL_29] (rows=53240002 width=860) + Output:["_col0","_col1"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_28] + Group By Operator [GBY_26] (rows=53240002 width=860) + Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0 + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col0 + Group By Operator [GBY_24] (rows=106480005 width=860) + Output:["_col0","_col1"],aggregations:["sum(_col2)"],keys:_col7 + Select Operator [SEL_23] (rows=106480005 width=860) + Output:["_col7","_col2"] + Merge Join Operator [MERGEJOIN_47] (rows=106480005 width=860) + Output:["_col2","_col7"],keys:{"0":"_col0","1":"_col0"} + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_21] + PartitionCols:_col0 + Select Operator [SEL_19] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_44] (rows=18262 width=1119) + predicate:(((d_qoy = 2) and (d_year = 2000)) and d_date_sk is not null) + TableScan [TS_17] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_qoy"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_20] + PartitionCols:_col0 + Select Operator [SEL_16] (rows=96800003 width=860) + Output:["_col0","_col2","_col7"] + Filter Operator [FIL_15] (rows=96800003 width=860) + predicate:((substr(_col7, 1, 5)) IN ('85669', '86197', '88274', '83405', '86475', '85392', '85460', '80348', '81792') or (_col6) IN ('CA', 'WA', 'GA') or (_col2 > 500)) + Merge Join Operator [MERGEJOIN_46] (rows=96800003 width=860) + Output:["_col0","_col2","_col6","_col7"],keys:{"0":"_col4","1":"_col0"} + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=40000000 width=1014) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_43] (rows=40000000 width=1014) + predicate:ca_address_sk is not null + TableScan [TS_6] (rows=40000000 width=1014) + default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_state","ca_zip"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col4 + Merge Join Operator [MERGEJOIN_45] (rows=88000001 width=860) + Output:["_col0","_col2","_col4"],keys:{"0":"_col1","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col1 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_41] (rows=1 width=0) + predicate:(cs_bill_customer_sk is not null and cs_sold_date_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@catalog_sales,catalog_sales,Tbl:PARTIAL,Col:NONE,Output:["cs_sold_date_sk","cs_bill_customer_sk","cs_sales_price"] + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_10] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=80000000 width=860) + Output:["_col0","_col1"] + Filter Operator [FIL_42] (rows=80000000 width=860) + predicate:(c_customer_sk is not null and c_current_addr_sk is not null) + TableScan [TS_3] (rows=80000000 width=860) + default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_current_addr_sk"] diff --git a/ql/src/test/results/clientpositive/perf/query17.q.out b/ql/src/test/results/clientpositive/perf/query17.q.out index 0e42d05..211aecf 100644 --- a/ql/src/test/results/clientpositive/perf/query17.q.out +++ b/ql/src/test/results/clientpositive/perf/query17.q.out @@ -16,249 +16,130 @@ Reducer 8 <- Map 17 (SIMPLE_EDGE), Reducer 7 (SIMPLE_EDGE) Reducer 9 <- Reducer 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 10 - File Output Operator [FS_54] - compressed:false - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_53] - Number of rows:100 - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_52] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14"] - | Statistics:Num rows: 254100 Data size: 364958259 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 9 [SIMPLE_EDGE] - Reduce Output Operator [RS_51] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string) - sort order:+++ - Statistics:Num rows: 254100 Data size: 364958259 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: bigint), _col4 (type: double), _col5 (type: double), _col6 (type: double), _col7 (type: bigint), _col8 (type: double), _col9 (type: double), _col10 (type: double), _col11 (type: bigint), _col12 (type: double), _col13 (type: double) - Select Operator [SEL_49] - outputColumnNames:["_col0","_col1","_col10","_col11","_col12","_col13","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] - Statistics:Num rows: 254100 Data size: 364958259 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_48] - | aggregations:["count(VALUE._col0)","avg(VALUE._col1)","stddev_samp(VALUE._col2)","count(VALUE._col3)","avg(VALUE._col4)","stddev_samp(VALUE._col5)","count(VALUE._col6)","avg(VALUE._col7)","stddev_samp(VALUE._col8)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11"] - | Statistics:Num rows: 254100 Data size: 364958259 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_47] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: string) - sort order:+++ - Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: bigint), _col4 (type: struct), _col5 (type: struct), _col6 (type: bigint), _col7 (type: struct), _col8 (type: struct), _col9 (type: bigint), _col10 (type: struct), _col11 (type: struct) - Group By Operator [GBY_46] - aggregations:["count(_col5)","avg(_col5)","stddev_samp(_col5)","count(_col10)","avg(_col10)","stddev_samp(_col10)","count(_col14)","avg(_col14)","stddev_samp(_col14)"] - keys:_col22 (type: string), _col24 (type: string), _col25 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11"] - Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_45] - outputColumnNames:["_col22","_col24","_col25","_col5","_col10","_col14"] - Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_104] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col5","_col10","_col14","_col22","_col24","_col25"] - | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - |<-Map 17 [SIMPLE_EDGE] - | Reduce Output Operator [RS_43] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string) - | Select Operator [SEL_23] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_97] - | predicate:i_item_sk is not null (type: boolean) - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_21] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_42] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 53473 Data size: 59838291 Basic stats: COMPLETE Column stats: NONE - value expressions:_col5 (type: int), _col10 (type: int), _col14 (type: int), _col22 (type: string) - Merge Join Operator [MERGEJOIN_103] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col5","_col10","_col14","_col22"] - | Statistics:Num rows: 53473 Data size: 59838291 Basic stats: COMPLETE Column stats: NONE - |<-Map 16 [SIMPLE_EDGE] - | Reduce Output Operator [RS_40] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_20] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_96] - | predicate:s_store_sk is not null (type: boolean) - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_18] - | alias:store - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_39] - key expressions:_col3 (type: int) - Map-reduce partition columns:_col3 (type: int) - sort order:+ - Statistics:Num rows: 48612 Data size: 54398446 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col5 (type: int), _col10 (type: int), _col14 (type: int) - Merge Join Operator [MERGEJOIN_102] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col11 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col3","_col5","_col10","_col14"] - | Statistics:Num rows: 48612 Data size: 54398446 Basic stats: COMPLETE Column stats: NONE - |<-Map 15 [SIMPLE_EDGE] - | Reduce Output Operator [RS_37] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_17] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_95] - | predicate:((d_quarter_name) IN ('2000Q1', '2000Q2', '2000Q3') and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_15] - | alias:d1 - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_36] - key expressions:_col11 (type: int) - Map-reduce partition columns:_col11 (type: int) - sort order:+ - Statistics:Num rows: 44193 Data size: 49453132 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col3 (type: int), _col5 (type: int), _col10 (type: int), _col14 (type: int) - Merge Join Operator [MERGEJOIN_101] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col6 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col3","_col5","_col10","_col11","_col14"] - | Statistics:Num rows: 44193 Data size: 49453132 Basic stats: COMPLETE Column stats: NONE - |<-Map 14 [SIMPLE_EDGE] - | Reduce Output Operator [RS_34] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_14] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_94] - | predicate:((d_quarter_name) IN ('2000Q1', '2000Q2', '2000Q3') and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_12] - | alias:d1 - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_33] - key expressions:_col6 (type: int) - Map-reduce partition columns:_col6 (type: int) - sort order:+ - Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col3 (type: int), _col5 (type: int), _col10 (type: int), _col11 (type: int), _col14 (type: int) - Merge Join Operator [MERGEJOIN_100] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col3","_col5","_col6","_col10","_col11","_col14"] - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - |<-Map 13 [SIMPLE_EDGE] - | Reduce Output Operator [RS_31] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_11] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_93] - | predicate:((d_quarter_name = '2000Q1') and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:d1 - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_30] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col1 (type: int), _col3 (type: int), _col5 (type: int), _col6 (type: int), _col10 (type: int), _col11 (type: int), _col14 (type: int) - Merge Join Operator [MERGEJOIN_99] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col8 (type: int), _col7 (type: int)","1":"_col1 (type: int), _col2 (type: int)"} - | outputColumnNames:["_col0","_col1","_col3","_col5","_col6","_col10","_col11","_col14"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 12 [SIMPLE_EDGE] - | Reduce Output Operator [RS_28] - | key expressions:_col1 (type: int), _col2 (type: int) - | Map-reduce partition columns:_col1 (type: int), _col2 (type: int) - | sort order:++ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col3 (type: int) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_92] - | predicate:((cs_item_sk is not null and cs_bill_customer_sk is not null) and cs_sold_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_6] - | alias:catalog_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_27] - key expressions:_col8 (type: int), _col7 (type: int) - Map-reduce partition columns:_col8 (type: int), _col7 (type: int) - sort order:++ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col0 (type: int), _col1 (type: int), _col3 (type: int), _col5 (type: int), _col6 (type: int), _col10 (type: int) - Merge Join Operator [MERGEJOIN_98] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int), _col1 (type: int), _col4 (type: int)","1":"_col2 (type: int), _col1 (type: int), _col3 (type: int)"} - | outputColumnNames:["_col0","_col1","_col3","_col5","_col6","_col7","_col8","_col10"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_24] - | key expressions:_col2 (type: int), _col1 (type: int), _col4 (type: int) - | Map-reduce partition columns:_col2 (type: int), _col1 (type: int), _col4 (type: int) - | sort order:+++ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col3 (type: int), _col5 (type: int) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_90] - | predicate:((((ss_ticket_number is not null and ss_customer_sk is not null) and ss_item_sk is not null) and ss_sold_date_sk is not null) and ss_store_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - Reduce Output Operator [RS_25] - key expressions:_col2 (type: int), _col1 (type: int), _col3 (type: int) - Map-reduce partition columns:_col2 (type: int), _col1 (type: int), _col3 (type: int) - sort order:+++ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col0 (type: int), _col4 (type: int) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_91] - predicate:(((sr_ticket_number is not null and sr_customer_sk is not null) and sr_item_sk is not null) and sr_returned_date_sk is not null) (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_3] - alias:store_returns - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 10 + File Output Operator [FS_54] + Limit [LIM_53] (rows=100 width=1436) + Number of rows:100 + Select Operator [SEL_52] (rows=254100 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14"] + <-Reducer 9 [SIMPLE_EDGE] + SHUFFLE [RS_51] + Select Operator [SEL_49] (rows=254100 width=1436) + Output:["_col0","_col1","_col10","_col11","_col12","_col13","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] + Group By Operator [GBY_48] (rows=254100 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11"],aggregations:["count(VALUE._col0)","avg(VALUE._col1)","stddev_samp(VALUE._col2)","count(VALUE._col3)","avg(VALUE._col4)","stddev_samp(VALUE._col5)","count(VALUE._col6)","avg(VALUE._col7)","stddev_samp(VALUE._col8)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Reducer 8 [SIMPLE_EDGE] + SHUFFLE [RS_47] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_46] (rows=508200 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11"],aggregations:["count(_col5)","avg(_col5)","stddev_samp(_col5)","count(_col10)","avg(_col10)","stddev_samp(_col10)","count(_col14)","avg(_col14)","stddev_samp(_col14)"],keys:_col22, _col24, _col25 + Select Operator [SEL_45] (rows=508200 width=1436) + Output:["_col22","_col24","_col25","_col5","_col10","_col14"] + Merge Join Operator [MERGEJOIN_104] (rows=508200 width=1436) + Output:["_col5","_col10","_col14","_col22","_col24","_col25"],keys:{"0":"_col1","1":"_col0"} + <-Map 17 [SIMPLE_EDGE] + SHUFFLE [RS_43] + PartitionCols:_col0 + Select Operator [SEL_23] (rows=462000 width=1436) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_97] (rows=462000 width=1436) + predicate:i_item_sk is not null + TableScan [TS_21] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id","i_item_desc"] + <-Reducer 7 [SIMPLE_EDGE] + SHUFFLE [RS_42] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_103] (rows=53473 width=1119) + Output:["_col1","_col5","_col10","_col14","_col22"],keys:{"0":"_col3","1":"_col0"} + <-Map 16 [SIMPLE_EDGE] + SHUFFLE [RS_40] + PartitionCols:_col0 + Select Operator [SEL_20] (rows=1704 width=1910) + Output:["_col0","_col1"] + Filter Operator [FIL_96] (rows=1704 width=1910) + predicate:s_store_sk is not null + TableScan [TS_18] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_state"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_39] + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_102] (rows=48612 width=1119) + Output:["_col1","_col3","_col5","_col10","_col14"],keys:{"0":"_col11","1":"_col0"} + <-Map 15 [SIMPLE_EDGE] + SHUFFLE [RS_37] + PartitionCols:_col0 + Select Operator [SEL_17] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_95] (rows=36524 width=1119) + predicate:((d_quarter_name) IN ('2000Q1', '2000Q2', '2000Q3') and d_date_sk is not null) + TableScan [TS_15] (rows=73049 width=1119) + default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_quarter_name"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_36] + PartitionCols:_col11 + Merge Join Operator [MERGEJOIN_101] (rows=44193 width=1119) + Output:["_col1","_col3","_col5","_col10","_col11","_col14"],keys:{"0":"_col6","1":"_col0"} + <-Map 14 [SIMPLE_EDGE] + SHUFFLE [RS_34] + PartitionCols:_col0 + Select Operator [SEL_14] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_94] (rows=36524 width=1119) + predicate:((d_quarter_name) IN ('2000Q1', '2000Q2', '2000Q3') and d_date_sk is not null) + TableScan [TS_12] (rows=73049 width=1119) + default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_quarter_name"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_33] + PartitionCols:_col6 + Merge Join Operator [MERGEJOIN_100] (rows=40176 width=1119) + Output:["_col1","_col3","_col5","_col6","_col10","_col11","_col14"],keys:{"0":"_col0","1":"_col0"} + <-Map 13 [SIMPLE_EDGE] + SHUFFLE [RS_31] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_93] (rows=36524 width=1119) + predicate:((d_quarter_name = '2000Q1') and d_date_sk is not null) + TableScan [TS_9] (rows=73049 width=1119) + default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_quarter_name"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_30] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_99] (rows=1 width=0) + Output:["_col0","_col1","_col3","_col5","_col6","_col10","_col11","_col14"],keys:{"0":"_col8, _col7","1":"_col1, _col2"} + <-Map 12 [SIMPLE_EDGE] + SHUFFLE [RS_28] + PartitionCols:_col1, _col2 + Select Operator [SEL_8] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_92] (rows=1 width=0) + predicate:((cs_item_sk is not null and cs_bill_customer_sk is not null) and cs_sold_date_sk is not null) + TableScan [TS_6] (rows=1 width=0) + default@catalog_sales,catalog_sales,Tbl:PARTIAL,Col:NONE,Output:["cs_sold_date_sk","cs_bill_customer_sk","cs_item_sk","cs_quantity"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_27] + PartitionCols:_col8, _col7 + Merge Join Operator [MERGEJOIN_98] (rows=1 width=0) + Output:["_col0","_col1","_col3","_col5","_col6","_col7","_col8","_col10"],keys:{"0":"_col2, _col1, _col4","1":"_col2, _col1, _col3"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_24] + PartitionCols:_col2, _col1, _col4 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Filter Operator [FIL_90] (rows=1 width=0) + predicate:((((ss_ticket_number is not null and ss_customer_sk is not null) and ss_item_sk is not null) and ss_sold_date_sk is not null) and ss_store_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_customer_sk","ss_store_sk","ss_ticket_number","ss_quantity"] + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col2, _col1, _col3 + Select Operator [SEL_5] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_91] (rows=1 width=0) + predicate:(((sr_ticket_number is not null and sr_customer_sk is not null) and sr_item_sk is not null) and sr_returned_date_sk is not null) + TableScan [TS_3] (rows=1 width=0) + default@store_returns,store_returns,Tbl:PARTIAL,Col:NONE,Output:["sr_returned_date_sk","sr_item_sk","sr_customer_sk","sr_ticket_number","sr_return_quantity"] diff --git a/ql/src/test/results/clientpositive/perf/query18.q.out b/ql/src/test/results/clientpositive/perf/query18.q.out index 83f21dc..1cd14d9 100644 --- a/ql/src/test/results/clientpositive/perf/query18.q.out +++ b/ql/src/test/results/clientpositive/perf/query18.q.out @@ -15,222 +15,116 @@ Reducer 8 <- Reducer 7 (SIMPLE_EDGE) Reducer 9 <- Reducer 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 9 - File Output Operator [FS_48] - compressed:false - Statistics:Num rows: 100 Data size: 86000 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_47] - Number of rows:100 - Statistics:Num rows: 100 Data size: 86000 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_46] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10"] - | Statistics:Num rows: 133100005 Data size: 114468695810 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_45] - key expressions:_col1 (type: string), _col2 (type: string), _col3 (type: string), _col0 (type: string) - sort order:++++ - Statistics:Num rows: 133100005 Data size: 114468695810 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: decimal(16,6)), _col5 (type: decimal(16,6)), _col6 (type: decimal(16,6)), _col7 (type: decimal(16,6)), _col8 (type: decimal(16,6)), _col9 (type: decimal(16,6)), _col10 (type: decimal(16,6)) - Select Operator [SEL_44] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10"] - Statistics:Num rows: 133100005 Data size: 114468695810 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_43] - | aggregations:["avg(VALUE._col0)","avg(VALUE._col1)","avg(VALUE._col2)","avg(VALUE._col3)","avg(VALUE._col4)","avg(VALUE._col5)","avg(VALUE._col6)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: string), KEY._col3 (type: string), KEY._col4 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col5","_col6","_col7","_col8","_col9","_col10","_col11"] - | Statistics:Num rows: 133100005 Data size: 114468695810 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_42] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string) - sort order:+++++ - Statistics:Num rows: 266200010 Data size: 228937391620 Basic stats: COMPLETE Column stats: NONE - value expressions:_col5 (type: struct), _col6 (type: struct), _col7 (type: struct), _col8 (type: struct), _col9 (type: struct), _col10 (type: struct), _col11 (type: struct) - Group By Operator [GBY_41] - aggregations:["avg(_col4)","avg(_col5)","avg(_col6)","avg(_col7)","avg(_col8)","avg(_col9)","avg(_col10)"] - keys:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), '0' (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11"] - Statistics:Num rows: 266200010 Data size: 228937391620 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_39] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10"] - Statistics:Num rows: 53240002 Data size: 45787478324 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_88] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col18 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col4","_col5","_col6","_col7","_col8","_col14","_col16","_col21","_col23","_col24","_col25"] - | Statistics:Num rows: 53240002 Data size: 45787478324 Basic stats: COMPLETE Column stats: NONE - |<-Map 15 [SIMPLE_EDGE] - | Reduce Output Operator [RS_37] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_20] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_82] - | predicate:cd_demo_sk is not null (type: boolean) - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_18] - | alias:cd1 - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_36] - key expressions:_col18 (type: int) - Map-reduce partition columns:_col18 (type: int) - sort order:+ - Statistics:Num rows: 48400001 Data size: 41624979393 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)), _col14 (type: int), _col16 (type: string), _col21 (type: int), _col23 (type: string), _col24 (type: string), _col25 (type: string) - Merge Join Operator [MERGEJOIN_87] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col19 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col4","_col5","_col6","_col7","_col8","_col14","_col16","_col18","_col21","_col23","_col24","_col25"] - | Statistics:Num rows: 48400001 Data size: 41624979393 Basic stats: COMPLETE Column stats: NONE - |<-Map 14 [SIMPLE_EDGE] - | Reduce Output Operator [RS_34] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string), _col3 (type: string) - | Select Operator [SEL_17] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_81] - | predicate:((ca_state) IN ('ND', 'WI', 'AL', 'NC', 'OK', 'MS', 'TN') and ca_address_sk is not null) (type: boolean) - | Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_15] - | alias:customer_address - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_33] - key expressions:_col19 (type: int) - Map-reduce partition columns:_col19 (type: int) - sort order:+ - Statistics:Num rows: 44000000 Data size: 37840889538 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)), _col14 (type: int), _col16 (type: string), _col18 (type: int), _col21 (type: int) - Merge Join Operator [MERGEJOIN_86] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col4","_col5","_col6","_col7","_col8","_col14","_col16","_col18","_col19","_col21"] - | Statistics:Num rows: 44000000 Data size: 37840889538 Basic stats: COMPLETE Column stats: NONE - |<-Map 13 [SIMPLE_EDGE] - | Reduce Output Operator [RS_31] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 40000000 Data size: 34400807926 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: int), _col4 (type: int) - | Select Operator [SEL_14] - | outputColumnNames:["_col0","_col1","_col2","_col4"] - | Statistics:Num rows: 40000000 Data size: 34400807926 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_80] - | predicate:(((c_customer_sk is not null and (c_birth_month) IN (9, 5, 12, 4, 1, 10)) and c_current_addr_sk is not null) and c_current_cdemo_sk is not null) (type: boolean) - | Statistics:Num rows: 40000000 Data size: 34400807926 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_12] - | alias:customer - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_30] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)), _col14 (type: int), _col16 (type: string) - Merge Join Operator [MERGEJOIN_85] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col4","_col5","_col6","_col7","_col8","_col14","_col16"] - | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - |<-Map 12 [SIMPLE_EDGE] - | Reduce Output Operator [RS_28] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_11] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_79] - | predicate:i_item_sk is not null (type: boolean) - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_27] - key expressions:_col3 (type: int) - Map-reduce partition columns:_col3 (type: int) - sort order:+ - Statistics:Num rows: 44193 Data size: 49453132 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)), _col14 (type: int) - Merge Join Operator [MERGEJOIN_84] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col3","_col4","_col5","_col6","_col7","_col8","_col14"] - | Statistics:Num rows: 44193 Data size: 49453132 Basic stats: COMPLETE Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_25] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 4950 Data size: 1792764 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: int) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col3"] - | Statistics:Num rows: 4950 Data size: 1792764 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_78] - | predicate:(((cd_gender = 'M') and (cd_education_status = 'College')) and cd_demo_sk is not null) (type: boolean) - | Statistics:Num rows: 4950 Data size: 1792764 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:cd1 - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_24] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_83] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_21] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_76] - | predicate:(((cs_sold_date_sk is not null and cs_bill_cdemo_sk is not null) and cs_item_sk is not null) and cs_bill_customer_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:catalog_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - Reduce Output Operator [RS_22] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_77] - predicate:(d_date_sk is not null and (d_year = 2001)) (type: boolean) - Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:date_dim - Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 9 + File Output Operator [FS_48] + Limit [LIM_47] (rows=100 width=860) + Number of rows:100 + Select Operator [SEL_46] (rows=133100005 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10"] + <-Reducer 8 [SIMPLE_EDGE] + SHUFFLE [RS_45] + Select Operator [SEL_44] (rows=133100005 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10"] + Group By Operator [GBY_43] (rows=133100005 width=860) + Output:["_col0","_col1","_col2","_col3","_col5","_col6","_col7","_col8","_col9","_col10","_col11"],aggregations:["avg(VALUE._col0)","avg(VALUE._col1)","avg(VALUE._col2)","avg(VALUE._col3)","avg(VALUE._col4)","avg(VALUE._col5)","avg(VALUE._col6)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4 + <-Reducer 7 [SIMPLE_EDGE] + SHUFFLE [RS_42] + PartitionCols:_col0, _col1, _col2, _col3, _col4 + Group By Operator [GBY_41] (rows=266200010 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11"],aggregations:["avg(_col4)","avg(_col5)","avg(_col6)","avg(_col7)","avg(_col8)","avg(_col9)","avg(_col10)"],keys:_col0, _col1, _col2, _col3, '0' + Select Operator [SEL_39] (rows=53240002 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10"] + Merge Join Operator [MERGEJOIN_88] (rows=53240002 width=860) + Output:["_col4","_col5","_col6","_col7","_col8","_col14","_col16","_col21","_col23","_col24","_col25"],keys:{"0":"_col18","1":"_col0"} + <-Map 15 [SIMPLE_EDGE] + SHUFFLE [RS_37] + PartitionCols:_col0 + Select Operator [SEL_20] (rows=19800 width=362) + Output:["_col0"] + Filter Operator [FIL_82] (rows=19800 width=362) + predicate:cd_demo_sk is not null + TableScan [TS_18] (rows=19800 width=362) + default@customer_demographics,cd1,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_36] + PartitionCols:_col18 + Merge Join Operator [MERGEJOIN_87] (rows=48400001 width=860) + Output:["_col4","_col5","_col6","_col7","_col8","_col14","_col16","_col18","_col21","_col23","_col24","_col25"],keys:{"0":"_col19","1":"_col0"} + <-Map 14 [SIMPLE_EDGE] + SHUFFLE [RS_34] + PartitionCols:_col0 + Select Operator [SEL_17] (rows=20000000 width=1014) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_81] (rows=20000000 width=1014) + predicate:((ca_state) IN ('ND', 'WI', 'AL', 'NC', 'OK', 'MS', 'TN') and ca_address_sk is not null) + TableScan [TS_15] (rows=40000000 width=1014) + default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_county","ca_state","ca_country"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_33] + PartitionCols:_col19 + Merge Join Operator [MERGEJOIN_86] (rows=44000000 width=860) + Output:["_col4","_col5","_col6","_col7","_col8","_col14","_col16","_col18","_col19","_col21"],keys:{"0":"_col1","1":"_col0"} + <-Map 13 [SIMPLE_EDGE] + SHUFFLE [RS_31] + PartitionCols:_col0 + Select Operator [SEL_14] (rows=40000000 width=860) + Output:["_col0","_col1","_col2","_col4"] + Filter Operator [FIL_80] (rows=40000000 width=860) + predicate:(((c_customer_sk is not null and (c_birth_month) IN (9, 5, 12, 4, 1, 10)) and c_current_addr_sk is not null) and c_current_cdemo_sk is not null) + TableScan [TS_12] (rows=80000000 width=860) + default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_current_cdemo_sk","c_current_addr_sk","c_birth_month","c_birth_year"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_30] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_85] (rows=508200 width=1436) + Output:["_col1","_col4","_col5","_col6","_col7","_col8","_col14","_col16"],keys:{"0":"_col3","1":"_col0"} + <-Map 12 [SIMPLE_EDGE] + SHUFFLE [RS_28] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=462000 width=1436) + Output:["_col0","_col1"] + Filter Operator [FIL_79] (rows=462000 width=1436) + predicate:i_item_sk is not null + TableScan [TS_9] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_27] + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_84] (rows=44193 width=1119) + Output:["_col1","_col3","_col4","_col5","_col6","_col7","_col8","_col14"],keys:{"0":"_col2","1":"_col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=4950 width=362) + Output:["_col0","_col3"] + Filter Operator [FIL_78] (rows=4950 width=362) + predicate:(((cd_gender = 'M') and (cd_education_status = 'College')) and cd_demo_sk is not null) + TableScan [TS_6] (rows=19800 width=362) + default@customer_demographics,cd1,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_gender","cd_education_status","cd_dep_count"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_24] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_83] (rows=40176 width=1119) + Output:["_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_21] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] + Filter Operator [FIL_76] (rows=1 width=0) + predicate:(((cs_sold_date_sk is not null and cs_bill_cdemo_sk is not null) and cs_item_sk is not null) and cs_bill_customer_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@catalog_sales,catalog_sales,Tbl:PARTIAL,Col:NONE,Output:["cs_sold_date_sk","cs_bill_customer_sk","cs_bill_cdemo_sk","cs_item_sk","cs_quantity","cs_list_price","cs_sales_price","cs_coupon_amt","cs_net_profit"] + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_22] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_77] (rows=36524 width=1119) + predicate:(d_date_sk is not null and (d_year = 2001)) + TableScan [TS_3] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] diff --git a/ql/src/test/results/clientpositive/perf/query19.q.out b/ql/src/test/results/clientpositive/perf/query19.q.out index d565839..a1f027f 100644 --- a/ql/src/test/results/clientpositive/perf/query19.q.out +++ b/ql/src/test/results/clientpositive/perf/query19.q.out @@ -14,194 +14,102 @@ Reducer 7 <- Reducer 6 (SIMPLE_EDGE) Reducer 8 <- Reducer 7 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 8 - File Output Operator [FS_43] - compressed:false - Statistics:Num rows: 100 Data size: 86000 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_42] - Number of rows:100 - Statistics:Num rows: 100 Data size: 86000 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_41] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 53240002 Data size: 45787477895 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_40] - key expressions:_col4 (type: decimal(17,2)), _col1 (type: string), _col0 (type: int), _col2 (type: int), _col3 (type: string) - sort order:-++++ - Statistics:Num rows: 53240002 Data size: 45787477895 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_37] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: int), KEY._col1 (type: string), KEY._col2 (type: int), KEY._col3 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 53240002 Data size: 45787477895 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_36] - key expressions:_col0 (type: int), _col1 (type: string), _col2 (type: int), _col3 (type: string) - Map-reduce partition columns:_col0 (type: int), _col1 (type: string), _col2 (type: int), _col3 (type: string) - sort order:++++ - Statistics:Num rows: 106480005 Data size: 91574956652 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: decimal(17,2)) - Group By Operator [GBY_35] - aggregations:["sum(_col7)"] - keys:_col9 (type: int), _col10 (type: string), _col11 (type: int), _col12 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - Statistics:Num rows: 106480005 Data size: 91574956652 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_34] - outputColumnNames:["_col9","_col10","_col11","_col12","_col7"] - Statistics:Num rows: 106480005 Data size: 91574956652 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_33] - predicate:(substr(_col17, 1, 5) <> substr(_col19, 1, 5)) (type: boolean) - Statistics:Num rows: 106480005 Data size: 91574956652 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_74] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col6 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col7","_col9","_col10","_col11","_col12","_col17","_col19"] - | Statistics:Num rows: 106480005 Data size: 91574956652 Basic stats: COMPLETE Column stats: NONE - |<-Map 13 [SIMPLE_EDGE] - | Reduce Output Operator [RS_31] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_17] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_69] - | predicate:s_store_sk is not null (type: boolean) - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_15] - | alias:store - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_30] - key expressions:_col6 (type: int) - Map-reduce partition columns:_col6 (type: int) - sort order:+ - Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - value expressions:_col7 (type: decimal(7,2)), _col9 (type: int), _col10 (type: string), _col11 (type: int), _col12 (type: string), _col17 (type: string) - Merge Join Operator [MERGEJOIN_73] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col15 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col6","_col7","_col9","_col10","_col11","_col12","_col17"] - | Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - |<-Map 12 [SIMPLE_EDGE] - | Reduce Output Operator [RS_28] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_14] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_68] - | predicate:ca_address_sk is not null (type: boolean) - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_12] - | alias:customer_address - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_27] - key expressions:_col15 (type: int) - Map-reduce partition columns:_col15 (type: int) - sort order:+ - Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - value expressions:_col6 (type: int), _col7 (type: decimal(7,2)), _col9 (type: int), _col10 (type: string), _col11 (type: int), _col12 (type: string) - Merge Join Operator [MERGEJOIN_72] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col5 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col6","_col7","_col9","_col10","_col11","_col12","_col15"] - | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_25] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int) - | Select Operator [SEL_11] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_67] - | predicate:(c_customer_sk is not null and c_current_addr_sk is not null) (type: boolean) - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:customer - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_24] - key expressions:_col5 (type: int) - Map-reduce partition columns:_col5 (type: int) - sort order:+ - Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - value expressions:_col6 (type: int), _col7 (type: decimal(7,2)), _col9 (type: int), _col10 (type: string), _col11 (type: int), _col12 (type: string) - Merge Join Operator [MERGEJOIN_71] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col4 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col5","_col6","_col7","_col9","_col10","_col11","_col12"] - | Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_22] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: string), _col3 (type: int), _col4 (type: string) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_66] - | predicate:((i_manager_id = 7) and i_item_sk is not null) (type: boolean) - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_21] - key expressions:_col4 (type: int) - Map-reduce partition columns:_col4 (type: int) - sort order:+ - Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - value expressions:_col5 (type: int), _col6 (type: int), _col7 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_70] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col4","_col5","_col6","_col7"] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_18] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_2] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_64] - | predicate:(((d_moy = 11) and d_date_sk is not null) and (d_year = 1999)) (type: boolean) - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - Reduce Output Operator [RS_19] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: decimal(7,2)) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_65] - predicate:(((ss_sold_date_sk is not null and ss_item_sk is not null) and ss_customer_sk is not null) and ss_store_sk is not null) (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_3] - alias:store_sales - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 8 + File Output Operator [FS_43] + Limit [LIM_42] (rows=100 width=860) + Number of rows:100 + Select Operator [SEL_41] (rows=53240002 width=860) + Output:["_col0","_col1","_col2","_col3","_col4"] + <-Reducer 7 [SIMPLE_EDGE] + SHUFFLE [RS_40] + Group By Operator [GBY_37] (rows=53240002 width=860) + Output:["_col0","_col1","_col2","_col3","_col4"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3 + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_36] + PartitionCols:_col0, _col1, _col2, _col3 + Group By Operator [GBY_35] (rows=106480005 width=860) + Output:["_col0","_col1","_col2","_col3","_col4"],aggregations:["sum(_col7)"],keys:_col9, _col10, _col11, _col12 + Select Operator [SEL_34] (rows=106480005 width=860) + Output:["_col9","_col10","_col11","_col12","_col7"] + Filter Operator [FIL_33] (rows=106480005 width=860) + predicate:(substr(_col17, 1, 5) <> substr(_col19, 1, 5)) + Merge Join Operator [MERGEJOIN_74] (rows=106480005 width=860) + Output:["_col7","_col9","_col10","_col11","_col12","_col17","_col19"],keys:{"0":"_col6","1":"_col0"} + <-Map 13 [SIMPLE_EDGE] + SHUFFLE [RS_31] + PartitionCols:_col0 + Select Operator [SEL_17] (rows=1704 width=1910) + Output:["_col0","_col1"] + Filter Operator [FIL_69] (rows=1704 width=1910) + predicate:s_store_sk is not null + TableScan [TS_15] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_zip"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_30] + PartitionCols:_col6 + Merge Join Operator [MERGEJOIN_73] (rows=96800003 width=860) + Output:["_col6","_col7","_col9","_col10","_col11","_col12","_col17"],keys:{"0":"_col15","1":"_col0"} + <-Map 12 [SIMPLE_EDGE] + SHUFFLE [RS_28] + PartitionCols:_col0 + Select Operator [SEL_14] (rows=40000000 width=1014) + Output:["_col0","_col1"] + Filter Operator [FIL_68] (rows=40000000 width=1014) + predicate:ca_address_sk is not null + TableScan [TS_12] (rows=40000000 width=1014) + default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_zip"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_27] + PartitionCols:_col15 + Merge Join Operator [MERGEJOIN_72] (rows=88000001 width=860) + Output:["_col6","_col7","_col9","_col10","_col11","_col12","_col15"],keys:{"0":"_col5","1":"_col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=80000000 width=860) + Output:["_col0","_col1"] + Filter Operator [FIL_67] (rows=80000000 width=860) + predicate:(c_customer_sk is not null and c_current_addr_sk is not null) + TableScan [TS_9] (rows=80000000 width=860) + default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_current_addr_sk"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_24] + PartitionCols:_col5 + Merge Join Operator [MERGEJOIN_71] (rows=254100 width=1436) + Output:["_col5","_col6","_col7","_col9","_col10","_col11","_col12"],keys:{"0":"_col4","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_22] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=231000 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_66] (rows=231000 width=1436) + predicate:((i_manager_id = 7) and i_item_sk is not null) + TableScan [TS_6] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_brand_id","i_brand","i_manufact_id","i_manufact","i_manager_id"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_21] + PartitionCols:_col4 + Merge Join Operator [MERGEJOIN_70] (rows=20088 width=1119) + Output:["_col4","_col5","_col6","_col7"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_64] (rows=18262 width=1119) + predicate:(((d_moy = 11) and d_date_sk is not null) and (d_year = 1999)) + TableScan [TS_0] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"] + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_65] (rows=1 width=0) + predicate:(((ss_sold_date_sk is not null and ss_item_sk is not null) and ss_customer_sk is not null) and ss_store_sk is not null) + TableScan [TS_3] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_customer_sk","ss_store_sk","ss_ext_sales_price"] diff --git a/ql/src/test/results/clientpositive/perf/query20.q.out b/ql/src/test/results/clientpositive/perf/query20.q.out index 40c9a17..4e2706c 100644 --- a/ql/src/test/results/clientpositive/perf/query20.q.out +++ b/ql/src/test/results/clientpositive/perf/query20.q.out @@ -12,127 +12,69 @@ Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Reducer 6 <- Reducer 5 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 6 - File Output Operator [FS_28] - compressed:false - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_27] - Number of rows:100 - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_26] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_25] - key expressions:_col1 (type: string), _col2 (type: string), _col4 (type: string), _col0 (type: string), _col6 (type: decimal(38,23)) - sort order:+++++ - Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: decimal(7,2)), _col5 (type: decimal(17,2)) - Select Operator [SEL_23] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - PTF Operator [PTF_22] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col3","partition by:":"_col3"}] - Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_21] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_20] - key expressions:_col3 (type: string) - Map-reduce partition columns:_col3 (type: string) - sort order:+ - Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col4 (type: decimal(7,2)), _col5 (type: decimal(17,2)) - Select Operator [SEL_19] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_18] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: decimal(7,2)), KEY._col3 (type: string), KEY._col4 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_17] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: decimal(7,2)), _col3 (type: string), _col4 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: decimal(7,2)), _col3 (type: string), _col4 (type: string) - sort order:+++++ - Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - value expressions:_col5 (type: decimal(17,2)) - Group By Operator [GBY_16] - aggregations:["sum(_col2)"] - keys:_col4 (type: string), _col5 (type: string), _col6 (type: decimal(7,2)), _col7 (type: string), _col8 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_15] - outputColumnNames:["_col4","_col5","_col6","_col7","_col8","_col2"] - Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_38] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col2","_col4","_col5","_col6","_col7","_col8"] - | Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - | Reduce Output Operator [RS_13] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_8] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_36] - | predicate:(d_date BETWEEN '2001-01-12' AND '2001-02-11' and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_12] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: decimal(7,2)), _col4 (type: string), _col5 (type: string), _col6 (type: decimal(7,2)), _col7 (type: string), _col8 (type: string) - Merge Join Operator [MERGEJOIN_37] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2","_col4","_col5","_col6","_col7","_col8"] - | Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_9] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col2 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_34] - | predicate:(cs_item_sk is not null and cs_sold_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:catalog_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string), _col2 (type: string), _col3 (type: decimal(7,2)), _col4 (type: string), _col5 (type: string) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_35] - predicate:((i_category) IN ('Jewelry', 'Sports', 'Books') and i_item_sk is not null) (type: boolean) - Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:item - Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 6 + File Output Operator [FS_28] + Limit [LIM_27] (rows=100 width=1436) + Number of rows:100 + Select Operator [SEL_26] (rows=139755 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_25] + Select Operator [SEL_23] (rows=139755 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + PTF Operator [PTF_22] (rows=139755 width=1436) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col3","partition by:":"_col3"}] + Select Operator [SEL_21] (rows=139755 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_20] + PartitionCols:_col3 + Select Operator [SEL_19] (rows=139755 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Group By Operator [GBY_18] (rows=139755 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4 + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_17] + PartitionCols:_col0, _col1, _col2, _col3, _col4 + Group By Operator [GBY_16] (rows=279510 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["sum(_col2)"],keys:_col4, _col5, _col6, _col7, _col8 + Select Operator [SEL_15] (rows=279510 width=1436) + Output:["_col4","_col5","_col6","_col7","_col8","_col2"] + Merge Join Operator [MERGEJOIN_38] (rows=279510 width=1436) + Output:["_col2","_col4","_col5","_col6","_col7","_col8"],keys:{"0":"_col0","1":"_col0"} + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_36] (rows=36524 width=1119) + predicate:(d_date BETWEEN '2001-01-12' AND '2001-02-11' and d_date_sk is not null) + TableScan [TS_6] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_37] (rows=254100 width=1436) + Output:["_col0","_col2","_col4","_col5","_col6","_col7","_col8"],keys:{"0":"_col1","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col1 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_34] (rows=1 width=0) + predicate:(cs_item_sk is not null and cs_sold_date_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@catalog_sales,catalog_sales,Tbl:PARTIAL,Col:NONE,Output:["cs_sold_date_sk","cs_item_sk","cs_ext_sales_price"] + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_10] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=231000 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Filter Operator [FIL_35] (rows=231000 width=1436) + predicate:((i_category) IN ('Jewelry', 'Sports', 'Books') and i_item_sk is not null) + TableScan [TS_3] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id","i_item_desc","i_current_price","i_class","i_category"] diff --git a/ql/src/test/results/clientpositive/perf/query21.q.out b/ql/src/test/results/clientpositive/perf/query21.q.out index 2634d3d..a68b0c1 100644 --- a/ql/src/test/results/clientpositive/perf/query21.q.out +++ b/ql/src/test/results/clientpositive/perf/query21.q.out @@ -62,140 +62,74 @@ Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Reducer 6 <- Reducer 5 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 6 - File Output Operator [FS_31] - compressed:false - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_30] - Number of rows:100 - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_29] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 69877 Data size: 100362804 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_28] - key expressions:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 69877 Data size: 100362804 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: bigint), _col3 (type: bigint) - Filter Operator [FIL_26] - predicate:CASE WHEN ((_col2 > 0)) THEN ((UDFToDouble(_col3) / UDFToDouble(_col2))) ELSE (null) END BETWEEN 0.6666666666666666 AND 1.5 (type: boolean) - Statistics:Num rows: 69877 Data size: 100362804 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_25] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_24] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: bigint), _col3 (type: bigint) - Group By Operator [GBY_23] - aggregations:["sum(_col2)","sum(_col3)"] - keys:_col0 (type: string), _col1 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_21] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_47] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col3","_col5","_col7","_col10"] - | Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_11] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_44] - | predicate:(d_date BETWEEN '1998-03-09' AND '1998-05-07' and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: int), _col5 (type: string), _col7 (type: string) - Merge Join Operator [MERGEJOIN_46] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col3","_col5","_col7"] - | Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - | Reduce Output Operator [RS_16] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_43] - | predicate:(i_current_price BETWEEN 0.99 AND 1.49 and i_item_sk is not null) (type: boolean) - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_15] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 29 Data size: 30582 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col3 (type: int), _col5 (type: string) - Merge Join Operator [MERGEJOIN_45] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col1","_col3","_col5"] - | Statistics:Num rows: 29 Data size: 30582 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_12] - | key expressions:_col2 (type: int) - | Map-reduce partition columns:_col2 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col1 (type: int), _col3 (type: int) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_41] - | predicate:((inv_warehouse_sk is not null and inv_item_sk is not null) and inv_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:inventory - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_13] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_42] - predicate:w_warehouse_sk is not null (type: boolean) - Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:warehouse - Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 6 + File Output Operator [FS_31] + Limit [LIM_30] (rows=100 width=1436) + Number of rows:100 + Select Operator [SEL_29] (rows=69877 width=1436) + Output:["_col0","_col1","_col2","_col3"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_28] + Filter Operator [FIL_26] (rows=69877 width=1436) + predicate:CASE WHEN ((_col2 > 0)) THEN ((UDFToDouble(_col3) / UDFToDouble(_col2))) ELSE (null) END BETWEEN 0.6666666666666666 AND 1.5 + Group By Operator [GBY_25] (rows=139755 width=1436) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"],keys:KEY._col0, KEY._col1 + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_24] + PartitionCols:_col0, _col1 + Group By Operator [GBY_23] (rows=279510 width=1436) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(_col2)","sum(_col3)"],keys:_col0, _col1 + Select Operator [SEL_21] (rows=279510 width=1436) + Output:["_col0","_col1","_col2","_col3"] + Merge Join Operator [MERGEJOIN_47] (rows=279510 width=1436) + Output:["_col3","_col5","_col7","_col10"],keys:{"0":"_col0","1":"_col0"} + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=36524 width=1119) + Output:["_col0","_col1"] + Filter Operator [FIL_44] (rows=36524 width=1119) + predicate:(d_date BETWEEN '1998-03-09' AND '1998-05-07' and d_date_sk is not null) + TableScan [TS_9] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_46] (rows=254100 width=1436) + Output:["_col0","_col3","_col5","_col7"],keys:{"0":"_col1","1":"_col0"} + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=231000 width=1436) + Output:["_col0","_col1"] + Filter Operator [FIL_43] (rows=231000 width=1436) + predicate:(i_current_price BETWEEN 0.99 AND 1.49 and i_item_sk is not null) + TableScan [TS_6] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id","i_current_price"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_45] (rows=29 width=1054) + Output:["_col0","_col1","_col3","_col5"],keys:{"0":"_col2","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col2 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_41] (rows=1 width=0) + predicate:((inv_warehouse_sk is not null and inv_item_sk is not null) and inv_date_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@inventory,inventory,Tbl:PARTIAL,Col:NONE,Output:["inv_date_sk","inv_item_sk","inv_warehouse_sk","inv_quantity_on_hand"] + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=27 width=1029) + Output:["_col0","_col1"] + Filter Operator [FIL_42] (rows=27 width=1029) + predicate:w_warehouse_sk is not null + TableScan [TS_3] (rows=27 width=1029) + default@warehouse,warehouse,Tbl:COMPLETE,Col:NONE,Output:["w_warehouse_sk","w_warehouse_name"] diff --git a/ql/src/test/results/clientpositive/perf/query22.q.out b/ql/src/test/results/clientpositive/perf/query22.q.out index 72935ed..a8ff977 100644 --- a/ql/src/test/results/clientpositive/perf/query22.q.out +++ b/ql/src/test/results/clientpositive/perf/query22.q.out @@ -12,137 +12,74 @@ Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Reducer 6 <- Reducer 5 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 6 - File Output Operator [FS_30] - compressed:false - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_29] - Number of rows:100 - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_28] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 1397550 Data size: 2007270467 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_27] - key expressions:_col4 (type: double), _col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string) - sort order:+++++ - Statistics:Num rows: 1397550 Data size: 2007270467 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_25] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - Statistics:Num rows: 1397550 Data size: 2007270467 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_24] - | aggregations:["avg(VALUE._col0)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: string), KEY._col3 (type: string), KEY._col4 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col5"] - | Statistics:Num rows: 1397550 Data size: 2007270467 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_23] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string) - sort order:+++++ - Statistics:Num rows: 2795100 Data size: 4014540935 Basic stats: COMPLETE Column stats: NONE - value expressions:_col5 (type: struct) - Group By Operator [GBY_22] - aggregations:["avg(_col3)"] - keys:_col7 (type: string), _col8 (type: string), _col9 (type: string), _col10 (type: string), '0' (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 2795100 Data size: 4014540935 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_21] - outputColumnNames:["_col7","_col8","_col9","_col10","_col3"] - Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_46] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col3","_col7","_col8","_col9","_col10"] - | Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_11] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_43] - | predicate:w_warehouse_sk is not null (type: boolean) - | Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:warehouse - | Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: int), _col7 (type: string), _col8 (type: string), _col9 (type: string), _col10 (type: string) - Merge Join Operator [MERGEJOIN_45] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col2","_col3","_col7","_col8","_col9","_col10"] - | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - | Reduce Output Operator [RS_16] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_42] - | predicate:i_item_sk is not null (type: boolean) - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_15] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: int), _col3 (type: int) - Merge Join Operator [MERGEJOIN_44] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3"] - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_12] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_40] - | predicate:((inv_date_sk is not null and inv_item_sk is not null) and inv_warehouse_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:inventory - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_13] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_41] - predicate:(d_month_seq BETWEEN 1193 AND 1204 and d_date_sk is not null) (type: boolean) - Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:date_dim - Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 6 + File Output Operator [FS_30] + Limit [LIM_29] (rows=100 width=1436) + Number of rows:100 + Select Operator [SEL_28] (rows=1397550 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_27] + Select Operator [SEL_25] (rows=1397550 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4"] + Group By Operator [GBY_24] (rows=1397550 width=1436) + Output:["_col0","_col1","_col2","_col3","_col5"],aggregations:["avg(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4 + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_23] + PartitionCols:_col0, _col1, _col2, _col3, _col4 + Group By Operator [GBY_22] (rows=2795100 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["avg(_col3)"],keys:_col7, _col8, _col9, _col10, '0' + Select Operator [SEL_21] (rows=559020 width=1436) + Output:["_col7","_col8","_col9","_col10","_col3"] + Merge Join Operator [MERGEJOIN_46] (rows=559020 width=1436) + Output:["_col3","_col7","_col8","_col9","_col10"],keys:{"0":"_col2","1":"_col0"} + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=27 width=1029) + Output:["_col0"] + Filter Operator [FIL_43] (rows=27 width=1029) + predicate:w_warehouse_sk is not null + TableScan [TS_9] (rows=27 width=1029) + default@warehouse,warehouse,Tbl:COMPLETE,Col:NONE,Output:["w_warehouse_sk"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_45] (rows=508200 width=1436) + Output:["_col2","_col3","_col7","_col8","_col9","_col10"],keys:{"0":"_col1","1":"_col0"} + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=462000 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_42] (rows=462000 width=1436) + predicate:i_item_sk is not null + TableScan [TS_6] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_brand","i_class","i_category","i_product_name"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_44] (rows=40176 width=1119) + Output:["_col1","_col2","_col3"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_40] (rows=1 width=0) + predicate:((inv_date_sk is not null and inv_item_sk is not null) and inv_warehouse_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@inventory,inventory,Tbl:PARTIAL,Col:NONE,Output:["inv_date_sk","inv_item_sk","inv_warehouse_sk","inv_quantity_on_hand"] + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_41] (rows=36524 width=1119) + predicate:(d_month_seq BETWEEN 1193 AND 1204 and d_date_sk is not null) + TableScan [TS_3] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_month_seq"] diff --git a/ql/src/test/results/clientpositive/perf/query25.q.out b/ql/src/test/results/clientpositive/perf/query25.q.out index dabc1c5..b305bb6 100644 --- a/ql/src/test/results/clientpositive/perf/query25.q.out +++ b/ql/src/test/results/clientpositive/perf/query25.q.out @@ -16,249 +16,130 @@ Reducer 8 <- Map 17 (SIMPLE_EDGE), Reducer 7 (SIMPLE_EDGE) Reducer 9 <- Reducer 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 10 - File Output Operator [FS_53] - compressed:false - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_52] - Number of rows:100 - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_51] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 254100 Data size: 364958259 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 9 [SIMPLE_EDGE] - Reduce Output Operator [RS_50] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string) - sort order:++++ - Statistics:Num rows: 254100 Data size: 364958259 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: decimal(17,2)), _col5 (type: decimal(17,2)), _col6 (type: decimal(17,2)) - Select Operator [SEL_49] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - Statistics:Num rows: 254100 Data size: 364958259 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_48] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: string), KEY._col3 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 254100 Data size: 364958259 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_47] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string) - sort order:++++ - Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: decimal(17,2)), _col5 (type: decimal(17,2)), _col6 (type: decimal(17,2)) - Group By Operator [GBY_46] - aggregations:["sum(_col5)","sum(_col10)","sum(_col14)"] - keys:_col25 (type: string), _col26 (type: string), _col28 (type: string), _col29 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_45] - outputColumnNames:["_col25","_col26","_col28","_col29","_col5","_col10","_col14"] - Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_103] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col5","_col10","_col14","_col25","_col26","_col28","_col29"] - | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - |<-Map 17 [SIMPLE_EDGE] - | Reduce Output Operator [RS_43] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string) - | Select Operator [SEL_23] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_96] - | predicate:i_item_sk is not null (type: boolean) - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_21] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_42] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 26735 Data size: 29919145 Basic stats: COMPLETE Column stats: NONE - value expressions:_col5 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col14 (type: decimal(7,2)), _col25 (type: string), _col26 (type: string) - Merge Join Operator [MERGEJOIN_102] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col5","_col10","_col14","_col25","_col26"] - | Statistics:Num rows: 26735 Data size: 29919145 Basic stats: COMPLETE Column stats: NONE - |<-Map 16 [SIMPLE_EDGE] - | Reduce Output Operator [RS_40] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string) - | Select Operator [SEL_20] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_95] - | predicate:s_store_sk is not null (type: boolean) - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_18] - | alias:store - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_39] - key expressions:_col3 (type: int) - Map-reduce partition columns:_col3 (type: int) - sort order:+ - Statistics:Num rows: 24305 Data size: 27199223 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col5 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col14 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_101] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col11 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col3","_col5","_col10","_col14"] - | Statistics:Num rows: 24305 Data size: 27199223 Basic stats: COMPLETE Column stats: NONE - |<-Map 15 [SIMPLE_EDGE] - | Reduce Output Operator [RS_37] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_17] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_94] - | predicate:(((d_year = 1998) and d_moy BETWEEN 4 AND 10) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_15] - | alias:d1 - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_36] - key expressions:_col11 (type: int) - Map-reduce partition columns:_col11 (type: int) - sort order:+ - Statistics:Num rows: 22096 Data size: 24726566 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col3 (type: int), _col5 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col14 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_100] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col6 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col3","_col5","_col10","_col11","_col14"] - | Statistics:Num rows: 22096 Data size: 24726566 Basic stats: COMPLETE Column stats: NONE - |<-Map 14 [SIMPLE_EDGE] - | Reduce Output Operator [RS_34] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_14] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_93] - | predicate:(((d_year = 1998) and d_moy BETWEEN 4 AND 10) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_12] - | alias:d1 - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_33] - key expressions:_col6 (type: int) - Map-reduce partition columns:_col6 (type: int) - sort order:+ - Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col3 (type: int), _col5 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: int), _col14 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_99] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col3","_col5","_col6","_col10","_col11","_col14"] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - |<-Map 13 [SIMPLE_EDGE] - | Reduce Output Operator [RS_31] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_11] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_92] - | predicate:(((d_year = 1998) and (d_moy = 4)) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:d1 - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_30] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col1 (type: int), _col3 (type: int), _col5 (type: decimal(7,2)), _col6 (type: int), _col10 (type: decimal(7,2)), _col11 (type: int), _col14 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_98] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col8 (type: int), _col7 (type: int)","1":"_col1 (type: int), _col2 (type: int)"} - | outputColumnNames:["_col0","_col1","_col3","_col5","_col6","_col10","_col11","_col14"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 12 [SIMPLE_EDGE] - | Reduce Output Operator [RS_28] - | key expressions:_col1 (type: int), _col2 (type: int) - | Map-reduce partition columns:_col1 (type: int), _col2 (type: int) - | sort order:++ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col3 (type: decimal(7,2)) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_91] - | predicate:((cs_item_sk is not null and cs_bill_customer_sk is not null) and cs_sold_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_6] - | alias:catalog_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_27] - key expressions:_col8 (type: int), _col7 (type: int) - Map-reduce partition columns:_col8 (type: int), _col7 (type: int) - sort order:++ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col0 (type: int), _col1 (type: int), _col3 (type: int), _col5 (type: decimal(7,2)), _col6 (type: int), _col10 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_97] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int), _col1 (type: int), _col4 (type: int)","1":"_col2 (type: int), _col1 (type: int), _col3 (type: int)"} - | outputColumnNames:["_col0","_col1","_col3","_col5","_col6","_col7","_col8","_col10"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_24] - | key expressions:_col2 (type: int), _col1 (type: int), _col4 (type: int) - | Map-reduce partition columns:_col2 (type: int), _col1 (type: int), _col4 (type: int) - | sort order:+++ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col3 (type: int), _col5 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_89] - | predicate:((((ss_ticket_number is not null and ss_customer_sk is not null) and ss_item_sk is not null) and ss_sold_date_sk is not null) and ss_store_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - Reduce Output Operator [RS_25] - key expressions:_col2 (type: int), _col1 (type: int), _col3 (type: int) - Map-reduce partition columns:_col2 (type: int), _col1 (type: int), _col3 (type: int) - sort order:+++ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col0 (type: int), _col4 (type: decimal(7,2)) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_90] - predicate:(((sr_ticket_number is not null and sr_customer_sk is not null) and sr_item_sk is not null) and sr_returned_date_sk is not null) (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_3] - alias:store_returns - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 10 + File Output Operator [FS_53] + Limit [LIM_52] (rows=100 width=1436) + Number of rows:100 + Select Operator [SEL_51] (rows=254100 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + <-Reducer 9 [SIMPLE_EDGE] + SHUFFLE [RS_50] + Select Operator [SEL_49] (rows=254100 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + Group By Operator [GBY_48] (rows=254100 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3 + <-Reducer 8 [SIMPLE_EDGE] + SHUFFLE [RS_47] + PartitionCols:_col0, _col1, _col2, _col3 + Group By Operator [GBY_46] (rows=508200 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"],aggregations:["sum(_col5)","sum(_col10)","sum(_col14)"],keys:_col25, _col26, _col28, _col29 + Select Operator [SEL_45] (rows=508200 width=1436) + Output:["_col25","_col26","_col28","_col29","_col5","_col10","_col14"] + Merge Join Operator [MERGEJOIN_103] (rows=508200 width=1436) + Output:["_col5","_col10","_col14","_col25","_col26","_col28","_col29"],keys:{"0":"_col1","1":"_col0"} + <-Map 17 [SIMPLE_EDGE] + SHUFFLE [RS_43] + PartitionCols:_col0 + Select Operator [SEL_23] (rows=462000 width=1436) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_96] (rows=462000 width=1436) + predicate:i_item_sk is not null + TableScan [TS_21] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id","i_item_desc"] + <-Reducer 7 [SIMPLE_EDGE] + SHUFFLE [RS_42] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_102] (rows=26735 width=1119) + Output:["_col1","_col5","_col10","_col14","_col25","_col26"],keys:{"0":"_col3","1":"_col0"} + <-Map 16 [SIMPLE_EDGE] + SHUFFLE [RS_40] + PartitionCols:_col0 + Select Operator [SEL_20] (rows=1704 width=1910) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_95] (rows=1704 width=1910) + predicate:s_store_sk is not null + TableScan [TS_18] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_store_id","s_store_name"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_39] + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_101] (rows=24305 width=1119) + Output:["_col1","_col3","_col5","_col10","_col14"],keys:{"0":"_col11","1":"_col0"} + <-Map 15 [SIMPLE_EDGE] + SHUFFLE [RS_37] + PartitionCols:_col0 + Select Operator [SEL_17] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_94] (rows=18262 width=1119) + predicate:(((d_year = 1998) and d_moy BETWEEN 4 AND 10) and d_date_sk is not null) + TableScan [TS_15] (rows=73049 width=1119) + default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_36] + PartitionCols:_col11 + Merge Join Operator [MERGEJOIN_100] (rows=22096 width=1119) + Output:["_col1","_col3","_col5","_col10","_col11","_col14"],keys:{"0":"_col6","1":"_col0"} + <-Map 14 [SIMPLE_EDGE] + SHUFFLE [RS_34] + PartitionCols:_col0 + Select Operator [SEL_14] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_93] (rows=18262 width=1119) + predicate:(((d_year = 1998) and d_moy BETWEEN 4 AND 10) and d_date_sk is not null) + TableScan [TS_12] (rows=73049 width=1119) + default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_33] + PartitionCols:_col6 + Merge Join Operator [MERGEJOIN_99] (rows=20088 width=1119) + Output:["_col1","_col3","_col5","_col6","_col10","_col11","_col14"],keys:{"0":"_col0","1":"_col0"} + <-Map 13 [SIMPLE_EDGE] + SHUFFLE [RS_31] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_92] (rows=18262 width=1119) + predicate:(((d_year = 1998) and (d_moy = 4)) and d_date_sk is not null) + TableScan [TS_9] (rows=73049 width=1119) + default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_30] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_98] (rows=1 width=0) + Output:["_col0","_col1","_col3","_col5","_col6","_col10","_col11","_col14"],keys:{"0":"_col8, _col7","1":"_col1, _col2"} + <-Map 12 [SIMPLE_EDGE] + SHUFFLE [RS_28] + PartitionCols:_col1, _col2 + Select Operator [SEL_8] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_91] (rows=1 width=0) + predicate:((cs_item_sk is not null and cs_bill_customer_sk is not null) and cs_sold_date_sk is not null) + TableScan [TS_6] (rows=1 width=0) + default@catalog_sales,catalog_sales,Tbl:PARTIAL,Col:NONE,Output:["cs_sold_date_sk","cs_bill_customer_sk","cs_item_sk","cs_net_profit"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_27] + PartitionCols:_col8, _col7 + Merge Join Operator [MERGEJOIN_97] (rows=1 width=0) + Output:["_col0","_col1","_col3","_col5","_col6","_col7","_col8","_col10"],keys:{"0":"_col2, _col1, _col4","1":"_col2, _col1, _col3"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_24] + PartitionCols:_col2, _col1, _col4 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Filter Operator [FIL_89] (rows=1 width=0) + predicate:((((ss_ticket_number is not null and ss_customer_sk is not null) and ss_item_sk is not null) and ss_sold_date_sk is not null) and ss_store_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_customer_sk","ss_store_sk","ss_ticket_number","ss_net_profit"] + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col2, _col1, _col3 + Select Operator [SEL_5] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_90] (rows=1 width=0) + predicate:(((sr_ticket_number is not null and sr_customer_sk is not null) and sr_item_sk is not null) and sr_returned_date_sk is not null) + TableScan [TS_3] (rows=1 width=0) + default@store_returns,store_returns,Tbl:PARTIAL,Col:NONE,Output:["sr_returned_date_sk","sr_item_sk","sr_customer_sk","sr_ticket_number","sr_net_loss"] diff --git a/ql/src/test/results/clientpositive/perf/query26.q.out b/ql/src/test/results/clientpositive/perf/query26.q.out index 84cc238..15fd229 100644 --- a/ql/src/test/results/clientpositive/perf/query26.q.out +++ b/ql/src/test/results/clientpositive/perf/query26.q.out @@ -13,162 +13,86 @@ Reducer 6 <- Reducer 5 (SIMPLE_EDGE) Reducer 7 <- Reducer 6 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 7 - File Output Operator [FS_35] - compressed:false - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_34] - Number of rows:100 - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_33] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 279510 Data size: 401454093 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_32] - key expressions:_col0 (type: string) - sort order:+ - Statistics:Num rows: 279510 Data size: 401454093 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: double), _col2 (type: decimal(11,6)), _col3 (type: decimal(11,6)), _col4 (type: decimal(11,6)) - Group By Operator [GBY_30] - | aggregations:["avg(VALUE._col0)","avg(VALUE._col1)","avg(VALUE._col2)","avg(VALUE._col3)"] - | keys:KEY._col0 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 279510 Data size: 401454093 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_29] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: struct), _col2 (type: struct), _col3 (type: struct), _col4 (type: struct) - Group By Operator [GBY_28] - aggregations:["avg(_col4)","avg(_col5)","avg(_col7)","avg(_col6)"] - keys:_col15 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_27] - outputColumnNames:["_col15","_col4","_col5","_col7","_col6"] - Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_58] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col4","_col5","_col6","_col7","_col15"] - | Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_25] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 2300 Data size: 2713420 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_14] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 2300 Data size: 2713420 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_54] - | predicate:(((p_channel_email = 'N') or (p_channel_event = 'N')) and p_promo_sk is not null) (type: boolean) - | Statistics:Num rows: 2300 Data size: 2713420 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_12] - | alias:promotion - | Statistics:Num rows: 2300 Data size: 2713420 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_24] - key expressions:_col3 (type: int) - Map-reduce partition columns:_col3 (type: int) - sort order:+ - Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)), _col15 (type: string) - Merge Join Operator [MERGEJOIN_57] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col3","_col4","_col5","_col6","_col7","_col15"] - | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_22] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_11] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_53] - | predicate:i_item_sk is not null (type: boolean) - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_21] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: int), _col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_56] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col2","_col3","_col4","_col5","_col6","_col7"] - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_8] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_52] - | predicate:((d_year = 1998) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 2722 Data size: 986020 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_55] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2","_col3","_col4","_col5","_col6","_col7"] - | Statistics:Num rows: 2722 Data size: 986020 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_15] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_50] - | predicate:(((cs_bill_cdemo_sk is not null and cs_sold_date_sk is not null) and cs_item_sk is not null) and cs_promo_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:catalog_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_16] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 2475 Data size: 896382 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 2475 Data size: 896382 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_51] - predicate:((((cd_gender = 'F') and (cd_marital_status = 'W')) and (cd_education_status = 'Primary')) and cd_demo_sk is not null) (type: boolean) - Statistics:Num rows: 2475 Data size: 896382 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:customer_demographics - Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 7 + File Output Operator [FS_35] + Limit [LIM_34] (rows=100 width=1436) + Number of rows:100 + Select Operator [SEL_33] (rows=279510 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_32] + Group By Operator [GBY_30] (rows=279510 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4"],aggregations:["avg(VALUE._col0)","avg(VALUE._col1)","avg(VALUE._col2)","avg(VALUE._col3)"],keys:KEY._col0 + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_29] + PartitionCols:_col0 + Group By Operator [GBY_28] (rows=559020 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4"],aggregations:["avg(_col4)","avg(_col5)","avg(_col7)","avg(_col6)"],keys:_col15 + Select Operator [SEL_27] (rows=559020 width=1436) + Output:["_col15","_col4","_col5","_col7","_col6"] + Merge Join Operator [MERGEJOIN_58] (rows=559020 width=1436) + Output:["_col4","_col5","_col6","_col7","_col15"],keys:{"0":"_col3","1":"_col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col0 + Select Operator [SEL_14] (rows=2300 width=1179) + Output:["_col0"] + Filter Operator [FIL_54] (rows=2300 width=1179) + predicate:(((p_channel_email = 'N') or (p_channel_event = 'N')) and p_promo_sk is not null) + TableScan [TS_12] (rows=2300 width=1179) + default@promotion,promotion,Tbl:COMPLETE,Col:NONE,Output:["p_promo_sk","p_channel_email","p_channel_event"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_24] + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_57] (rows=508200 width=1436) + Output:["_col3","_col4","_col5","_col6","_col7","_col15"],keys:{"0":"_col2","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_22] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=462000 width=1436) + Output:["_col0","_col1"] + Filter Operator [FIL_53] (rows=462000 width=1436) + predicate:i_item_sk is not null + TableScan [TS_9] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_21] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_56] (rows=40176 width=1119) + Output:["_col2","_col3","_col4","_col5","_col6","_col7"],keys:{"0":"_col0","1":"_col0"} + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_52] (rows=36524 width=1119) + predicate:((d_year = 1998) and d_date_sk is not null) + TableScan [TS_6] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_55] (rows=2722 width=362) + Output:["_col0","_col2","_col3","_col4","_col5","_col6","_col7"],keys:{"0":"_col1","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col1 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] + Filter Operator [FIL_50] (rows=1 width=0) + predicate:(((cs_bill_cdemo_sk is not null and cs_sold_date_sk is not null) and cs_item_sk is not null) and cs_promo_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@catalog_sales,catalog_sales,Tbl:PARTIAL,Col:NONE,Output:["cs_sold_date_sk","cs_bill_cdemo_sk","cs_item_sk","cs_promo_sk","cs_quantity","cs_list_price","cs_sales_price","cs_coupon_amt"] + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=2475 width=362) + Output:["_col0"] + Filter Operator [FIL_51] (rows=2475 width=362) + predicate:((((cd_gender = 'F') and (cd_marital_status = 'W')) and (cd_education_status = 'Primary')) and cd_demo_sk is not null) + TableScan [TS_3] (rows=19800 width=362) + default@customer_demographics,customer_demographics,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_gender","cd_marital_status","cd_education_status"] diff --git a/ql/src/test/results/clientpositive/perf/query27.q.out b/ql/src/test/results/clientpositive/perf/query27.q.out index ac38683..a7fee8b 100644 --- a/ql/src/test/results/clientpositive/perf/query27.q.out +++ b/ql/src/test/results/clientpositive/perf/query27.q.out @@ -13,166 +13,88 @@ Reducer 6 <- Reducer 5 (SIMPLE_EDGE) Reducer 7 <- Reducer 6 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 7 - File Output Operator [FS_35] - compressed:false - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_34] - Number of rows:100 - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_33] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 254100 Data size: 364958259 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_32] - key expressions:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 254100 Data size: 364958259 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: double), _col3 (type: decimal(11,6)), _col4 (type: decimal(11,6)), _col5 (type: decimal(11,6)) - Select Operator [SEL_31] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 254100 Data size: 364958259 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_30] - | aggregations:["avg(VALUE._col0)","avg(VALUE._col1)","avg(VALUE._col2)","avg(VALUE._col3)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 254100 Data size: 364958259 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_29] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: struct), _col3 (type: struct), _col4 (type: struct), _col5 (type: struct) - Group By Operator [GBY_28] - aggregations:["avg(_col4)","avg(_col5)","avg(_col7)","avg(_col6)"] - keys:_col15 (type: string), _col17 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_27] - outputColumnNames:["_col15","_col17","_col4","_col5","_col7","_col6"] - Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_58] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col4","_col5","_col6","_col7","_col15","_col17"] - | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_25] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_14] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_54] - | predicate:i_item_sk is not null (type: boolean) - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_12] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_24] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 44193 Data size: 49453132 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)), _col15 (type: string) - Merge Join Operator [MERGEJOIN_57] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col4","_col5","_col6","_col7","_col15"] - | Statistics:Num rows: 44193 Data size: 49453132 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_22] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_11] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_53] - | predicate:((s_state) IN ('KS', 'AL', 'MN', 'AL', 'SC', 'VT') and s_store_sk is not null) (type: boolean) - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:store - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_21] - key expressions:_col3 (type: int) - Map-reduce partition columns:_col3 (type: int) - sort order:+ - Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_56] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col3","_col4","_col5","_col6","_col7"] - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_8] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_52] - | predicate:((d_year = 1998) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 2722 Data size: 986020 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_55] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col1","_col3","_col4","_col5","_col6","_col7"] - | Statistics:Num rows: 2722 Data size: 986020 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_15] - | key expressions:_col2 (type: int) - | Map-reduce partition columns:_col2 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col1 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_50] - | predicate:(((ss_cdemo_sk is not null and ss_sold_date_sk is not null) and ss_store_sk is not null) and ss_item_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_16] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 2475 Data size: 896382 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 2475 Data size: 896382 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_51] - predicate:((((cd_gender = 'F') and (cd_marital_status = 'D')) and (cd_education_status = 'Unknown')) and cd_demo_sk is not null) (type: boolean) - Statistics:Num rows: 2475 Data size: 896382 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:customer_demographics - Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 7 + File Output Operator [FS_35] + Limit [LIM_34] (rows=100 width=1436) + Number of rows:100 + Select Operator [SEL_33] (rows=254100 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_32] + Select Operator [SEL_31] (rows=254100 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Group By Operator [GBY_30] (rows=254100 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["avg(VALUE._col0)","avg(VALUE._col1)","avg(VALUE._col2)","avg(VALUE._col3)"],keys:KEY._col0, KEY._col1 + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_29] + PartitionCols:_col0, _col1 + Group By Operator [GBY_28] (rows=508200 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["avg(_col4)","avg(_col5)","avg(_col7)","avg(_col6)"],keys:_col15, _col17 + Select Operator [SEL_27] (rows=508200 width=1436) + Output:["_col15","_col17","_col4","_col5","_col7","_col6"] + Merge Join Operator [MERGEJOIN_58] (rows=508200 width=1436) + Output:["_col4","_col5","_col6","_col7","_col15","_col17"],keys:{"0":"_col1","1":"_col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col0 + Select Operator [SEL_14] (rows=462000 width=1436) + Output:["_col0","_col1"] + Filter Operator [FIL_54] (rows=462000 width=1436) + predicate:i_item_sk is not null + TableScan [TS_12] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_24] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_57] (rows=44193 width=1119) + Output:["_col1","_col4","_col5","_col6","_col7","_col15"],keys:{"0":"_col3","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_22] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=852 width=1910) + Output:["_col0","_col1"] + Filter Operator [FIL_53] (rows=852 width=1910) + predicate:((s_state) IN ('KS', 'AL', 'MN', 'AL', 'SC', 'VT') and s_store_sk is not null) + TableScan [TS_9] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_state"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_21] + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_56] (rows=40176 width=1119) + Output:["_col1","_col3","_col4","_col5","_col6","_col7"],keys:{"0":"_col0","1":"_col0"} + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_52] (rows=36524 width=1119) + predicate:((d_year = 1998) and d_date_sk is not null) + TableScan [TS_6] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_55] (rows=2722 width=362) + Output:["_col0","_col1","_col3","_col4","_col5","_col6","_col7"],keys:{"0":"_col2","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col2 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] + Filter Operator [FIL_50] (rows=1 width=0) + predicate:(((ss_cdemo_sk is not null and ss_sold_date_sk is not null) and ss_store_sk is not null) and ss_item_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_cdemo_sk","ss_store_sk","ss_quantity","ss_list_price","ss_sales_price","ss_coupon_amt"] + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=2475 width=362) + Output:["_col0"] + Filter Operator [FIL_51] (rows=2475 width=362) + predicate:((((cd_gender = 'F') and (cd_marital_status = 'D')) and (cd_education_status = 'Unknown')) and cd_demo_sk is not null) + TableScan [TS_3] (rows=19800 width=362) + default@customer_demographics,customer_demographics,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_gender","cd_marital_status","cd_education_status"] diff --git a/ql/src/test/results/clientpositive/perf/query28.q.out b/ql/src/test/results/clientpositive/perf/query28.q.out index cac9ac3..bc6c3fe 100644 --- a/ql/src/test/results/clientpositive/perf/query28.q.out +++ b/ql/src/test/results/clientpositive/perf/query28.q.out @@ -121,237 +121,115 @@ Reducer 7 <- Reducer 17 (SIMPLE_EDGE), Reducer 6 (SIMPLE_EDGE) Reducer 9 <- Map 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 7 - File Output Operator [FS_64] - compressed:false - Statistics:Num rows: 1 Data size: 215 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_63] - Number of rows:100 - Statistics:Num rows: 1 Data size: 215 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_62] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17"] - Statistics:Num rows: 1 Data size: 215 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_75] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{} - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17"] - | Statistics:Num rows: 1 Data size: 215 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 17 [SIMPLE_EDGE] - | Reduce Output Operator [RS_60] - | sort order: - | Statistics:Num rows: 1 Data size: 136 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: decimal(11,6)), _col1 (type: bigint), _col2 (type: bigint) - | Group By Operator [GBY_40] - | | aggregations:["avg(VALUE._col0)","count(VALUE._col1)","count(DISTINCT KEY._col0:0._col0)"] - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 1 Data size: 136 Basic stats: COMPLETE Column stats: NONE - | |<-Map 16 [SIMPLE_EDGE] - | Reduce Output Operator [RS_39] - | key expressions:_col0 (type: decimal(7,2)) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col1 (type: struct), _col2 (type: bigint) - | Group By Operator [GBY_38] - | aggregations:["avg(ss_list_price)","count(ss_list_price)","count(DISTINCT ss_list_price)"] - | keys:ss_list_price (type: decimal(7,2)) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Select Operator [SEL_37] - | outputColumnNames:["ss_list_price"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_70] - | predicate:(ss_quantity BETWEEN 6 AND 10 and (ss_list_price BETWEEN 91 AND 101 or ss_coupon_amt BETWEEN 1430 AND 2430 or ss_wholesale_cost BETWEEN 32 AND 52)) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_35] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_59] - sort order: - Statistics:Num rows: 1 Data size: 196 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: decimal(11,6)), _col1 (type: bigint), _col2 (type: bigint), _col3 (type: decimal(11,6)), _col4 (type: bigint), _col5 (type: bigint), _col6 (type: decimal(11,6)), _col7 (type: bigint), _col8 (type: bigint), _col9 (type: decimal(11,6)), _col10 (type: bigint), _col11 (type: bigint), _col12 (type: decimal(11,6)), _col13 (type: bigint), _col14 (type: bigint) - Merge Join Operator [MERGEJOIN_74] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{} - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14"] - | Statistics:Num rows: 1 Data size: 196 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 15 [SIMPLE_EDGE] - | Reduce Output Operator [RS_57] - | sort order: - | Statistics:Num rows: 1 Data size: 136 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: decimal(11,6)), _col1 (type: bigint), _col2 (type: bigint) - | Group By Operator [GBY_33] - | | aggregations:["avg(VALUE._col0)","count(VALUE._col1)","count(DISTINCT KEY._col0:0._col0)"] - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 1 Data size: 136 Basic stats: COMPLETE Column stats: NONE - | |<-Map 14 [SIMPLE_EDGE] - | Reduce Output Operator [RS_32] - | key expressions:_col0 (type: decimal(7,2)) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col1 (type: struct), _col2 (type: bigint) - | Group By Operator [GBY_31] - | aggregations:["avg(ss_list_price)","count(ss_list_price)","count(DISTINCT ss_list_price)"] - | keys:ss_list_price (type: decimal(7,2)) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Select Operator [SEL_30] - | outputColumnNames:["ss_list_price"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_69] - | predicate:(ss_quantity BETWEEN 11 AND 15 and (ss_list_price BETWEEN 66 AND 76 or ss_coupon_amt BETWEEN 920 AND 1920 or ss_wholesale_cost BETWEEN 4 AND 24)) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_28] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_56] - sort order: - Statistics:Num rows: 1 Data size: 179 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: decimal(11,6)), _col1 (type: bigint), _col2 (type: bigint), _col3 (type: decimal(11,6)), _col4 (type: bigint), _col5 (type: bigint), _col6 (type: decimal(11,6)), _col7 (type: bigint), _col8 (type: bigint), _col9 (type: decimal(11,6)), _col10 (type: bigint), _col11 (type: bigint) - Merge Join Operator [MERGEJOIN_73] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{} - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11"] - | Statistics:Num rows: 1 Data size: 179 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 13 [SIMPLE_EDGE] - | Reduce Output Operator [RS_54] - | sort order: - | Statistics:Num rows: 1 Data size: 136 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: decimal(11,6)), _col1 (type: bigint), _col2 (type: bigint) - | Group By Operator [GBY_26] - | | aggregations:["avg(VALUE._col0)","count(VALUE._col1)","count(DISTINCT KEY._col0:0._col0)"] - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 1 Data size: 136 Basic stats: COMPLETE Column stats: NONE - | |<-Map 12 [SIMPLE_EDGE] - | Reduce Output Operator [RS_25] - | key expressions:_col0 (type: decimal(7,2)) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col1 (type: struct), _col2 (type: bigint) - | Group By Operator [GBY_24] - | aggregations:["avg(ss_list_price)","count(ss_list_price)","count(DISTINCT ss_list_price)"] - | keys:ss_list_price (type: decimal(7,2)) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Select Operator [SEL_23] - | outputColumnNames:["ss_list_price"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_68] - | predicate:(ss_quantity BETWEEN 16 AND 20 and (ss_list_price BETWEEN 142 AND 152 or ss_coupon_amt BETWEEN 3054 AND 4054 or ss_wholesale_cost BETWEEN 80 AND 100)) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_21] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_53] - sort order: - Statistics:Num rows: 1 Data size: 163 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: decimal(11,6)), _col1 (type: bigint), _col2 (type: bigint), _col3 (type: decimal(11,6)), _col4 (type: bigint), _col5 (type: bigint), _col6 (type: decimal(11,6)), _col7 (type: bigint), _col8 (type: bigint) - Merge Join Operator [MERGEJOIN_72] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{} - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] - | Statistics:Num rows: 1 Data size: 163 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_51] - | sort order: - | Statistics:Num rows: 1 Data size: 136 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: decimal(11,6)), _col1 (type: bigint), _col2 (type: bigint) - | Group By Operator [GBY_19] - | | aggregations:["avg(VALUE._col0)","count(VALUE._col1)","count(DISTINCT KEY._col0:0._col0)"] - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 1 Data size: 136 Basic stats: COMPLETE Column stats: NONE - | |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_18] - | key expressions:_col0 (type: decimal(7,2)) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col1 (type: struct), _col2 (type: bigint) - | Group By Operator [GBY_17] - | aggregations:["avg(ss_list_price)","count(ss_list_price)","count(DISTINCT ss_list_price)"] - | keys:ss_list_price (type: decimal(7,2)) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Select Operator [SEL_16] - | outputColumnNames:["ss_list_price"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_67] - | predicate:(ss_quantity BETWEEN 21 AND 25 and (ss_list_price BETWEEN 135 AND 145 or ss_coupon_amt BETWEEN 14180 AND 15180 or ss_wholesale_cost BETWEEN 38 AND 58)) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_14] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_50] - sort order: - Statistics:Num rows: 1 Data size: 149 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: decimal(11,6)), _col1 (type: bigint), _col2 (type: bigint), _col3 (type: decimal(11,6)), _col4 (type: bigint), _col5 (type: bigint) - Merge Join Operator [MERGEJOIN_71] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{} - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 1 Data size: 149 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - | Reduce Output Operator [RS_47] - | sort order: - | Statistics:Num rows: 1 Data size: 136 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: decimal(11,6)), _col1 (type: bigint), _col2 (type: bigint) - | Group By Operator [GBY_5] - | | aggregations:["avg(VALUE._col0)","count(VALUE._col1)","count(DISTINCT KEY._col0:0._col0)"] - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 1 Data size: 136 Basic stats: COMPLETE Column stats: NONE - | |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_4] - | key expressions:_col0 (type: decimal(7,2)) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col1 (type: struct), _col2 (type: bigint) - | Group By Operator [GBY_3] - | aggregations:["avg(ss_list_price)","count(ss_list_price)","count(DISTINCT ss_list_price)"] - | keys:ss_list_price (type: decimal(7,2)) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Select Operator [SEL_2] - | outputColumnNames:["ss_list_price"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_65] - | predicate:(ss_quantity BETWEEN 0 AND 5 and (ss_list_price BETWEEN 11 AND 21 or ss_coupon_amt BETWEEN 460 AND 1460 or ss_wholesale_cost BETWEEN 14 AND 34)) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Reducer 9 [SIMPLE_EDGE] - Reduce Output Operator [RS_48] - sort order: - Statistics:Num rows: 1 Data size: 136 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: decimal(11,6)), _col1 (type: bigint), _col2 (type: bigint) - Group By Operator [GBY_12] - | aggregations:["avg(VALUE._col0)","count(VALUE._col1)","count(DISTINCT KEY._col0:0._col0)"] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 136 Basic stats: COMPLETE Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_11] - key expressions:_col0 (type: decimal(7,2)) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col1 (type: struct), _col2 (type: bigint) - Group By Operator [GBY_10] - aggregations:["avg(ss_list_price)","count(ss_list_price)","count(DISTINCT ss_list_price)"] - keys:ss_list_price (type: decimal(7,2)) - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Select Operator [SEL_9] - outputColumnNames:["ss_list_price"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_66] - predicate:(ss_quantity BETWEEN 26 AND 30 and (ss_list_price BETWEEN 28 AND 38 or ss_coupon_amt BETWEEN 2513 AND 3513 or ss_wholesale_cost BETWEEN 42 AND 62)) (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_7] - alias:store_sales - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 7 + File Output Operator [FS_64] + Limit [LIM_63] (rows=1 width=215) + Number of rows:100 + Select Operator [SEL_62] (rows=1 width=215) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17"] + Merge Join Operator [MERGEJOIN_75] (rows=1 width=215) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17"],keys:{} + <-Reducer 17 [SIMPLE_EDGE] + SHUFFLE [RS_60] + Group By Operator [GBY_40] (rows=1 width=136) + Output:["_col0","_col1","_col2"],aggregations:["avg(VALUE._col0)","count(VALUE._col1)","count(DISTINCT KEY._col0:0._col0)"] + <-Map 16 [SIMPLE_EDGE] + SHUFFLE [RS_39] + Group By Operator [GBY_38] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"],aggregations:["avg(ss_list_price)","count(ss_list_price)","count(DISTINCT ss_list_price)"],keys:ss_list_price + Select Operator [SEL_37] (rows=1 width=0) + Output:["ss_list_price"] + Filter Operator [FIL_70] (rows=1 width=0) + predicate:(ss_quantity BETWEEN 6 AND 10 and (ss_list_price BETWEEN 91 AND 101 or ss_coupon_amt BETWEEN 1430 AND 2430 or ss_wholesale_cost BETWEEN 32 AND 52)) + TableScan [TS_35] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_quantity","ss_wholesale_cost","ss_list_price","ss_coupon_amt"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_59] + Merge Join Operator [MERGEJOIN_74] (rows=1 width=196) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14"],keys:{} + <-Reducer 15 [SIMPLE_EDGE] + SHUFFLE [RS_57] + Group By Operator [GBY_33] (rows=1 width=136) + Output:["_col0","_col1","_col2"],aggregations:["avg(VALUE._col0)","count(VALUE._col1)","count(DISTINCT KEY._col0:0._col0)"] + <-Map 14 [SIMPLE_EDGE] + SHUFFLE [RS_32] + Group By Operator [GBY_31] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"],aggregations:["avg(ss_list_price)","count(ss_list_price)","count(DISTINCT ss_list_price)"],keys:ss_list_price + Select Operator [SEL_30] (rows=1 width=0) + Output:["ss_list_price"] + Filter Operator [FIL_69] (rows=1 width=0) + predicate:(ss_quantity BETWEEN 11 AND 15 and (ss_list_price BETWEEN 66 AND 76 or ss_coupon_amt BETWEEN 920 AND 1920 or ss_wholesale_cost BETWEEN 4 AND 24)) + TableScan [TS_28] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_quantity","ss_wholesale_cost","ss_list_price","ss_coupon_amt"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_56] + Merge Join Operator [MERGEJOIN_73] (rows=1 width=179) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11"],keys:{} + <-Reducer 13 [SIMPLE_EDGE] + SHUFFLE [RS_54] + Group By Operator [GBY_26] (rows=1 width=136) + Output:["_col0","_col1","_col2"],aggregations:["avg(VALUE._col0)","count(VALUE._col1)","count(DISTINCT KEY._col0:0._col0)"] + <-Map 12 [SIMPLE_EDGE] + SHUFFLE [RS_25] + Group By Operator [GBY_24] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"],aggregations:["avg(ss_list_price)","count(ss_list_price)","count(DISTINCT ss_list_price)"],keys:ss_list_price + Select Operator [SEL_23] (rows=1 width=0) + Output:["ss_list_price"] + Filter Operator [FIL_68] (rows=1 width=0) + predicate:(ss_quantity BETWEEN 16 AND 20 and (ss_list_price BETWEEN 142 AND 152 or ss_coupon_amt BETWEEN 3054 AND 4054 or ss_wholesale_cost BETWEEN 80 AND 100)) + TableScan [TS_21] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_quantity","ss_wholesale_cost","ss_list_price","ss_coupon_amt"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_53] + Merge Join Operator [MERGEJOIN_72] (rows=1 width=163) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"],keys:{} + <-Reducer 11 [SIMPLE_EDGE] + SHUFFLE [RS_51] + Group By Operator [GBY_19] (rows=1 width=136) + Output:["_col0","_col1","_col2"],aggregations:["avg(VALUE._col0)","count(VALUE._col1)","count(DISTINCT KEY._col0:0._col0)"] + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_18] + Group By Operator [GBY_17] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"],aggregations:["avg(ss_list_price)","count(ss_list_price)","count(DISTINCT ss_list_price)"],keys:ss_list_price + Select Operator [SEL_16] (rows=1 width=0) + Output:["ss_list_price"] + Filter Operator [FIL_67] (rows=1 width=0) + predicate:(ss_quantity BETWEEN 21 AND 25 and (ss_list_price BETWEEN 135 AND 145 or ss_coupon_amt BETWEEN 14180 AND 15180 or ss_wholesale_cost BETWEEN 38 AND 58)) + TableScan [TS_14] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_quantity","ss_wholesale_cost","ss_list_price","ss_coupon_amt"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_50] + Merge Join Operator [MERGEJOIN_71] (rows=1 width=149) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],keys:{} + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_47] + Group By Operator [GBY_5] (rows=1 width=136) + Output:["_col0","_col1","_col2"],aggregations:["avg(VALUE._col0)","count(VALUE._col1)","count(DISTINCT KEY._col0:0._col0)"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_4] + Group By Operator [GBY_3] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"],aggregations:["avg(ss_list_price)","count(ss_list_price)","count(DISTINCT ss_list_price)"],keys:ss_list_price + Select Operator [SEL_2] (rows=1 width=0) + Output:["ss_list_price"] + Filter Operator [FIL_65] (rows=1 width=0) + predicate:(ss_quantity BETWEEN 0 AND 5 and (ss_list_price BETWEEN 11 AND 21 or ss_coupon_amt BETWEEN 460 AND 1460 or ss_wholesale_cost BETWEEN 14 AND 34)) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_quantity","ss_wholesale_cost","ss_list_price","ss_coupon_amt"] + <-Reducer 9 [SIMPLE_EDGE] + SHUFFLE [RS_48] + Group By Operator [GBY_12] (rows=1 width=136) + Output:["_col0","_col1","_col2"],aggregations:["avg(VALUE._col0)","count(VALUE._col1)","count(DISTINCT KEY._col0:0._col0)"] + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_11] + Group By Operator [GBY_10] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"],aggregations:["avg(ss_list_price)","count(ss_list_price)","count(DISTINCT ss_list_price)"],keys:ss_list_price + Select Operator [SEL_9] (rows=1 width=0) + Output:["ss_list_price"] + Filter Operator [FIL_66] (rows=1 width=0) + predicate:(ss_quantity BETWEEN 26 AND 30 and (ss_list_price BETWEEN 28 AND 38 or ss_coupon_amt BETWEEN 2513 AND 3513 or ss_wholesale_cost BETWEEN 42 AND 62)) + TableScan [TS_7] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_quantity","ss_wholesale_cost","ss_list_price","ss_coupon_amt"] diff --git a/ql/src/test/results/clientpositive/perf/query29.q.out b/ql/src/test/results/clientpositive/perf/query29.q.out index 8991f35..09f057b 100644 --- a/ql/src/test/results/clientpositive/perf/query29.q.out +++ b/ql/src/test/results/clientpositive/perf/query29.q.out @@ -16,249 +16,130 @@ Reducer 8 <- Map 17 (SIMPLE_EDGE), Reducer 7 (SIMPLE_EDGE) Reducer 9 <- Reducer 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 10 - File Output Operator [FS_53] - compressed:false - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_52] - Number of rows:100 - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_51] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 254100 Data size: 364958259 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 9 [SIMPLE_EDGE] - Reduce Output Operator [RS_50] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string) - sort order:++++ - Statistics:Num rows: 254100 Data size: 364958259 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: bigint), _col5 (type: bigint), _col6 (type: bigint) - Select Operator [SEL_49] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - Statistics:Num rows: 254100 Data size: 364958259 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_48] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: string), KEY._col3 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 254100 Data size: 364958259 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_47] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string) - sort order:++++ - Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: bigint), _col5 (type: bigint), _col6 (type: bigint) - Group By Operator [GBY_46] - aggregations:["sum(_col5)","sum(_col10)","sum(_col14)"] - keys:_col24 (type: string), _col25 (type: string), _col27 (type: string), _col28 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_45] - outputColumnNames:["_col24","_col25","_col27","_col28","_col5","_col10","_col14"] - Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_103] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col5","_col10","_col14","_col24","_col25","_col27","_col28"] - | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - |<-Map 17 [SIMPLE_EDGE] - | Reduce Output Operator [RS_43] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string) - | Select Operator [SEL_23] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_96] - | predicate:i_item_sk is not null (type: boolean) - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_21] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_42] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 44193 Data size: 49453132 Basic stats: COMPLETE Column stats: NONE - value expressions:_col5 (type: int), _col10 (type: int), _col14 (type: int), _col24 (type: string), _col25 (type: string) - Merge Join Operator [MERGEJOIN_102] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col5","_col10","_col14","_col24","_col25"] - | Statistics:Num rows: 44193 Data size: 49453132 Basic stats: COMPLETE Column stats: NONE - |<-Map 16 [SIMPLE_EDGE] - | Reduce Output Operator [RS_40] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string) - | Select Operator [SEL_20] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_95] - | predicate:s_store_sk is not null (type: boolean) - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_18] - | alias:store - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_39] - key expressions:_col3 (type: int) - Map-reduce partition columns:_col3 (type: int) - sort order:+ - Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col5 (type: int), _col10 (type: int), _col14 (type: int) - Merge Join Operator [MERGEJOIN_101] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col11 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col3","_col5","_col10","_col14"] - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - |<-Map 15 [SIMPLE_EDGE] - | Reduce Output Operator [RS_37] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_17] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_94] - | predicate:((d_year) IN (2000, 2001, 2002) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_15] - | alias:d1 - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_36] - key expressions:_col11 (type: int) - Map-reduce partition columns:_col11 (type: int) - sort order:+ - Statistics:Num rows: 22096 Data size: 24726566 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col3 (type: int), _col5 (type: int), _col10 (type: int), _col14 (type: int) - Merge Join Operator [MERGEJOIN_100] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col6 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col3","_col5","_col10","_col11","_col14"] - | Statistics:Num rows: 22096 Data size: 24726566 Basic stats: COMPLETE Column stats: NONE - |<-Map 14 [SIMPLE_EDGE] - | Reduce Output Operator [RS_34] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_14] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_93] - | predicate:((d_moy BETWEEN 2 AND 5 and (d_year = 2000)) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_12] - | alias:d1 - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_33] - key expressions:_col6 (type: int) - Map-reduce partition columns:_col6 (type: int) - sort order:+ - Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col3 (type: int), _col5 (type: int), _col10 (type: int), _col11 (type: int), _col14 (type: int) - Merge Join Operator [MERGEJOIN_99] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col3","_col5","_col6","_col10","_col11","_col14"] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - |<-Map 13 [SIMPLE_EDGE] - | Reduce Output Operator [RS_31] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_11] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_92] - | predicate:(((d_year = 2000) and (d_moy = 2)) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:d1 - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_30] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col1 (type: int), _col3 (type: int), _col5 (type: int), _col6 (type: int), _col10 (type: int), _col11 (type: int), _col14 (type: int) - Merge Join Operator [MERGEJOIN_98] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col8 (type: int), _col7 (type: int)","1":"_col1 (type: int), _col2 (type: int)"} - | outputColumnNames:["_col0","_col1","_col3","_col5","_col6","_col10","_col11","_col14"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 12 [SIMPLE_EDGE] - | Reduce Output Operator [RS_28] - | key expressions:_col1 (type: int), _col2 (type: int) - | Map-reduce partition columns:_col1 (type: int), _col2 (type: int) - | sort order:++ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col3 (type: int) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_91] - | predicate:((cs_item_sk is not null and cs_bill_customer_sk is not null) and cs_sold_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_6] - | alias:catalog_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_27] - key expressions:_col8 (type: int), _col7 (type: int) - Map-reduce partition columns:_col8 (type: int), _col7 (type: int) - sort order:++ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col0 (type: int), _col1 (type: int), _col3 (type: int), _col5 (type: int), _col6 (type: int), _col10 (type: int) - Merge Join Operator [MERGEJOIN_97] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int), _col1 (type: int), _col4 (type: int)","1":"_col2 (type: int), _col1 (type: int), _col3 (type: int)"} - | outputColumnNames:["_col0","_col1","_col3","_col5","_col6","_col7","_col8","_col10"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_24] - | key expressions:_col2 (type: int), _col1 (type: int), _col4 (type: int) - | Map-reduce partition columns:_col2 (type: int), _col1 (type: int), _col4 (type: int) - | sort order:+++ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col3 (type: int), _col5 (type: int) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_89] - | predicate:((((ss_ticket_number is not null and ss_customer_sk is not null) and ss_item_sk is not null) and ss_sold_date_sk is not null) and ss_store_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - Reduce Output Operator [RS_25] - key expressions:_col2 (type: int), _col1 (type: int), _col3 (type: int) - Map-reduce partition columns:_col2 (type: int), _col1 (type: int), _col3 (type: int) - sort order:+++ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col0 (type: int), _col4 (type: int) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_90] - predicate:(((sr_ticket_number is not null and sr_customer_sk is not null) and sr_item_sk is not null) and sr_returned_date_sk is not null) (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_3] - alias:store_returns - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 10 + File Output Operator [FS_53] + Limit [LIM_52] (rows=100 width=1436) + Number of rows:100 + Select Operator [SEL_51] (rows=254100 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + <-Reducer 9 [SIMPLE_EDGE] + SHUFFLE [RS_50] + Select Operator [SEL_49] (rows=254100 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + Group By Operator [GBY_48] (rows=254100 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3 + <-Reducer 8 [SIMPLE_EDGE] + SHUFFLE [RS_47] + PartitionCols:_col0, _col1, _col2, _col3 + Group By Operator [GBY_46] (rows=508200 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"],aggregations:["sum(_col5)","sum(_col10)","sum(_col14)"],keys:_col24, _col25, _col27, _col28 + Select Operator [SEL_45] (rows=508200 width=1436) + Output:["_col24","_col25","_col27","_col28","_col5","_col10","_col14"] + Merge Join Operator [MERGEJOIN_103] (rows=508200 width=1436) + Output:["_col5","_col10","_col14","_col24","_col25","_col27","_col28"],keys:{"0":"_col1","1":"_col0"} + <-Map 17 [SIMPLE_EDGE] + SHUFFLE [RS_43] + PartitionCols:_col0 + Select Operator [SEL_23] (rows=462000 width=1436) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_96] (rows=462000 width=1436) + predicate:i_item_sk is not null + TableScan [TS_21] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id","i_item_desc"] + <-Reducer 7 [SIMPLE_EDGE] + SHUFFLE [RS_42] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_102] (rows=44193 width=1119) + Output:["_col1","_col5","_col10","_col14","_col24","_col25"],keys:{"0":"_col3","1":"_col0"} + <-Map 16 [SIMPLE_EDGE] + SHUFFLE [RS_40] + PartitionCols:_col0 + Select Operator [SEL_20] (rows=1704 width=1910) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_95] (rows=1704 width=1910) + predicate:s_store_sk is not null + TableScan [TS_18] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_store_id","s_store_name"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_39] + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_101] (rows=40176 width=1119) + Output:["_col1","_col3","_col5","_col10","_col14"],keys:{"0":"_col11","1":"_col0"} + <-Map 15 [SIMPLE_EDGE] + SHUFFLE [RS_37] + PartitionCols:_col0 + Select Operator [SEL_17] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_94] (rows=36524 width=1119) + predicate:((d_year) IN (2000, 2001, 2002) and d_date_sk is not null) + TableScan [TS_15] (rows=73049 width=1119) + default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_36] + PartitionCols:_col11 + Merge Join Operator [MERGEJOIN_100] (rows=22096 width=1119) + Output:["_col1","_col3","_col5","_col10","_col11","_col14"],keys:{"0":"_col6","1":"_col0"} + <-Map 14 [SIMPLE_EDGE] + SHUFFLE [RS_34] + PartitionCols:_col0 + Select Operator [SEL_14] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_93] (rows=18262 width=1119) + predicate:((d_moy BETWEEN 2 AND 5 and (d_year = 2000)) and d_date_sk is not null) + TableScan [TS_12] (rows=73049 width=1119) + default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_33] + PartitionCols:_col6 + Merge Join Operator [MERGEJOIN_99] (rows=20088 width=1119) + Output:["_col1","_col3","_col5","_col6","_col10","_col11","_col14"],keys:{"0":"_col0","1":"_col0"} + <-Map 13 [SIMPLE_EDGE] + SHUFFLE [RS_31] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_92] (rows=18262 width=1119) + predicate:(((d_year = 2000) and (d_moy = 2)) and d_date_sk is not null) + TableScan [TS_9] (rows=73049 width=1119) + default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_30] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_98] (rows=1 width=0) + Output:["_col0","_col1","_col3","_col5","_col6","_col10","_col11","_col14"],keys:{"0":"_col8, _col7","1":"_col1, _col2"} + <-Map 12 [SIMPLE_EDGE] + SHUFFLE [RS_28] + PartitionCols:_col1, _col2 + Select Operator [SEL_8] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_91] (rows=1 width=0) + predicate:((cs_item_sk is not null and cs_bill_customer_sk is not null) and cs_sold_date_sk is not null) + TableScan [TS_6] (rows=1 width=0) + default@catalog_sales,catalog_sales,Tbl:PARTIAL,Col:NONE,Output:["cs_sold_date_sk","cs_bill_customer_sk","cs_item_sk","cs_quantity"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_27] + PartitionCols:_col8, _col7 + Merge Join Operator [MERGEJOIN_97] (rows=1 width=0) + Output:["_col0","_col1","_col3","_col5","_col6","_col7","_col8","_col10"],keys:{"0":"_col2, _col1, _col4","1":"_col2, _col1, _col3"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_24] + PartitionCols:_col2, _col1, _col4 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Filter Operator [FIL_89] (rows=1 width=0) + predicate:((((ss_ticket_number is not null and ss_customer_sk is not null) and ss_item_sk is not null) and ss_sold_date_sk is not null) and ss_store_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_customer_sk","ss_store_sk","ss_ticket_number","ss_quantity"] + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col2, _col1, _col3 + Select Operator [SEL_5] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_90] (rows=1 width=0) + predicate:(((sr_ticket_number is not null and sr_customer_sk is not null) and sr_item_sk is not null) and sr_returned_date_sk is not null) + TableScan [TS_3] (rows=1 width=0) + default@store_returns,store_returns,Tbl:PARTIAL,Col:NONE,Output:["sr_returned_date_sk","sr_item_sk","sr_customer_sk","sr_ticket_number","sr_return_quantity"] diff --git a/ql/src/test/results/clientpositive/perf/query3.q.out b/ql/src/test/results/clientpositive/perf/query3.q.out index 871ad74..511d918 100644 --- a/ql/src/test/results/clientpositive/perf/query3.q.out +++ b/ql/src/test/results/clientpositive/perf/query3.q.out @@ -11,109 +11,58 @@ Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 5 - File Output Operator [FS_24] - compressed:false - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_23] - Number of rows:100 - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_22] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 127050 Data size: 182479129 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_21] - key expressions:_col0 (type: int), _col3 (type: decimal(17,2)), _col1 (type: int) - sort order:+-+ - Statistics:Num rows: 127050 Data size: 182479129 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: string) - Group By Operator [GBY_18] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: int), KEY._col1 (type: int), KEY._col2 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 127050 Data size: 182479129 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_17] - key expressions:_col0 (type: int), _col1 (type: int), _col2 (type: string) - Map-reduce partition columns:_col0 (type: int), _col1 (type: int), _col2 (type: string) - sort order:+++ - Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: decimal(17,2)) - Group By Operator [GBY_16] - aggregations:["sum(_col5)"] - keys:_col1 (type: int), _col7 (type: int), _col8 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_15] - outputColumnNames:["_col1","_col7","_col8","_col5"] - Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_34] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col4 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col5","_col7","_col8"] - | Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - | Reduce Output Operator [RS_13] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: string) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_32] - | predicate:((i_manufact_id = 436) and i_item_sk is not null) (type: boolean) - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_12] - key expressions:_col4 (type: int) - Map-reduce partition columns:_col4 (type: int) - sort order:+ - Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col5 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_33] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col4","_col5"] - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_9] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_30] - | predicate:((d_moy = 12) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:dt - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Map 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col1 (type: int), _col2 (type: decimal(7,2)) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_31] - predicate:(ss_sold_date_sk is not null and ss_item_sk is not null) (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_3] - alias:store_sales - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 5 + File Output Operator [FS_24] + Limit [LIM_23] (rows=100 width=1436) + Number of rows:100 + Select Operator [SEL_22] (rows=127050 width=1436) + Output:["_col0","_col1","_col2","_col3"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_21] + Group By Operator [GBY_18] (rows=127050 width=1436) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_17] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_16] (rows=254100 width=1436) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(_col5)"],keys:_col1, _col7, _col8 + Select Operator [SEL_15] (rows=254100 width=1436) + Output:["_col1","_col7","_col8","_col5"] + Merge Join Operator [MERGEJOIN_34] (rows=254100 width=1436) + Output:["_col1","_col5","_col7","_col8"],keys:{"0":"_col4","1":"_col0"} + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=231000 width=1436) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_32] (rows=231000 width=1436) + predicate:((i_manufact_id = 436) and i_item_sk is not null) + TableScan [TS_6] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_brand_id","i_brand","i_manufact_id"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col4 + Merge Join Operator [MERGEJOIN_33] (rows=40176 width=1119) + Output:["_col1","_col4","_col5"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=36524 width=1119) + Output:["_col0","_col1"] + Filter Operator [FIL_30] (rows=36524 width=1119) + predicate:((d_moy = 12) and d_date_sk is not null) + TableScan [TS_0] (rows=73049 width=1119) + default@date_dim,dt,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"] + <-Map 6 [SIMPLE_EDGE] + SHUFFLE [RS_10] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_31] (rows=1 width=0) + predicate:(ss_sold_date_sk is not null and ss_item_sk is not null) + TableScan [TS_3] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_ext_sales_price"] diff --git a/ql/src/test/results/clientpositive/perf/query31.q.out b/ql/src/test/results/clientpositive/perf/query31.q.out index 8c370c4..c178182 100644 --- a/ql/src/test/results/clientpositive/perf/query31.q.out +++ b/ql/src/test/results/clientpositive/perf/query31.q.out @@ -28,614 +28,316 @@ Reducer 6 <- Reducer 37 (SIMPLE_EDGE), Reducer 5 (SIMPLE_EDGE) Reducer 7 <- Reducer 6 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 7 - File Output Operator [FS_141] - compressed:false - Statistics:Num rows: 11831111 Data size: 12007156967 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_140] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 11831111 Data size: 12007156967 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_139] - key expressions:_col2 (type: decimal(37,20)) - sort order:+ - Statistics:Num rows: 11831111 Data size: 12007156967 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: string), _col3 (type: decimal(37,20)), _col4 (type: decimal(37,20)), _col5 (type: decimal(37,20)) - Select Operator [SEL_138] - outputColumnNames:["_col0","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 11831111 Data size: 12007156967 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_137] - predicate:(CASE WHEN ((_col19 > 0)) THEN ((_col23 / _col19)) ELSE (null) END > CASE WHEN ((_col7 > 0)) THEN ((_col11 / _col7)) ELSE (null) END) (type: boolean) - Statistics:Num rows: 11831111 Data size: 12007156967 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_281] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col12 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col0","_col3","_col7","_col11","_col15","_col19","_col23"] - | Statistics:Num rows: 35493334 Data size: 36021471918 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 37 [SIMPLE_EDGE] - | Reduce Output Operator [RS_135] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: decimal(17,2)) - | Select Operator [SEL_133] - | outputColumnNames:["_col0","_col3"] - | Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_132] - | | aggregations:["sum(VALUE._col0)"] - | | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: int) - | | outputColumnNames:["_col0","_col1","_col2","_col3"] - | | Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 36 [SIMPLE_EDGE] - | Reduce Output Operator [RS_131] - | key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: int) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: int) - | sort order:+++ - | Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: decimal(17,2)) - | Group By Operator [GBY_130] - | aggregations:["sum(_col3)"] - | keys:_col0 (type: string), 3 (type: int), 1998 (type: int) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_128] - | outputColumnNames:["_col0","_col3"] - | Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_279] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col2","_col7"] - | | Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - | |<-Map 39 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_126] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: string) - | | Select Operator [SEL_121] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_267] - | | predicate:(ca_address_sk is not null and ca_county is not null) (type: boolean) - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_119] - | | alias:customer_address - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 35 [SIMPLE_EDGE] - | Reduce Output Operator [RS_125] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col2 (type: decimal(7,2)) - | Merge Join Operator [MERGEJOIN_278] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col2"] - | | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | |<-Map 34 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_122] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col1 (type: int), _col2 (type: decimal(7,2)) - | | Select Operator [SEL_115] - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_265] - | | predicate:(ws_sold_date_sk is not null and ws_bill_addr_sk is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_113] - | | alias:web_sales - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 38 [SIMPLE_EDGE] - | Reduce Output Operator [RS_123] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_118] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_266] - | predicate:(((d_qoy = 3) and (d_year = 1998)) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_116] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_134] - key expressions:_col12 (type: string) - Map-reduce partition columns:_col12 (type: string) - sort order:+ - Statistics:Num rows: 32266667 Data size: 32746791943 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: string), _col3 (type: decimal(17,2)), _col7 (type: decimal(17,2)), _col11 (type: decimal(17,2)), _col15 (type: decimal(17,2)), _col19 (type: decimal(17,2)) - Select Operator [SEL_112] - outputColumnNames:["_col0","_col11","_col12","_col15","_col19","_col3","_col7"] - Statistics:Num rows: 32266667 Data size: 32746791943 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_111] - predicate:(CASE WHEN ((_col15 > 0)) THEN ((_col19 / _col15)) ELSE (null) END > CASE WHEN ((_col3 > 0)) THEN ((_col7 / _col3)) ELSE (null) END) (type: boolean) - Statistics:Num rows: 32266667 Data size: 32746791943 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_280] - | condition map:[{"":"Inner Join 0 to 1"},{"":"Inner Join 1 to 2"},{"":"Inner Join 0 to 3"},{"":"Inner Join 3 to 4"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)","2":"_col0 (type: string)","3":"_col0 (type: string)","4":"_col0 (type: string)"} - | outputColumnNames:["_col0","_col3","_col7","_col11","_col12","_col15","_col19"] - | Statistics:Num rows: 96800002 Data size: 98240376845 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 13 [SIMPLE_EDGE] - | Reduce Output Operator [RS_106] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: decimal(17,2)) - | Select Operator [SEL_41] - | outputColumnNames:["_col0","_col3"] - | Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_40] - | | aggregations:["sum(VALUE._col0)"] - | | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: int) - | | outputColumnNames:["_col0","_col1","_col2","_col3"] - | | Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 12 [SIMPLE_EDGE] - | Reduce Output Operator [RS_39] - | key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: int) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: int) - | sort order:+++ - | Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: decimal(17,2)) - | Group By Operator [GBY_38] - | aggregations:["sum(_col3)"] - | keys:_col0 (type: string), 2 (type: int), 1998 (type: int) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_36] - | outputColumnNames:["_col0","_col3"] - | Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_271] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col2","_col7"] - | | Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - | |<-Map 15 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_34] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: string) - | | Select Operator [SEL_29] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_255] - | | predicate:(ca_address_sk is not null and ca_county is not null) (type: boolean) - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_27] - | | alias:customer_address - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_33] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col2 (type: decimal(7,2)) - | Merge Join Operator [MERGEJOIN_270] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col2"] - | | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | |<-Map 10 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_30] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col1 (type: int), _col2 (type: decimal(7,2)) - | | Select Operator [SEL_23] - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_253] - | | predicate:(ss_sold_date_sk is not null and ss_addr_sk is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_21] - | | alias:store_sales - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 14 [SIMPLE_EDGE] - | Reduce Output Operator [RS_31] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_26] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_254] - | predicate:(((d_qoy = 2) and (d_year = 1998)) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_24] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 19 [SIMPLE_EDGE] - | Reduce Output Operator [RS_107] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: decimal(17,2)) - | Select Operator [SEL_62] - | outputColumnNames:["_col0","_col3"] - | Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_61] - | | aggregations:["sum(VALUE._col0)"] - | | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: int) - | | outputColumnNames:["_col0","_col1","_col2","_col3"] - | | Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 18 [SIMPLE_EDGE] - | Reduce Output Operator [RS_60] - | key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: int) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: int) - | sort order:+++ - | Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: decimal(17,2)) - | Group By Operator [GBY_59] - | aggregations:["sum(_col3)"] - | keys:_col0 (type: string), 3 (type: int), 1998 (type: int) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_57] - | outputColumnNames:["_col0","_col3"] - | Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_273] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col2","_col7"] - | | Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - | |<-Map 21 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_55] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: string) - | | Select Operator [SEL_50] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_258] - | | predicate:(ca_address_sk is not null and ca_county is not null) (type: boolean) - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_48] - | | alias:customer_address - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 17 [SIMPLE_EDGE] - | Reduce Output Operator [RS_54] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col2 (type: decimal(7,2)) - | Merge Join Operator [MERGEJOIN_272] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col2"] - | | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | |<-Map 16 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_51] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col1 (type: int), _col2 (type: decimal(7,2)) - | | Select Operator [SEL_44] - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_256] - | | predicate:(ss_sold_date_sk is not null and ss_addr_sk is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_42] - | | alias:store_sales - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 20 [SIMPLE_EDGE] - | Reduce Output Operator [RS_52] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_47] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_257] - | predicate:(((d_qoy = 3) and (d_year = 1998)) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_45] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 25 [SIMPLE_EDGE] - | Reduce Output Operator [RS_108] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: decimal(17,2)) - | Select Operator [SEL_83] - | outputColumnNames:["_col0","_col3"] - | Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_82] - | | aggregations:["sum(VALUE._col0)"] - | | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: int) - | | outputColumnNames:["_col0","_col1","_col2","_col3"] - | | Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 24 [SIMPLE_EDGE] - | Reduce Output Operator [RS_81] - | key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: int) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: int) - | sort order:+++ - | Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: decimal(17,2)) - | Group By Operator [GBY_80] - | aggregations:["sum(_col3)"] - | keys:_col0 (type: string), 1 (type: int), 1998 (type: int) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_78] - | outputColumnNames:["_col0","_col3"] - | Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_275] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col2","_col7"] - | | Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - | |<-Map 27 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_76] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: string) - | | Select Operator [SEL_71] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_261] - | | predicate:(ca_address_sk is not null and ca_county is not null) (type: boolean) - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_69] - | | alias:customer_address - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 23 [SIMPLE_EDGE] - | Reduce Output Operator [RS_75] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col2 (type: decimal(7,2)) - | Merge Join Operator [MERGEJOIN_274] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col2"] - | | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | |<-Map 22 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_72] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col1 (type: int), _col2 (type: decimal(7,2)) - | | Select Operator [SEL_65] - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_259] - | | predicate:(ws_sold_date_sk is not null and ws_bill_addr_sk is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_63] - | | alias:web_sales - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 26 [SIMPLE_EDGE] - | Reduce Output Operator [RS_73] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_68] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_260] - | predicate:(((d_year = 1998) and (d_qoy = 1)) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_66] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 31 [SIMPLE_EDGE] - | Reduce Output Operator [RS_109] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: decimal(17,2)) - | Select Operator [SEL_104] - | outputColumnNames:["_col0","_col3"] - | Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_103] - | | aggregations:["sum(VALUE._col0)"] - | | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: int) - | | outputColumnNames:["_col0","_col1","_col2","_col3"] - | | Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 30 [SIMPLE_EDGE] - | Reduce Output Operator [RS_102] - | key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: int) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: int) - | sort order:+++ - | Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: decimal(17,2)) - | Group By Operator [GBY_101] - | aggregations:["sum(_col3)"] - | keys:_col0 (type: string), 2 (type: int), 1998 (type: int) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_99] - | outputColumnNames:["_col0","_col3"] - | Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_277] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col2","_col7"] - | | Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - | |<-Map 33 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_97] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: string) - | | Select Operator [SEL_92] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_264] - | | predicate:(ca_address_sk is not null and ca_county is not null) (type: boolean) - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_90] - | | alias:customer_address - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 29 [SIMPLE_EDGE] - | Reduce Output Operator [RS_96] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col2 (type: decimal(7,2)) - | Merge Join Operator [MERGEJOIN_276] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col2"] - | | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | |<-Map 28 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_93] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col1 (type: int), _col2 (type: decimal(7,2)) - | | Select Operator [SEL_86] - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_262] - | | predicate:(ws_sold_date_sk is not null and ws_bill_addr_sk is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_84] - | | alias:web_sales - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 32 [SIMPLE_EDGE] - | Reduce Output Operator [RS_94] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_89] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_263] - | predicate:(((d_qoy = 2) and (d_year = 1998)) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_87] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_105] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: decimal(17,2)) - Select Operator [SEL_20] - outputColumnNames:["_col0","_col3"] - Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_19] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: int) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: int) - Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: int) - sort order:+++ - Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: decimal(17,2)) - Group By Operator [GBY_17] - aggregations:["sum(_col3)"] - keys:_col0 (type: string), 1 (type: int), 1998 (type: int) - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_15] - outputColumnNames:["_col0","_col3"] - Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_269] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col2","_col7"] - | Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_13] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_252] - | predicate:(ca_address_sk is not null and ca_county is not null) (type: boolean) - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:customer_address - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_12] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_268] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2"] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_9] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_250] - | predicate:(ss_sold_date_sk is not null and ss_addr_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_251] - predicate:(((d_year = 1998) and (d_qoy = 1)) and d_date_sk is not null) (type: boolean) - Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:date_dim - Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 7 + File Output Operator [FS_141] + Select Operator [SEL_140] (rows=11831111 width=1014) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_139] + Select Operator [SEL_138] (rows=11831111 width=1014) + Output:["_col0","_col2","_col3","_col4","_col5"] + Filter Operator [FIL_137] (rows=11831111 width=1014) + predicate:(CASE WHEN ((_col19 > 0)) THEN ((_col23 / _col19)) ELSE (null) END > CASE WHEN ((_col7 > 0)) THEN ((_col11 / _col7)) ELSE (null) END) + Merge Join Operator [MERGEJOIN_281] (rows=35493334 width=1014) + Output:["_col0","_col3","_col7","_col11","_col15","_col19","_col23"],keys:{"0":"_col12","1":"_col0"} + <-Reducer 37 [SIMPLE_EDGE] + SHUFFLE [RS_135] + PartitionCols:_col0 + Select Operator [SEL_133] (rows=22000000 width=1014) + Output:["_col0","_col3"] + Group By Operator [GBY_132] (rows=22000000 width=1014) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Reducer 36 [SIMPLE_EDGE] + SHUFFLE [RS_131] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_130] (rows=44000000 width=1014) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(_col3)"],keys:_col0, 3, 1998 + Select Operator [SEL_128] (rows=44000000 width=1014) + Output:["_col0","_col3"] + Merge Join Operator [MERGEJOIN_279] (rows=44000000 width=1014) + Output:["_col2","_col7"],keys:{"0":"_col1","1":"_col0"} + <-Map 39 [SIMPLE_EDGE] + SHUFFLE [RS_126] + PartitionCols:_col0 + Select Operator [SEL_121] (rows=40000000 width=1014) + Output:["_col0","_col1"] + Filter Operator [FIL_267] (rows=40000000 width=1014) + predicate:(ca_address_sk is not null and ca_county is not null) + TableScan [TS_119] (rows=40000000 width=1014) + default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_county"] + <-Reducer 35 [SIMPLE_EDGE] + SHUFFLE [RS_125] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_278] (rows=20088 width=1119) + Output:["_col1","_col2"],keys:{"0":"_col0","1":"_col0"} + <-Map 34 [SIMPLE_EDGE] + SHUFFLE [RS_122] + PartitionCols:_col0 + Select Operator [SEL_115] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_265] (rows=1 width=0) + predicate:(ws_sold_date_sk is not null and ws_bill_addr_sk is not null) + TableScan [TS_113] (rows=1 width=0) + default@web_sales,web_sales,Tbl:PARTIAL,Col:NONE,Output:["ws_sold_date_sk","ws_bill_addr_sk","ws_ext_sales_price"] + <-Map 38 [SIMPLE_EDGE] + SHUFFLE [RS_123] + PartitionCols:_col0 + Select Operator [SEL_118] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_266] (rows=18262 width=1119) + predicate:(((d_qoy = 3) and (d_year = 1998)) and d_date_sk is not null) + TableScan [TS_116] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_qoy"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_134] + PartitionCols:_col12 + Select Operator [SEL_112] (rows=32266667 width=1014) + Output:["_col0","_col11","_col12","_col15","_col19","_col3","_col7"] + Filter Operator [FIL_111] (rows=32266667 width=1014) + predicate:(CASE WHEN ((_col15 > 0)) THEN ((_col19 / _col15)) ELSE (null) END > CASE WHEN ((_col3 > 0)) THEN ((_col7 / _col3)) ELSE (null) END) + Merge Join Operator [MERGEJOIN_280] (rows=96800002 width=1014) + Output:["_col0","_col3","_col7","_col11","_col12","_col15","_col19"],keys:{"0":"_col0","1":"_col0","2":"_col0","3":"_col0","4":"_col0"} + <-Reducer 13 [SIMPLE_EDGE] + SHUFFLE [RS_106] + PartitionCols:_col0 + Select Operator [SEL_41] (rows=22000000 width=1014) + Output:["_col0","_col3"] + Group By Operator [GBY_40] (rows=22000000 width=1014) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Reducer 12 [SIMPLE_EDGE] + SHUFFLE [RS_39] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_38] (rows=44000000 width=1014) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(_col3)"],keys:_col0, 2, 1998 + Select Operator [SEL_36] (rows=44000000 width=1014) + Output:["_col0","_col3"] + Merge Join Operator [MERGEJOIN_271] (rows=44000000 width=1014) + Output:["_col2","_col7"],keys:{"0":"_col1","1":"_col0"} + <-Map 15 [SIMPLE_EDGE] + SHUFFLE [RS_34] + PartitionCols:_col0 + Select Operator [SEL_29] (rows=40000000 width=1014) + Output:["_col0","_col1"] + Filter Operator [FIL_255] (rows=40000000 width=1014) + predicate:(ca_address_sk is not null and ca_county is not null) + TableScan [TS_27] (rows=40000000 width=1014) + default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_county"] + <-Reducer 11 [SIMPLE_EDGE] + SHUFFLE [RS_33] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_270] (rows=20088 width=1119) + Output:["_col1","_col2"],keys:{"0":"_col0","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_30] + PartitionCols:_col0 + Select Operator [SEL_23] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_253] (rows=1 width=0) + predicate:(ss_sold_date_sk is not null and ss_addr_sk is not null) + TableScan [TS_21] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_addr_sk","ss_ext_sales_price"] + <-Map 14 [SIMPLE_EDGE] + SHUFFLE [RS_31] + PartitionCols:_col0 + Select Operator [SEL_26] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_254] (rows=18262 width=1119) + predicate:(((d_qoy = 2) and (d_year = 1998)) and d_date_sk is not null) + TableScan [TS_24] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_qoy"] + <-Reducer 19 [SIMPLE_EDGE] + SHUFFLE [RS_107] + PartitionCols:_col0 + Select Operator [SEL_62] (rows=22000000 width=1014) + Output:["_col0","_col3"] + Group By Operator [GBY_61] (rows=22000000 width=1014) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Reducer 18 [SIMPLE_EDGE] + SHUFFLE [RS_60] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_59] (rows=44000000 width=1014) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(_col3)"],keys:_col0, 3, 1998 + Select Operator [SEL_57] (rows=44000000 width=1014) + Output:["_col0","_col3"] + Merge Join Operator [MERGEJOIN_273] (rows=44000000 width=1014) + Output:["_col2","_col7"],keys:{"0":"_col1","1":"_col0"} + <-Map 21 [SIMPLE_EDGE] + SHUFFLE [RS_55] + PartitionCols:_col0 + Select Operator [SEL_50] (rows=40000000 width=1014) + Output:["_col0","_col1"] + Filter Operator [FIL_258] (rows=40000000 width=1014) + predicate:(ca_address_sk is not null and ca_county is not null) + TableScan [TS_48] (rows=40000000 width=1014) + default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_county"] + <-Reducer 17 [SIMPLE_EDGE] + SHUFFLE [RS_54] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_272] (rows=20088 width=1119) + Output:["_col1","_col2"],keys:{"0":"_col0","1":"_col0"} + <-Map 16 [SIMPLE_EDGE] + SHUFFLE [RS_51] + PartitionCols:_col0 + Select Operator [SEL_44] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_256] (rows=1 width=0) + predicate:(ss_sold_date_sk is not null and ss_addr_sk is not null) + TableScan [TS_42] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_addr_sk","ss_ext_sales_price"] + <-Map 20 [SIMPLE_EDGE] + SHUFFLE [RS_52] + PartitionCols:_col0 + Select Operator [SEL_47] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_257] (rows=18262 width=1119) + predicate:(((d_qoy = 3) and (d_year = 1998)) and d_date_sk is not null) + TableScan [TS_45] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_qoy"] + <-Reducer 25 [SIMPLE_EDGE] + SHUFFLE [RS_108] + PartitionCols:_col0 + Select Operator [SEL_83] (rows=22000000 width=1014) + Output:["_col0","_col3"] + Group By Operator [GBY_82] (rows=22000000 width=1014) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Reducer 24 [SIMPLE_EDGE] + SHUFFLE [RS_81] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_80] (rows=44000000 width=1014) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(_col3)"],keys:_col0, 1, 1998 + Select Operator [SEL_78] (rows=44000000 width=1014) + Output:["_col0","_col3"] + Merge Join Operator [MERGEJOIN_275] (rows=44000000 width=1014) + Output:["_col2","_col7"],keys:{"0":"_col1","1":"_col0"} + <-Map 27 [SIMPLE_EDGE] + SHUFFLE [RS_76] + PartitionCols:_col0 + Select Operator [SEL_71] (rows=40000000 width=1014) + Output:["_col0","_col1"] + Filter Operator [FIL_261] (rows=40000000 width=1014) + predicate:(ca_address_sk is not null and ca_county is not null) + TableScan [TS_69] (rows=40000000 width=1014) + default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_county"] + <-Reducer 23 [SIMPLE_EDGE] + SHUFFLE [RS_75] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_274] (rows=20088 width=1119) + Output:["_col1","_col2"],keys:{"0":"_col0","1":"_col0"} + <-Map 22 [SIMPLE_EDGE] + SHUFFLE [RS_72] + PartitionCols:_col0 + Select Operator [SEL_65] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_259] (rows=1 width=0) + predicate:(ws_sold_date_sk is not null and ws_bill_addr_sk is not null) + TableScan [TS_63] (rows=1 width=0) + default@web_sales,web_sales,Tbl:PARTIAL,Col:NONE,Output:["ws_sold_date_sk","ws_bill_addr_sk","ws_ext_sales_price"] + <-Map 26 [SIMPLE_EDGE] + SHUFFLE [RS_73] + PartitionCols:_col0 + Select Operator [SEL_68] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_260] (rows=18262 width=1119) + predicate:(((d_year = 1998) and (d_qoy = 1)) and d_date_sk is not null) + TableScan [TS_66] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_qoy"] + <-Reducer 31 [SIMPLE_EDGE] + SHUFFLE [RS_109] + PartitionCols:_col0 + Select Operator [SEL_104] (rows=22000000 width=1014) + Output:["_col0","_col3"] + Group By Operator [GBY_103] (rows=22000000 width=1014) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Reducer 30 [SIMPLE_EDGE] + SHUFFLE [RS_102] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_101] (rows=44000000 width=1014) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(_col3)"],keys:_col0, 2, 1998 + Select Operator [SEL_99] (rows=44000000 width=1014) + Output:["_col0","_col3"] + Merge Join Operator [MERGEJOIN_277] (rows=44000000 width=1014) + Output:["_col2","_col7"],keys:{"0":"_col1","1":"_col0"} + <-Map 33 [SIMPLE_EDGE] + SHUFFLE [RS_97] + PartitionCols:_col0 + Select Operator [SEL_92] (rows=40000000 width=1014) + Output:["_col0","_col1"] + Filter Operator [FIL_264] (rows=40000000 width=1014) + predicate:(ca_address_sk is not null and ca_county is not null) + TableScan [TS_90] (rows=40000000 width=1014) + default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_county"] + <-Reducer 29 [SIMPLE_EDGE] + SHUFFLE [RS_96] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_276] (rows=20088 width=1119) + Output:["_col1","_col2"],keys:{"0":"_col0","1":"_col0"} + <-Map 28 [SIMPLE_EDGE] + SHUFFLE [RS_93] + PartitionCols:_col0 + Select Operator [SEL_86] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_262] (rows=1 width=0) + predicate:(ws_sold_date_sk is not null and ws_bill_addr_sk is not null) + TableScan [TS_84] (rows=1 width=0) + default@web_sales,web_sales,Tbl:PARTIAL,Col:NONE,Output:["ws_sold_date_sk","ws_bill_addr_sk","ws_ext_sales_price"] + <-Map 32 [SIMPLE_EDGE] + SHUFFLE [RS_94] + PartitionCols:_col0 + Select Operator [SEL_89] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_263] (rows=18262 width=1119) + predicate:(((d_qoy = 2) and (d_year = 1998)) and d_date_sk is not null) + TableScan [TS_87] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_qoy"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_105] + PartitionCols:_col0 + Select Operator [SEL_20] (rows=22000000 width=1014) + Output:["_col0","_col3"] + Group By Operator [GBY_19] (rows=22000000 width=1014) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_17] (rows=44000000 width=1014) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(_col3)"],keys:_col0, 1, 1998 + Select Operator [SEL_15] (rows=44000000 width=1014) + Output:["_col0","_col3"] + Merge Join Operator [MERGEJOIN_269] (rows=44000000 width=1014) + Output:["_col2","_col7"],keys:{"0":"_col1","1":"_col0"} + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=40000000 width=1014) + Output:["_col0","_col1"] + Filter Operator [FIL_252] (rows=40000000 width=1014) + predicate:(ca_address_sk is not null and ca_county is not null) + TableScan [TS_6] (rows=40000000 width=1014) + default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_county"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_268] (rows=20088 width=1119) + Output:["_col1","_col2"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_250] (rows=1 width=0) + predicate:(ss_sold_date_sk is not null and ss_addr_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_addr_sk","ss_ext_sales_price"] + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_10] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_251] (rows=18262 width=1119) + predicate:(((d_year = 1998) and (d_qoy = 1)) and d_date_sk is not null) + TableScan [TS_3] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_qoy"] diff --git a/ql/src/test/results/clientpositive/perf/query32.q.out b/ql/src/test/results/clientpositive/perf/query32.q.out index da2ac8f..ad32fd1 100644 --- a/ql/src/test/results/clientpositive/perf/query32.q.out +++ b/ql/src/test/results/clientpositive/perf/query32.q.out @@ -46,160 +46,87 @@ Reducer 8 <- Map 10 (SIMPLE_EDGE), Map 7 (SIMPLE_EDGE) Reducer 9 <- Reducer 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 4 - File Output Operator [FS_37] - compressed:false - Statistics:Num rows: 1 Data size: 112 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_35] - | aggregations:["sum(VALUE._col0)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 112 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_34] - sort order: - Statistics:Num rows: 1 Data size: 112 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: decimal(17,2)) - Group By Operator [GBY_33] - aggregations:["sum(_col1)"] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 112 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_32] - outputColumnNames:["_col1"] - Statistics:Num rows: 169400 Data size: 243305505 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_31] - predicate:(_col1 > CAST( _col5 AS decimal(20,15))) (type: boolean) - Statistics:Num rows: 169400 Data size: 243305505 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_59] - | condition map:[{"":"Inner Join 0 to 1"},{"":"Inner Join 1 to 2"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)","2":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col5"] - | Statistics:Num rows: 508200 Data size: 729916517 Basic stats: COMPLETE Column stats: NONE - |<-Map 6 [SIMPLE_EDGE] - | Reduce Output Operator [RS_28] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_12] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_54] - | predicate:((i_manufact_id = 436) and i_item_sk is not null) (type: boolean) - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_10] - | alias:i - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - | Reduce Output Operator [RS_27] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: decimal(7,2)) - | Select Operator [SEL_9] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_57] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col2"] - | | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | |<-Map 1 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_6] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col1 (type: int), _col2 (type: decimal(7,2)) - | | Select Operator [SEL_2] - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_52] - | | predicate:(cs_sold_date_sk is not null and cs_item_sk is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_0] - | | alias:cs - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 5 [SIMPLE_EDGE] - | Reduce Output Operator [RS_7] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_5] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_53] - | predicate:(d_date BETWEEN '2000-01-27' AND '2000-04-27' and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_3] - | alias:d - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 9 [SIMPLE_EDGE] - Reduce Output Operator [RS_29] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: double) - Select Operator [SEL_26] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_25] - | aggregations:["avg(VALUE._col0)"] - | keys:KEY._col0 (type: int) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_24] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: struct) - Group By Operator [GBY_23] - aggregations:["avg(_col2)"] - keys:_col1 (type: int) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_58] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2"] - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_20] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_18] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_56] - | predicate:(d_date BETWEEN '2000-01-27' AND '2000-04-27' and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_16] - | alias:d - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_19] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col1 (type: int), _col2 (type: decimal(7,2)) - Select Operator [SEL_15] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_55] - predicate:(cs_sold_date_sk is not null and cs_item_sk is not null) (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_13] - alias:cs - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 4 + File Output Operator [FS_37] + Group By Operator [GBY_35] (rows=1 width=112) + Output:["_col0"],aggregations:["sum(VALUE._col0)"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_34] + Group By Operator [GBY_33] (rows=1 width=112) + Output:["_col0"],aggregations:["sum(_col1)"] + Select Operator [SEL_32] (rows=169400 width=1436) + Output:["_col1"] + Filter Operator [FIL_31] (rows=169400 width=1436) + predicate:(_col1 > CAST( _col5 AS decimal(20,15))) + Merge Join Operator [MERGEJOIN_59] (rows=508200 width=1436) + Output:["_col1","_col5"],keys:{"0":"_col0","1":"_col0","2":"_col0"} + <-Map 6 [SIMPLE_EDGE] + SHUFFLE [RS_28] + PartitionCols:_col0 + Select Operator [SEL_12] (rows=231000 width=1436) + Output:["_col0"] + Filter Operator [FIL_54] (rows=231000 width=1436) + predicate:((i_manufact_id = 436) and i_item_sk is not null) + TableScan [TS_10] (rows=462000 width=1436) + default@item,i,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_manufact_id"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_27] + PartitionCols:_col0 + Select Operator [SEL_9] (rows=40176 width=1119) + Output:["_col0","_col1"] + Merge Join Operator [MERGEJOIN_57] (rows=40176 width=1119) + Output:["_col1","_col2"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_6] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_52] (rows=1 width=0) + predicate:(cs_sold_date_sk is not null and cs_item_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@catalog_sales,cs,Tbl:PARTIAL,Col:NONE,Output:["cs_sold_date_sk","cs_item_sk","cs_ext_discount_amt"] + <-Map 5 [SIMPLE_EDGE] + SHUFFLE [RS_7] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_53] (rows=36524 width=1119) + predicate:(d_date BETWEEN '2000-01-27' AND '2000-04-27' and d_date_sk is not null) + TableScan [TS_3] (rows=73049 width=1119) + default@date_dim,d,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date"] + <-Reducer 9 [SIMPLE_EDGE] + SHUFFLE [RS_29] + PartitionCols:_col0 + Select Operator [SEL_26] (rows=20088 width=1119) + Output:["_col0","_col1"] + Group By Operator [GBY_25] (rows=20088 width=1119) + Output:["_col0","_col1"],aggregations:["avg(VALUE._col0)"],keys:KEY._col0 + <-Reducer 8 [SIMPLE_EDGE] + SHUFFLE [RS_24] + PartitionCols:_col0 + Group By Operator [GBY_23] (rows=40176 width=1119) + Output:["_col0","_col1"],aggregations:["avg(_col2)"],keys:_col1 + Merge Join Operator [MERGEJOIN_58] (rows=40176 width=1119) + Output:["_col1","_col2"],keys:{"0":"_col0","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_20] + PartitionCols:_col0 + Select Operator [SEL_18] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_56] (rows=36524 width=1119) + predicate:(d_date BETWEEN '2000-01-27' AND '2000-04-27' and d_date_sk is not null) + TableScan [TS_16] (rows=73049 width=1119) + default@date_dim,d,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date"] + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_15] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_55] (rows=1 width=0) + predicate:(cs_sold_date_sk is not null and cs_item_sk is not null) + TableScan [TS_13] (rows=1 width=0) + default@catalog_sales,cs,Tbl:PARTIAL,Col:NONE,Output:["cs_sold_date_sk","cs_item_sk","cs_ext_discount_amt"] diff --git a/ql/src/test/results/clientpositive/perf/query34.q.out b/ql/src/test/results/clientpositive/perf/query34.q.out index 1cb7c28..b8fadb9 100644 --- a/ql/src/test/results/clientpositive/perf/query34.q.out +++ b/ql/src/test/results/clientpositive/perf/query34.q.out @@ -13,165 +13,88 @@ Reducer 6 <- Map 11 (SIMPLE_EDGE), Reducer 5 (SIMPLE_EDGE) Reducer 7 <- Reducer 6 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 7 - File Output Operator [FS_37] - compressed:false - Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_36] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_35] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string) - sort order:+++- - Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: int), _col5 (type: bigint) - Select Operator [SEL_34] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_60] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2","_col4","_col5","_col6","_col7"] - | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_32] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string) - | Select Operator [SEL_30] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_56] - | predicate:c_customer_sk is not null (type: boolean) - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_28] - | alias:customer - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_31] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 12153 Data size: 13599611 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col2 (type: bigint) - Filter Operator [FIL_26] - predicate:_col2 BETWEEN 15 AND 20 (type: boolean) - Statistics:Num rows: 12153 Data size: 13599611 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_25] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 24306 Data size: 27199223 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_24] - | aggregations:["count(VALUE._col0)"] - | keys:KEY._col0 (type: int), KEY._col1 (type: int) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 24306 Data size: 27199223 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_23] - key expressions:_col0 (type: int), _col1 (type: int) - Map-reduce partition columns:_col0 (type: int), _col1 (type: int) - sort order:++ - Statistics:Num rows: 48612 Data size: 54398446 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: bigint) - Group By Operator [GBY_22] - aggregations:["count()"] - keys:_col1 (type: int), _col4 (type: int) - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 48612 Data size: 54398446 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_59] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col4"] - | Statistics:Num rows: 48612 Data size: 54398446 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 800 Data size: 85600 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_11] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 800 Data size: 85600 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_55] - | predicate:((((CASE WHEN ((hd_vehicle_count > 0)) THEN ((UDFToDouble(hd_dep_count) / UDFToDouble(hd_vehicle_count))) ELSE (null) END > 1.2) and ((hd_buy_potential = '1001-5000') or (hd_buy_potential = '5001-10000'))) and (hd_vehicle_count > 0)) and hd_demo_sk is not null) (type: boolean) - | Statistics:Num rows: 800 Data size: 85600 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:household_demographics - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 44193 Data size: 49453132 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col4 (type: int) - Merge Join Operator [MERGEJOIN_58] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col4"] - | Statistics:Num rows: 44193 Data size: 49453132 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_16] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_8] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_54] - | predicate:((s_county) IN ('Kittitas County', 'Adams County', 'Richland County', 'Furnas County', 'Orange County', 'Appanoose County', 'Franklin Parish', 'Tehama County') and s_store_sk is not null) (type: boolean) - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:store - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_15] - key expressions:_col3 (type: int) - Map-reduce partition columns:_col3 (type: int) - sort order:+ - Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col2 (type: int), _col4 (type: int) - Merge Join Operator [MERGEJOIN_57] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_12] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_52] - | predicate:(((ss_sold_date_sk is not null and ss_store_sk is not null) and ss_hdemo_sk is not null) and ss_customer_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_13] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_53] - predicate:(((d_year) IN (1998, 1999, 2000) and (d_dom BETWEEN 1 AND 3 or d_dom BETWEEN 25 AND 28)) and d_date_sk is not null) (type: boolean) - Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:date_dim - Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 7 + File Output Operator [FS_37] + Select Operator [SEL_36] (rows=88000001 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_35] + Select Operator [SEL_34] (rows=88000001 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Merge Join Operator [MERGEJOIN_60] (rows=88000001 width=860) + Output:["_col0","_col2","_col4","_col5","_col6","_col7"],keys:{"0":"_col1","1":"_col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_32] + PartitionCols:_col0 + Select Operator [SEL_30] (rows=80000000 width=860) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_56] (rows=80000000 width=860) + predicate:c_customer_sk is not null + TableScan [TS_28] (rows=80000000 width=860) + default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_salutation","c_first_name","c_last_name","c_preferred_cust_flag"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_31] + PartitionCols:_col1 + Filter Operator [FIL_26] (rows=12153 width=1119) + predicate:_col2 BETWEEN 15 AND 20 + Select Operator [SEL_25] (rows=24306 width=1119) + Output:["_col0","_col1","_col2"] + Group By Operator [GBY_24] (rows=24306 width=1119) + Output:["_col0","_col1","_col2"],aggregations:["count(VALUE._col0)"],keys:KEY._col0, KEY._col1 + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_23] + PartitionCols:_col0, _col1 + Group By Operator [GBY_22] (rows=48612 width=1119) + Output:["_col0","_col1","_col2"],aggregations:["count()"],keys:_col1, _col4 + Merge Join Operator [MERGEJOIN_59] (rows=48612 width=1119) + Output:["_col1","_col4"],keys:{"0":"_col2","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=800 width=107) + Output:["_col0"] + Filter Operator [FIL_55] (rows=800 width=107) + predicate:((((CASE WHEN ((hd_vehicle_count > 0)) THEN ((UDFToDouble(hd_dep_count) / UDFToDouble(hd_vehicle_count))) ELSE (null) END > 1.2) and ((hd_buy_potential = '1001-5000') or (hd_buy_potential = '5001-10000'))) and (hd_vehicle_count > 0)) and hd_demo_sk is not null) + TableScan [TS_9] (rows=7200 width=107) + default@household_demographics,household_demographics,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_buy_potential","hd_dep_count","hd_vehicle_count"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_58] (rows=44193 width=1119) + Output:["_col1","_col2","_col4"],keys:{"0":"_col3","1":"_col0"} + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=852 width=1910) + Output:["_col0"] + Filter Operator [FIL_54] (rows=852 width=1910) + predicate:((s_county) IN ('Kittitas County', 'Adams County', 'Richland County', 'Furnas County', 'Orange County', 'Appanoose County', 'Franklin Parish', 'Tehama County') and s_store_sk is not null) + TableScan [TS_6] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_county"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_57] (rows=40176 width=1119) + Output:["_col1","_col2","_col3","_col4"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_52] (rows=1 width=0) + predicate:(((ss_sold_date_sk is not null and ss_store_sk is not null) and ss_hdemo_sk is not null) and ss_customer_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_customer_sk","ss_hdemo_sk","ss_store_sk","ss_ticket_number"] + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_53] (rows=36524 width=1119) + predicate:(((d_year) IN (1998, 1999, 2000) and (d_dom BETWEEN 1 AND 3 or d_dom BETWEEN 25 AND 28)) and d_date_sk is not null) + TableScan [TS_3] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_dom"] diff --git a/ql/src/test/results/clientpositive/perf/query39.q.out b/ql/src/test/results/clientpositive/perf/query39.q.out index f4ad98c..b24b8ca 100644 --- a/ql/src/test/results/clientpositive/perf/query39.q.out +++ b/ql/src/test/results/clientpositive/perf/query39.q.out @@ -17,285 +17,151 @@ Reducer 6 <- Reducer 15 (SIMPLE_EDGE), Reducer 5 (SIMPLE_EDGE) Reducer 7 <- Reducer 6 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 7 - File Output Operator [FS_62] - compressed:false - Statistics:Num rows: 112735 Data size: 161919824 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_61] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] - | Statistics:Num rows: 112735 Data size: 161919824 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_60] - key expressions:_col0 (type: int), _col1 (type: int), 3 (type: int), _col3 (type: double), _col4 (type: double), _col7 (type: int), _col8 (type: double), _col9 (type: double) - sort order:++++++++ - Statistics:Num rows: 112735 Data size: 161919824 Basic stats: COMPLETE Column stats: NONE - value expressions:_col5 (type: int), _col6 (type: int) - Select Operator [SEL_59] - outputColumnNames:["_col0","_col1","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] - Statistics:Num rows: 112735 Data size: 161919824 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_104] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int), _col0 (type: int)","1":"_col2 (type: int), _col1 (type: int)"} - | outputColumnNames:["_col0","_col1","_col2","_col3","_col5","_col6","_col7","_col8","_col9"] - | Statistics:Num rows: 112735 Data size: 161919824 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 15 [SIMPLE_EDGE] - | Reduce Output Operator [RS_57] - | key expressions:_col2 (type: int), _col1 (type: int) - | Map-reduce partition columns:_col2 (type: int), _col1 (type: int) - | sort order:++ - | Statistics:Num rows: 102487 Data size: 147199837 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: int), _col4 (type: double), _col5 (type: double) - | Select Operator [SEL_55] - | outputColumnNames:["_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 102487 Data size: 147199837 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_54] - | predicate:(CASE (_col5) WHEN (0) THEN (0) ELSE ((_col4 / _col5)) END > 1.0) (type: boolean) - | Statistics:Num rows: 102487 Data size: 147199837 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_53] - | outputColumnNames:["_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 307461 Data size: 441599512 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_52] - | | aggregations:["stddev_samp(VALUE._col0)","avg(VALUE._col1)"] - | | keys:KEY._col0 (type: int), KEY._col1 (type: int), KEY._col2 (type: string), KEY._col3 (type: int) - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | | Statistics:Num rows: 307461 Data size: 441599512 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 14 [SIMPLE_EDGE] - | Reduce Output Operator [RS_51] - | key expressions:_col0 (type: int), _col1 (type: int), _col2 (type: string), _col3 (type: int) - | Map-reduce partition columns:_col0 (type: int), _col1 (type: int), _col2 (type: string), _col3 (type: int) - | sort order:++++ - | Statistics:Num rows: 614922 Data size: 883199024 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col4 (type: struct), _col5 (type: struct) - | Group By Operator [GBY_50] - | aggregations:["stddev_samp(_col3)","avg(_col3)"] - | keys:_col4 (type: int), _col5 (type: int), _col6 (type: string), _col9 (type: int) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 614922 Data size: 883199024 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_49] - | outputColumnNames:["_col4","_col5","_col6","_col9","_col3"] - | Statistics:Num rows: 614922 Data size: 883199024 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_103] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col3","_col4","_col5","_col6"] - | | Statistics:Num rows: 614922 Data size: 883199024 Basic stats: COMPLETE Column stats: NONE - | |<-Map 18 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_47] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_39] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_96] - | | predicate:(((d_moy = 4) and d_date_sk is not null) and (d_year = 1999)) (type: boolean) - | | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_37] - | | alias:date_dim - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 13 [SIMPLE_EDGE] - | Reduce Output Operator [RS_46] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: int), _col4 (type: int), _col5 (type: int), _col6 (type: string) - | Merge Join Operator [MERGEJOIN_102] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col0","_col3","_col4","_col5","_col6"] - | | Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - | |<-Map 17 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_44] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: string) - | | Select Operator [SEL_36] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_95] - | | predicate:w_warehouse_sk is not null (type: boolean) - | | Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_34] - | | alias:warehouse - | | Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 12 [SIMPLE_EDGE] - | Reduce Output Operator [RS_43] - | key expressions:_col2 (type: int) - | Map-reduce partition columns:_col2 (type: int) - | sort order:+ - | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: int), _col3 (type: int), _col4 (type: int) - | Merge Join Operator [MERGEJOIN_101] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col0","_col2","_col3","_col4"] - | | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - | |<-Map 11 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_40] - | | key expressions:_col1 (type: int) - | | Map-reduce partition columns:_col1 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col0 (type: int), _col2 (type: int), _col3 (type: int) - | | Select Operator [SEL_30] - | | outputColumnNames:["_col0","_col1","_col2","_col3"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_93] - | | predicate:((inv_item_sk is not null and inv_warehouse_sk is not null) and inv_date_sk is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_28] - | | alias:inventory - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 16 [SIMPLE_EDGE] - | Reduce Output Operator [RS_41] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_33] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_94] - | predicate:i_item_sk is not null (type: boolean) - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_31] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_56] - key expressions:_col1 (type: int), _col0 (type: int) - Map-reduce partition columns:_col1 (type: int), _col0 (type: int) - sort order:++ - Statistics:Num rows: 102487 Data size: 147199837 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: double), _col3 (type: double) - Select Operator [SEL_27] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 102487 Data size: 147199837 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_26] - predicate:(CASE (_col4) WHEN (0) THEN (0) ELSE ((_col5 / _col4)) END > 1.0) (type: boolean) - Statistics:Num rows: 102487 Data size: 147199837 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_97] - outputColumnNames:["_col1","_col2","_col4","_col5"] - Statistics:Num rows: 307461 Data size: 441599512 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_25] - | aggregations:["avg(VALUE._col0)","stddev_samp(VALUE._col1)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: int), KEY._col3 (type: int) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 307461 Data size: 441599512 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_24] - key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: int), _col3 (type: int) - Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: int), _col3 (type: int) - sort order:++++ - Statistics:Num rows: 614922 Data size: 883199024 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: struct), _col5 (type: struct) - Group By Operator [GBY_23] - aggregations:["avg(_col4)","stddev_samp(_col4)"] - keys:_col0 (type: string), _col1 (type: int), _col2 (type: int), 3 (type: int) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 614922 Data size: 883199024 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_21] - outputColumnNames:["_col0","_col1","_col2","_col4"] - Statistics:Num rows: 614922 Data size: 883199024 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_100] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 614922 Data size: 883199024 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_11] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_92] - | predicate:(((d_moy = 3) and d_date_sk is not null) and (d_year = 1999)) (type: boolean) - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: int), _col4 (type: int), _col5 (type: int), _col6 (type: string) - Merge Join Operator [MERGEJOIN_99] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_16] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_91] - | predicate:w_warehouse_sk is not null (type: boolean) - | Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:warehouse - | Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_15] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col3 (type: int), _col4 (type: int) - Merge Join Operator [MERGEJOIN_98] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2","_col3","_col4"] - | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_12] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col2 (type: int), _col3 (type: int) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_89] - | predicate:((inv_item_sk is not null and inv_warehouse_sk is not null) and inv_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:inventory - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_13] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_90] - predicate:i_item_sk is not null (type: boolean) - Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:item - Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 7 + File Output Operator [FS_62] + Select Operator [SEL_61] (rows=112735 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_60] + Select Operator [SEL_59] (rows=112735 width=1436) + Output:["_col0","_col1","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] + Merge Join Operator [MERGEJOIN_104] (rows=112735 width=1436) + Output:["_col0","_col1","_col2","_col3","_col5","_col6","_col7","_col8","_col9"],keys:{"0":"_col1, _col0","1":"_col2, _col1"} + <-Reducer 15 [SIMPLE_EDGE] + SHUFFLE [RS_57] + PartitionCols:_col2, _col1 + Select Operator [SEL_55] (rows=102487 width=1436) + Output:["_col1","_col2","_col3","_col4","_col5"] + Filter Operator [FIL_54] (rows=102487 width=1436) + predicate:(CASE (_col5) WHEN (0) THEN (0) ELSE ((_col4 / _col5)) END > 1.0) + Select Operator [SEL_53] (rows=307461 width=1436) + Output:["_col1","_col2","_col3","_col4","_col5"] + Group By Operator [GBY_52] (rows=307461 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["stddev_samp(VALUE._col0)","avg(VALUE._col1)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3 + <-Reducer 14 [SIMPLE_EDGE] + SHUFFLE [RS_51] + PartitionCols:_col0, _col1, _col2, _col3 + Group By Operator [GBY_50] (rows=614922 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["stddev_samp(_col3)","avg(_col3)"],keys:_col4, _col5, _col6, _col9 + Select Operator [SEL_49] (rows=614922 width=1436) + Output:["_col4","_col5","_col6","_col9","_col3"] + Merge Join Operator [MERGEJOIN_103] (rows=614922 width=1436) + Output:["_col3","_col4","_col5","_col6"],keys:{"0":"_col0","1":"_col0"} + <-Map 18 [SIMPLE_EDGE] + SHUFFLE [RS_47] + PartitionCols:_col0 + Select Operator [SEL_39] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_96] (rows=18262 width=1119) + predicate:(((d_moy = 4) and d_date_sk is not null) and (d_year = 1999)) + TableScan [TS_37] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"] + <-Reducer 13 [SIMPLE_EDGE] + SHUFFLE [RS_46] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_102] (rows=559020 width=1436) + Output:["_col0","_col3","_col4","_col5","_col6"],keys:{"0":"_col2","1":"_col0"} + <-Map 17 [SIMPLE_EDGE] + SHUFFLE [RS_44] + PartitionCols:_col0 + Select Operator [SEL_36] (rows=27 width=1029) + Output:["_col0","_col1"] + Filter Operator [FIL_95] (rows=27 width=1029) + predicate:w_warehouse_sk is not null + TableScan [TS_34] (rows=27 width=1029) + default@warehouse,warehouse,Tbl:COMPLETE,Col:NONE,Output:["w_warehouse_sk","w_warehouse_name"] + <-Reducer 12 [SIMPLE_EDGE] + SHUFFLE [RS_43] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_101] (rows=508200 width=1436) + Output:["_col0","_col2","_col3","_col4"],keys:{"0":"_col1","1":"_col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_40] + PartitionCols:_col1 + Select Operator [SEL_30] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_93] (rows=1 width=0) + predicate:((inv_item_sk is not null and inv_warehouse_sk is not null) and inv_date_sk is not null) + TableScan [TS_28] (rows=1 width=0) + default@inventory,inventory,Tbl:PARTIAL,Col:NONE,Output:["inv_date_sk","inv_item_sk","inv_warehouse_sk","inv_quantity_on_hand"] + <-Map 16 [SIMPLE_EDGE] + SHUFFLE [RS_41] + PartitionCols:_col0 + Select Operator [SEL_33] (rows=462000 width=1436) + Output:["_col0"] + Filter Operator [FIL_94] (rows=462000 width=1436) + predicate:i_item_sk is not null + TableScan [TS_31] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_56] + PartitionCols:_col1, _col0 + Select Operator [SEL_27] (rows=102487 width=1436) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_26] (rows=102487 width=1436) + predicate:(CASE (_col4) WHEN (0) THEN (0) ELSE ((_col5 / _col4)) END > 1.0) + Select Operator [SEL_97] (rows=307461 width=1436) + Output:["_col1","_col2","_col4","_col5"] + Group By Operator [GBY_25] (rows=307461 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["avg(VALUE._col0)","stddev_samp(VALUE._col1)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3 + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_24] + PartitionCols:_col0, _col1, _col2, _col3 + Group By Operator [GBY_23] (rows=614922 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["avg(_col4)","stddev_samp(_col4)"],keys:_col0, _col1, _col2, 3 + Select Operator [SEL_21] (rows=614922 width=1436) + Output:["_col0","_col1","_col2","_col4"] + Merge Join Operator [MERGEJOIN_100] (rows=614922 width=1436) + Output:["_col3","_col4","_col5","_col6"],keys:{"0":"_col0","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_92] (rows=18262 width=1119) + predicate:(((d_moy = 3) and d_date_sk is not null) and (d_year = 1999)) + TableScan [TS_9] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_99] (rows=559020 width=1436) + Output:["_col0","_col3","_col4","_col5","_col6"],keys:{"0":"_col2","1":"_col0"} + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=27 width=1029) + Output:["_col0","_col1"] + Filter Operator [FIL_91] (rows=27 width=1029) + predicate:w_warehouse_sk is not null + TableScan [TS_6] (rows=27 width=1029) + default@warehouse,warehouse,Tbl:COMPLETE,Col:NONE,Output:["w_warehouse_sk","w_warehouse_name"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_98] (rows=508200 width=1436) + Output:["_col0","_col2","_col3","_col4"],keys:{"0":"_col1","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col1 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_89] (rows=1 width=0) + predicate:((inv_item_sk is not null and inv_warehouse_sk is not null) and inv_date_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@inventory,inventory,Tbl:PARTIAL,Col:NONE,Output:["inv_date_sk","inv_item_sk","inv_warehouse_sk","inv_quantity_on_hand"] + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=462000 width=1436) + Output:["_col0"] + Filter Operator [FIL_90] (rows=462000 width=1436) + predicate:i_item_sk is not null + TableScan [TS_3] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk"] PREHOOK: query: with inv as (select w_warehouse_name,w_warehouse_sk,i_item_sk,d_moy ,stdev,mean, case mean when 0 then null else stdev/mean end cov from(select w_warehouse_name,w_warehouse_sk,i_item_sk,d_moy ,stddev_samp(inv_quantity_on_hand) stdev,avg(inv_quantity_on_hand) mean from inventory ,item ,warehouse ,date_dim where inv_item_sk = i_item_sk and inv_warehouse_sk = w_warehouse_sk and inv_date_sk = d_date_sk and d_year =1999 group by w_warehouse_name,w_warehouse_sk,i_item_sk,d_moy) foo where case mean when 0 then 0 else stdev/mean end > 1) select inv1.w_warehouse_sk,inv1.i_item_sk,inv1.d_moy,inv1.mean, inv1.cov ,inv2.w_warehouse_sk,inv2.i_item_sk,inv2.d_moy,inv2.mean, inv2.cov from inv inv1,inv inv2 where inv1.i_item_sk = inv2.i_item_sk and inv1.w_warehouse_sk = inv2.w_warehouse_sk and inv1.d_moy=3 and inv2.d_moy=3+1 and inv1.cov > 1.5 order by inv1.w_warehouse_sk,inv1.i_item_sk,inv1.d_moy,inv1.mean,inv1.cov ,inv2.d_moy,inv2.mean, inv2.cov PREHOOK: type: QUERY diff --git a/ql/src/test/results/clientpositive/perf/query40.q.out b/ql/src/test/results/clientpositive/perf/query40.q.out index b2d6262..a21d086 100644 --- a/ql/src/test/results/clientpositive/perf/query40.q.out +++ b/ql/src/test/results/clientpositive/perf/query40.q.out @@ -13,162 +13,84 @@ Reducer 6 <- Reducer 5 (SIMPLE_EDGE) Reducer 7 <- Reducer 6 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 7 - File Output Operator [FS_35] - compressed:false - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_34] - Number of rows:100 - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_33] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_32] - key expressions:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: decimal(23,2)), _col3 (type: decimal(23,2)) - Group By Operator [GBY_30] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_29] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: decimal(23,2)), _col3 (type: decimal(23,2)) - Group By Operator [GBY_28] - aggregations:["sum(_col2)","sum(_col3)"] - keys:_col0 (type: string), _col1 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_26] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_57] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col4","_col7","_col9","_col11","_col14"] - | Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_24] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_13] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_53] - | predicate:(d_date BETWEEN '1998-03-09' AND '1998-05-08' and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_11] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_23] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: decimal(7,2)), _col7 (type: decimal(7,2)), _col9 (type: string), _col11 (type: string) - Merge Join Operator [MERGEJOIN_56] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col4","_col7","_col9","_col11"] - | Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_21] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_10] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_52] - | predicate:(i_current_price BETWEEN 0.99 AND 1.49 and i_item_sk is not null) (type: boolean) - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_8] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_20] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 29 Data size: 30582 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col4 (type: decimal(7,2)), _col7 (type: decimal(7,2)), _col9 (type: string) - Merge Join Operator [MERGEJOIN_55] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2","_col4","_col7","_col9"] - | Statistics:Num rows: 29 Data size: 30582 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_18] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_7] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_51] - | predicate:w_warehouse_sk is not null (type: boolean) - | Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_5] - | alias:warehouse - | Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_17] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col0 (type: int), _col2 (type: int), _col4 (type: decimal(7,2)), _col7 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_54] - | condition map:[{"":"Left Outer Join0 to 1"}] - | keys:{"0":"_col3 (type: int), _col2 (type: int)","1":"_col1 (type: int), _col0 (type: int)"} - | outputColumnNames:["_col0","_col1","_col2","_col4","_col7"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_14] - | key expressions:_col3 (type: int), _col2 (type: int) - | Map-reduce partition columns:_col3 (type: int), _col2 (type: int) - | sort order:++ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col1 (type: int), _col4 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_49] - | predicate:((cs_warehouse_sk is not null and cs_item_sk is not null) and cs_sold_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:catalog_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_15] - key expressions:_col1 (type: int), _col0 (type: int) - Map-reduce partition columns:_col1 (type: int), _col0 (type: int) - sort order:++ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col2 (type: decimal(7,2)) - Select Operator [SEL_4] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_3] - alias:catalog_returns - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 7 + File Output Operator [FS_35] + Limit [LIM_34] (rows=100 width=1436) + Number of rows:100 + Select Operator [SEL_33] (rows=139755 width=1436) + Output:["_col0","_col1","_col2","_col3"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_32] + Group By Operator [GBY_30] (rows=139755 width=1436) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"],keys:KEY._col0, KEY._col1 + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_29] + PartitionCols:_col0, _col1 + Group By Operator [GBY_28] (rows=279510 width=1436) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(_col2)","sum(_col3)"],keys:_col0, _col1 + Select Operator [SEL_26] (rows=279510 width=1436) + Output:["_col0","_col1","_col2","_col3"] + Merge Join Operator [MERGEJOIN_57] (rows=279510 width=1436) + Output:["_col4","_col7","_col9","_col11","_col14"],keys:{"0":"_col0","1":"_col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_24] + PartitionCols:_col0 + Select Operator [SEL_13] (rows=36524 width=1119) + Output:["_col0","_col1"] + Filter Operator [FIL_53] (rows=36524 width=1119) + predicate:(d_date BETWEEN '1998-03-09' AND '1998-05-08' and d_date_sk is not null) + TableScan [TS_11] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_23] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_56] (rows=254100 width=1436) + Output:["_col0","_col4","_col7","_col9","_col11"],keys:{"0":"_col2","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_21] + PartitionCols:_col0 + Select Operator [SEL_10] (rows=231000 width=1436) + Output:["_col0","_col1"] + Filter Operator [FIL_52] (rows=231000 width=1436) + predicate:(i_current_price BETWEEN 0.99 AND 1.49 and i_item_sk is not null) + TableScan [TS_8] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id","i_current_price"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_20] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_55] (rows=29 width=1054) + Output:["_col0","_col2","_col4","_col7","_col9"],keys:{"0":"_col1","1":"_col0"} + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col0 + Select Operator [SEL_7] (rows=27 width=1029) + Output:["_col0","_col1"] + Filter Operator [FIL_51] (rows=27 width=1029) + predicate:w_warehouse_sk is not null + TableScan [TS_5] (rows=27 width=1029) + default@warehouse,warehouse,Tbl:COMPLETE,Col:NONE,Output:["w_warehouse_sk","w_state"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_17] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_54] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col4","_col7"],keys:{"0":"_col3, _col2","1":"_col1, _col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_14] + PartitionCols:_col3, _col2 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_49] (rows=1 width=0) + predicate:((cs_warehouse_sk is not null and cs_item_sk is not null) and cs_sold_date_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@catalog_sales,catalog_sales,Tbl:PARTIAL,Col:NONE,Output:["cs_sold_date_sk","cs_warehouse_sk","cs_item_sk","cs_order_number","cs_sales_price"] + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col1, _col0 + Select Operator [SEL_4] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + TableScan [TS_3] (rows=1 width=0) + default@catalog_returns,catalog_returns,Tbl:PARTIAL,Col:NONE,Output:["cr_item_sk","cr_order_number","cr_refunded_cash"] diff --git a/ql/src/test/results/clientpositive/perf/query42.q.out b/ql/src/test/results/clientpositive/perf/query42.q.out index 94f7e32..bfa16d5 100644 --- a/ql/src/test/results/clientpositive/perf/query42.q.out +++ b/ql/src/test/results/clientpositive/perf/query42.q.out @@ -11,110 +11,60 @@ Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 5 - File Output Operator [FS_24] - compressed:false - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_23] - Number of rows:100 - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_22] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 127050 Data size: 182479129 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_21] - key expressions:_col3 (type: decimal(17,2)), 1998 (type: int), _col1 (type: int), _col2 (type: string) - sort order:-+++ - Statistics:Num rows: 127050 Data size: 182479129 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_20] - outputColumnNames:["_col1","_col2","_col3"] - Statistics:Num rows: 127050 Data size: 182479129 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_19] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: int), KEY._col1 (type: int), KEY._col2 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 127050 Data size: 182479129 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col0 (type: int), _col1 (type: int), _col2 (type: string) - Map-reduce partition columns:_col0 (type: int), _col1 (type: int), _col2 (type: string) - sort order:+++ - Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: decimal(17,2)) - Group By Operator [GBY_17] - aggregations:["sum(_col3)"] - keys:1998 (type: int), _col1 (type: int), _col2 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_15] - outputColumnNames:["_col1","_col2","_col3"] - Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_34] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col4 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col5","_col7","_col8"] - | Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - | Reduce Output Operator [RS_13] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: string) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_32] - | predicate:((i_manager_id = 1) and i_item_sk is not null) (type: boolean) - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_12] - key expressions:_col4 (type: int) - Map-reduce partition columns:_col4 (type: int) - sort order:+ - Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - value expressions:_col5 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_33] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col4","_col5"] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_9] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_2] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_30] - | predicate:(((d_year = 1998) and (d_moy = 12)) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:dt - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Map 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col1 (type: int), _col2 (type: decimal(7,2)) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_31] - predicate:(ss_sold_date_sk is not null and ss_item_sk is not null) (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_3] - alias:store_sales - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 5 + File Output Operator [FS_24] + Limit [LIM_23] (rows=100 width=1436) + Number of rows:100 + Select Operator [SEL_22] (rows=127050 width=1436) + Output:["_col0","_col1","_col2","_col3"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_21] + Select Operator [SEL_20] (rows=127050 width=1436) + Output:["_col1","_col2","_col3"] + Group By Operator [GBY_19] (rows=127050 width=1436) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_17] (rows=254100 width=1436) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(_col3)"],keys:1998, _col1, _col2 + Select Operator [SEL_15] (rows=254100 width=1436) + Output:["_col1","_col2","_col3"] + Merge Join Operator [MERGEJOIN_34] (rows=254100 width=1436) + Output:["_col5","_col7","_col8"],keys:{"0":"_col4","1":"_col0"} + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=231000 width=1436) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_32] (rows=231000 width=1436) + predicate:((i_manager_id = 1) and i_item_sk is not null) + TableScan [TS_6] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_category_id","i_category","i_manager_id"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col4 + Merge Join Operator [MERGEJOIN_33] (rows=20088 width=1119) + Output:["_col4","_col5"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_30] (rows=18262 width=1119) + predicate:(((d_year = 1998) and (d_moy = 12)) and d_date_sk is not null) + TableScan [TS_0] (rows=73049 width=1119) + default@date_dim,dt,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"] + <-Map 6 [SIMPLE_EDGE] + SHUFFLE [RS_10] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_31] (rows=1 width=0) + predicate:(ss_sold_date_sk is not null and ss_item_sk is not null) + TableScan [TS_3] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_ext_sales_price"] diff --git a/ql/src/test/results/clientpositive/perf/query43.q.out b/ql/src/test/results/clientpositive/perf/query43.q.out index 7fa4f53..926d4a2 100644 --- a/ql/src/test/results/clientpositive/perf/query43.q.out +++ b/ql/src/test/results/clientpositive/perf/query43.q.out @@ -11,108 +11,58 @@ Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 5 - File Output Operator [FS_24] - compressed:false - Statistics:Num rows: 100 Data size: 111900 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_23] - Number of rows:100 - Statistics:Num rows: 100 Data size: 111900 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_22] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] - | Statistics:Num rows: 22096 Data size: 24726006 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_21] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: decimal(17,2)), _col3 (type: decimal(17,2)), _col4 (type: decimal(17,2)), _col5 (type: decimal(17,2)), _col6 (type: decimal(17,2)), _col7 (type: decimal(17,2)), _col8 (type: decimal(17,2)) - sort order:+++++++++ - Statistics:Num rows: 22096 Data size: 24726006 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_19] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)","sum(VALUE._col3)","sum(VALUE._col4)","sum(VALUE._col5)","sum(VALUE._col6)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] - | Statistics:Num rows: 22096 Data size: 24726006 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 44193 Data size: 49453132 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: decimal(17,2)), _col3 (type: decimal(17,2)), _col4 (type: decimal(17,2)), _col5 (type: decimal(17,2)), _col6 (type: decimal(17,2)), _col7 (type: decimal(17,2)), _col8 (type: decimal(17,2)) - Group By Operator [GBY_17] - aggregations:["sum(_col2)","sum(_col3)","sum(_col4)","sum(_col5)","sum(_col6)","sum(_col7)","sum(_col8)"] - keys:_col0 (type: string), _col1 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] - Statistics:Num rows: 44193 Data size: 49453132 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_15] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] - Statistics:Num rows: 44193 Data size: 49453132 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_34] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col4 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col2","_col5","_col7","_col8"] - | Statistics:Num rows: 44193 Data size: 49453132 Basic stats: COMPLETE Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - | Reduce Output Operator [RS_13] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_32] - | predicate:((s_gmt_offset = -6) and s_store_sk is not null) (type: boolean) - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:store - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_12] - key expressions:_col4 (type: int) - Map-reduce partition columns:_col4 (type: int) - sort order:+ - Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: string), _col5 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_33] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col2","_col4","_col5"] - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_9] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col2 (type: string) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col2"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_30] - | predicate:((d_year = 1998) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Map 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col1 (type: int), _col2 (type: decimal(7,2)) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_31] - predicate:(ss_sold_date_sk is not null and ss_store_sk is not null) (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_3] - alias:store_sales - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 5 + File Output Operator [FS_24] + Limit [LIM_23] (rows=100 width=1119) + Number of rows:100 + Select Operator [SEL_22] (rows=22096 width=1119) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_21] + Group By Operator [GBY_19] (rows=22096 width=1119) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)","sum(VALUE._col3)","sum(VALUE._col4)","sum(VALUE._col5)","sum(VALUE._col6)"],keys:KEY._col0, KEY._col1 + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col0, _col1 + Group By Operator [GBY_17] (rows=44193 width=1119) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"],aggregations:["sum(_col2)","sum(_col3)","sum(_col4)","sum(_col5)","sum(_col6)","sum(_col7)","sum(_col8)"],keys:_col0, _col1 + Select Operator [SEL_15] (rows=44193 width=1119) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] + Merge Join Operator [MERGEJOIN_34] (rows=44193 width=1119) + Output:["_col2","_col5","_col7","_col8"],keys:{"0":"_col4","1":"_col0"} + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=852 width=1910) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_32] (rows=852 width=1910) + predicate:((s_gmt_offset = -6) and s_store_sk is not null) + TableScan [TS_6] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_store_id","s_store_name","s_gmt_offset"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col4 + Merge Join Operator [MERGEJOIN_33] (rows=40176 width=1119) + Output:["_col2","_col4","_col5"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=36524 width=1119) + Output:["_col0","_col2"] + Filter Operator [FIL_30] (rows=36524 width=1119) + predicate:((d_year = 1998) and d_date_sk is not null) + TableScan [TS_0] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_day_name"] + <-Map 6 [SIMPLE_EDGE] + SHUFFLE [RS_10] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_31] (rows=1 width=0) + predicate:(ss_sold_date_sk is not null and ss_store_sk is not null) + TableScan [TS_3] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_store_sk","ss_sales_price"] diff --git a/ql/src/test/results/clientpositive/perf/query45.q.out b/ql/src/test/results/clientpositive/perf/query45.q.out index f55f20c..dbfb867 100644 --- a/ql/src/test/results/clientpositive/perf/query45.q.out +++ b/ql/src/test/results/clientpositive/perf/query45.q.out @@ -14,197 +14,104 @@ Reducer 6 <- Reducer 5 (SIMPLE_EDGE) Reducer 7 <- Reducer 6 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 7 - File Output Operator [FS_44] - compressed:false - Statistics:Num rows: 100 Data size: 86000 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_43] - Number of rows:100 - Statistics:Num rows: 100 Data size: 86000 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_42] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 58564004 Data size: 50366227250 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_41] - key expressions:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 58564004 Data size: 50366227250 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: decimal(17,2)) - Select Operator [SEL_40] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 58564004 Data size: 50366227250 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_39] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 58564004 Data size: 50366227250 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_38] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 117128008 Data size: 100732454500 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: decimal(17,2)) - Group By Operator [GBY_37] - aggregations:["sum(_col3)"] - keys:_col7 (type: string), _col8 (type: string) - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 117128008 Data size: 100732454500 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_36] - outputColumnNames:["_col7","_col8","_col3"] - Statistics:Num rows: 117128008 Data size: 100732454500 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_72] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col3","_col7","_col8"] - | Statistics:Num rows: 117128008 Data size: 100732454500 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 12 [SIMPLE_EDGE] - | Reduce Output Operator [RS_34] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_71] - | | condition map:[{"":"Left Semi Join 0 to 1"}] - | | keys:{"0":"_col1 (type: string)","1":"_col0 (type: string)"} - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - | |<-Map 11 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_20] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: int) - | | Select Operator [SEL_14] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_66] - | | predicate:(i_item_sk is not null and i_item_id is not null) (type: boolean) - | | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_12] - | | alias:item - | | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | |<-Map 13 [SIMPLE_EDGE] - | Reduce Output Operator [RS_21] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_19] - | keys:_col0 (type: string) - | outputColumnNames:["_col0"] - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_17] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_67] - | predicate:((i_item_sk) IN (2, 3, 5, 7, 11, 13, 17, 19, 23, 29) and i_item_id is not null) (type: boolean) - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_15] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_33] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 106480005 Data size: 91574956652 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: decimal(7,2)), _col7 (type: string), _col8 (type: string) - Merge Join Operator [MERGEJOIN_70] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col3","_col7","_col8"] - | Statistics:Num rows: 106480005 Data size: 91574956652 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_31] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_11] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_65] - | predicate:(((d_qoy = 2) and (d_year = 2000)) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_30] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col3 (type: decimal(7,2)), _col7 (type: string), _col8 (type: string) - Merge Join Operator [MERGEJOIN_69] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col5 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col1","_col3","_col7","_col8"] - | Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_28] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_64] - | predicate:ca_address_sk is not null (type: boolean) - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:customer_address - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_27] - key expressions:_col5 (type: int) - Map-reduce partition columns:_col5 (type: int) - sort order:+ - Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col1 (type: int), _col3 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_68] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col1","_col3","_col5"] - | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_24] - | key expressions:_col2 (type: int) - | Map-reduce partition columns:_col2 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col1 (type: int), _col3 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_62] - | predicate:((ws_bill_customer_sk is not null and ws_sold_date_sk is not null) and ws_item_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:web_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_25] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_63] - predicate:(c_customer_sk is not null and c_current_addr_sk is not null) (type: boolean) - Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:customer - Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 7 + File Output Operator [FS_44] + Limit [LIM_43] (rows=100 width=860) + Number of rows:100 + Select Operator [SEL_42] (rows=58564004 width=860) + Output:["_col0","_col1","_col2"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_41] + Select Operator [SEL_40] (rows=58564004 width=860) + Output:["_col0","_col1","_col2"] + Group By Operator [GBY_39] (rows=58564004 width=860) + Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1 + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_38] + PartitionCols:_col0, _col1 + Group By Operator [GBY_37] (rows=117128008 width=860) + Output:["_col0","_col1","_col2"],aggregations:["sum(_col3)"],keys:_col7, _col8 + Select Operator [SEL_36] (rows=117128008 width=860) + Output:["_col7","_col8","_col3"] + Merge Join Operator [MERGEJOIN_72] (rows=117128008 width=860) + Output:["_col3","_col7","_col8"],keys:{"0":"_col1","1":"_col0"} + <-Reducer 12 [SIMPLE_EDGE] + SHUFFLE [RS_34] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_71] (rows=508200 width=1436) + Output:["_col0"],keys:{"0":"_col1","1":"_col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_20] + PartitionCols:_col1 + Select Operator [SEL_14] (rows=462000 width=1436) + Output:["_col0","_col1"] + Filter Operator [FIL_66] (rows=462000 width=1436) + predicate:(i_item_sk is not null and i_item_id is not null) + TableScan [TS_12] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id"] + <-Map 13 [SIMPLE_EDGE] + SHUFFLE [RS_21] + PartitionCols:_col0 + Group By Operator [GBY_19] (rows=231000 width=1436) + Output:["_col0"],keys:_col0 + Select Operator [SEL_17] (rows=231000 width=1436) + Output:["_col0"] + Filter Operator [FIL_67] (rows=231000 width=1436) + predicate:((i_item_sk) IN (2, 3, 5, 7, 11, 13, 17, 19, 23, 29) and i_item_id is not null) + TableScan [TS_15] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_33] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_70] (rows=106480005 width=860) + Output:["_col1","_col3","_col7","_col8"],keys:{"0":"_col0","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_31] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_65] (rows=18262 width=1119) + predicate:(((d_qoy = 2) and (d_year = 2000)) and d_date_sk is not null) + TableScan [TS_9] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_qoy"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_30] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_69] (rows=96800003 width=860) + Output:["_col0","_col1","_col3","_col7","_col8"],keys:{"0":"_col5","1":"_col0"} + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_28] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=40000000 width=1014) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_64] (rows=40000000 width=1014) + predicate:ca_address_sk is not null + TableScan [TS_6] (rows=40000000 width=1014) + default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_county","ca_zip"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_27] + PartitionCols:_col5 + Merge Join Operator [MERGEJOIN_68] (rows=88000001 width=860) + Output:["_col0","_col1","_col3","_col5"],keys:{"0":"_col2","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_24] + PartitionCols:_col2 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_62] (rows=1 width=0) + predicate:((ws_bill_customer_sk is not null and ws_sold_date_sk is not null) and ws_item_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@web_sales,web_sales,Tbl:PARTIAL,Col:NONE,Output:["ws_sold_date_sk","ws_item_sk","ws_bill_customer_sk","ws_sales_price"] + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=80000000 width=860) + Output:["_col0","_col1"] + Filter Operator [FIL_63] (rows=80000000 width=860) + predicate:(c_customer_sk is not null and c_current_addr_sk is not null) + TableScan [TS_3] (rows=80000000 width=860) + default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_current_addr_sk"] diff --git a/ql/src/test/results/clientpositive/perf/query46.q.out b/ql/src/test/results/clientpositive/perf/query46.q.out index 0ded912..8a8b52d 100644 --- a/ql/src/test/results/clientpositive/perf/query46.q.out +++ b/ql/src/test/results/clientpositive/perf/query46.q.out @@ -15,227 +15,120 @@ Reducer 8 <- Map 15 (SIMPLE_EDGE), Reducer 7 (SIMPLE_EDGE) Reducer 9 <- Reducer 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 9 - File Output Operator [FS_50] - compressed:false - Statistics:Num rows: 100 Data size: 86000 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_49] - Number of rows:100 - Statistics:Num rows: 100 Data size: 86000 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_48] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_47] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: int) - sort order:+++++ - Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - value expressions:_col5 (type: decimal(17,2)), _col6 (type: decimal(17,2)) - Select Operator [SEL_46] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_45] - predicate:(_col10 <> _col2) (type: boolean) - Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_90] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col6 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2","_col3","_col4","_col7","_col8","_col10"] - | Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - |<-Map 15 [SIMPLE_EDGE] - | Reduce Output Operator [RS_43] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_38] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_84] - | predicate:ca_address_sk is not null (type: boolean) - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_36] - | alias:customer_address - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_42] - key expressions:_col6 (type: int) - Map-reduce partition columns:_col6 (type: int) - sort order:+ - Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col2 (type: string), _col3 (type: decimal(17,2)), _col4 (type: decimal(17,2)), _col7 (type: string), _col8 (type: string) - Merge Join Operator [MERGEJOIN_89] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2","_col3","_col4","_col6","_col7","_col8"] - | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - |<-Map 14 [SIMPLE_EDGE] - | Reduce Output Operator [RS_40] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: string), _col3 (type: string) - | Select Operator [SEL_35] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_83] - | predicate:(c_customer_sk is not null and c_current_addr_sk is not null) (type: boolean) - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_33] - | alias:customer - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_39] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col2 (type: string), _col3 (type: decimal(17,2)), _col4 (type: decimal(17,2)) - Select Operator [SEL_31] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_30] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] - | keys:KEY._col0 (type: int), KEY._col1 (type: int), KEY._col2 (type: int), KEY._col3 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_29] - key expressions:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: string) - Map-reduce partition columns:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: string) - sort order:++++ - Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: decimal(17,2)), _col5 (type: decimal(17,2)) - Group By Operator [GBY_28] - aggregations:["sum(_col6)","sum(_col7)"] - keys:_col1 (type: int), _col3 (type: int), _col5 (type: int), _col17 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_27] - outputColumnNames:["_col1","_col3","_col5","_col17","_col6","_col7"] - Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_88] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col3","_col5","_col6","_col7","_col17"] - | Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - |<-Map 13 [SIMPLE_EDGE] - | Reduce Output Operator [RS_25] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_14] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_82] - | predicate:ca_address_sk is not null (type: boolean) - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_12] - | alias:customer_address - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_24] - key expressions:_col3 (type: int) - Map-reduce partition columns:_col3 (type: int) - sort order:+ - Statistics:Num rows: 24305 Data size: 27199223 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col5 (type: int), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_87] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col3","_col5","_col6","_col7"] - | Statistics:Num rows: 24305 Data size: 27199223 Basic stats: COMPLETE Column stats: NONE - |<-Map 12 [SIMPLE_EDGE] - | Reduce Output Operator [RS_22] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_11] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_81] - | predicate:(((hd_dep_count = 4) or (hd_vehicle_count = 2)) and hd_demo_sk is not null) (type: boolean) - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:household_demographics - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_21] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 22096 Data size: 24726566 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col3 (type: int), _col5 (type: int), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_86] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col4 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3","_col5","_col6","_col7"] - | Statistics:Num rows: 22096 Data size: 24726566 Basic stats: COMPLETE Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_8] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_80] - | predicate:((s_city) IN ('Rosedale', 'Bethlehem', 'Clinton', 'Clifton', 'Springfield') and s_store_sk is not null) (type: boolean) - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:store - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col4 (type: int) - Map-reduce partition columns:_col4 (type: int) - sort order:+ - Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col5 (type: int), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_85] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_15] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: int), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_78] - | predicate:((((ss_sold_date_sk is not null and ss_store_sk is not null) and ss_hdemo_sk is not null) and ss_addr_sk is not null) and ss_customer_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - Reduce Output Operator [RS_16] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_79] - predicate:(((d_year) IN (1998, 1999, 2000) and (d_dow) IN (6, 0)) and d_date_sk is not null) (type: boolean) - Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:date_dim - Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 9 + File Output Operator [FS_50] + Limit [LIM_49] (rows=100 width=860) + Number of rows:100 + Select Operator [SEL_48] (rows=96800003 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + <-Reducer 8 [SIMPLE_EDGE] + SHUFFLE [RS_47] + Select Operator [SEL_46] (rows=96800003 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + Filter Operator [FIL_45] (rows=96800003 width=860) + predicate:(_col10 <> _col2) + Merge Join Operator [MERGEJOIN_90] (rows=96800003 width=860) + Output:["_col0","_col2","_col3","_col4","_col7","_col8","_col10"],keys:{"0":"_col6","1":"_col0"} + <-Map 15 [SIMPLE_EDGE] + SHUFFLE [RS_43] + PartitionCols:_col0 + Select Operator [SEL_38] (rows=40000000 width=1014) + Output:["_col0","_col1"] + Filter Operator [FIL_84] (rows=40000000 width=1014) + predicate:ca_address_sk is not null + TableScan [TS_36] (rows=40000000 width=1014) + default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_city"] + <-Reducer 7 [SIMPLE_EDGE] + SHUFFLE [RS_42] + PartitionCols:_col6 + Merge Join Operator [MERGEJOIN_89] (rows=88000001 width=860) + Output:["_col0","_col2","_col3","_col4","_col6","_col7","_col8"],keys:{"0":"_col1","1":"_col0"} + <-Map 14 [SIMPLE_EDGE] + SHUFFLE [RS_40] + PartitionCols:_col0 + Select Operator [SEL_35] (rows=80000000 width=860) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_83] (rows=80000000 width=860) + predicate:(c_customer_sk is not null and c_current_addr_sk is not null) + TableScan [TS_33] (rows=80000000 width=860) + default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_current_addr_sk","c_first_name","c_last_name"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_39] + PartitionCols:_col1 + Select Operator [SEL_31] (rows=22000000 width=1014) + Output:["_col0","_col1","_col2","_col3","_col4"] + Group By Operator [GBY_30] (rows=22000000 width=1014) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3 + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_29] + PartitionCols:_col0, _col1, _col2, _col3 + Group By Operator [GBY_28] (rows=44000000 width=1014) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["sum(_col6)","sum(_col7)"],keys:_col1, _col3, _col5, _col17 + Select Operator [SEL_27] (rows=44000000 width=1014) + Output:["_col1","_col3","_col5","_col17","_col6","_col7"] + Merge Join Operator [MERGEJOIN_88] (rows=44000000 width=1014) + Output:["_col1","_col3","_col5","_col6","_col7","_col17"],keys:{"0":"_col3","1":"_col0"} + <-Map 13 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col0 + Select Operator [SEL_14] (rows=40000000 width=1014) + Output:["_col0","_col1"] + Filter Operator [FIL_82] (rows=40000000 width=1014) + predicate:ca_address_sk is not null + TableScan [TS_12] (rows=40000000 width=1014) + default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_city"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_24] + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_87] (rows=24305 width=1119) + Output:["_col1","_col3","_col5","_col6","_col7"],keys:{"0":"_col2","1":"_col0"} + <-Map 12 [SIMPLE_EDGE] + SHUFFLE [RS_22] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=7200 width=107) + Output:["_col0"] + Filter Operator [FIL_81] (rows=7200 width=107) + predicate:(((hd_dep_count = 4) or (hd_vehicle_count = 2)) and hd_demo_sk is not null) + TableScan [TS_9] (rows=7200 width=107) + default@household_demographics,household_demographics,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_dep_count","hd_vehicle_count"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_21] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_86] (rows=22096 width=1119) + Output:["_col1","_col2","_col3","_col5","_col6","_col7"],keys:{"0":"_col4","1":"_col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=852 width=1910) + Output:["_col0"] + Filter Operator [FIL_80] (rows=852 width=1910) + predicate:((s_city) IN ('Rosedale', 'Bethlehem', 'Clinton', 'Clifton', 'Springfield') and s_store_sk is not null) + TableScan [TS_6] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_city"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col4 + Merge Join Operator [MERGEJOIN_85] (rows=20088 width=1119) + Output:["_col1","_col2","_col3","_col4","_col5","_col6","_col7"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] + Filter Operator [FIL_78] (rows=1 width=0) + predicate:((((ss_sold_date_sk is not null and ss_store_sk is not null) and ss_hdemo_sk is not null) and ss_addr_sk is not null) and ss_customer_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_customer_sk","ss_hdemo_sk","ss_addr_sk","ss_store_sk","ss_ticket_number","ss_coupon_amt","ss_net_profit"] + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_79] (rows=18262 width=1119) + predicate:(((d_year) IN (1998, 1999, 2000) and (d_dow) IN (6, 0)) and d_date_sk is not null) + TableScan [TS_3] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_dow"] diff --git a/ql/src/test/results/clientpositive/perf/query48.q.out b/ql/src/test/results/clientpositive/perf/query48.q.out index 40b76f0..5f9b8d7 100644 --- a/ql/src/test/results/clientpositive/perf/query48.q.out +++ b/ql/src/test/results/clientpositive/perf/query48.q.out @@ -12,149 +12,81 @@ Reducer 5 <- Map 10 (SIMPLE_EDGE), Reducer 4 (SIMPLE_EDGE) Reducer 6 <- Reducer 5 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 6 - File Output Operator [FS_34] - compressed:false - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_32] - | aggregations:["sum(VALUE._col0)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_31] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: bigint) - Group By Operator [GBY_30] - aggregations:["sum(_col4)"] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_57] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col4"] - | Statistics:Num rows: 18150000 Data size: 18420070657 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_27] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_25] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_53] - | predicate:((d_year = 1998) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_23] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_26] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 16500000 Data size: 16745518417 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: int) - Select Operator [SEL_22] - outputColumnNames:["_col0","_col4"] - Statistics:Num rows: 16500000 Data size: 16745518417 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_21] - predicate:(((_col12) IN ('KY', 'GA', 'NM') and _col6 BETWEEN 0 AND 2000) or ((_col12) IN ('MT', 'OR', 'IN') and _col6 BETWEEN 150 AND 3000) or ((_col12) IN ('WI', 'MO', 'WV') and _col6 BETWEEN 50 AND 25000)) (type: boolean) - Statistics:Num rows: 16500000 Data size: 16745518417 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_56] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col4","_col6","_col12"] - | Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_11] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_52] - | predicate:((((ca_state) IN ('KY', 'GA', 'NM') or (ca_state) IN ('MT', 'OR', 'IN') or (ca_state) IN ('WI', 'MO', 'WV')) and (ca_country = 'United States')) and ca_address_sk is not null) (type: boolean) - | Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:customer_address - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 5445 Data size: 1972040 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col4 (type: int), _col6 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_55] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2","_col4","_col6"] - | Statistics:Num rows: 5445 Data size: 1972040 Basic stats: COMPLETE Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - | Reduce Output Operator [RS_16] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 4950 Data size: 1792764 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_8] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 4950 Data size: 1792764 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_51] - | predicate:(((cd_education_status = '4 yr Degree') and (cd_marital_status = 'M')) and cd_demo_sk is not null) (type: boolean) - | Statistics:Num rows: 4950 Data size: 1792764 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:customer_demographics - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_15] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 1874 Data size: 3581903 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col2 (type: int), _col4 (type: int), _col6 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_54] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col1","_col2","_col4","_col6"] - | Statistics:Num rows: 1874 Data size: 3581903 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_12] - | key expressions:_col3 (type: int) - | Map-reduce partition columns:_col3 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col4 (type: int), _col6 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col6"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_49] - | predicate:((((((ss_net_profit BETWEEN 0 AND 2000 or ss_net_profit BETWEEN 150 AND 3000 or ss_net_profit BETWEEN 50 AND 25000) and ss_store_sk is not null) and (ss_sales_price BETWEEN 100.0 AND 150.0 or ss_sales_price BETWEEN 50.0 AND 100.0 or ss_sales_price BETWEEN 150.0 AND 200.0)) and ss_cdemo_sk is not null) and ss_addr_sk is not null) and ss_sold_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_13] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_50] - predicate:s_store_sk is not null (type: boolean) - Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:store - Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 6 + File Output Operator [FS_34] + Group By Operator [GBY_32] (rows=1 width=8) + Output:["_col0"],aggregations:["sum(VALUE._col0)"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_31] + Group By Operator [GBY_30] (rows=1 width=8) + Output:["_col0"],aggregations:["sum(_col4)"] + Merge Join Operator [MERGEJOIN_57] (rows=18150000 width=1014) + Output:["_col4"],keys:{"0":"_col0","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_27] + PartitionCols:_col0 + Select Operator [SEL_25] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_53] (rows=36524 width=1119) + predicate:((d_year = 1998) and d_date_sk is not null) + TableScan [TS_23] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_26] + PartitionCols:_col0 + Select Operator [SEL_22] (rows=16500000 width=1014) + Output:["_col0","_col4"] + Filter Operator [FIL_21] (rows=16500000 width=1014) + predicate:(((_col12) IN ('KY', 'GA', 'NM') and _col6 BETWEEN 0 AND 2000) or ((_col12) IN ('MT', 'OR', 'IN') and _col6 BETWEEN 150 AND 3000) or ((_col12) IN ('WI', 'MO', 'WV') and _col6 BETWEEN 50 AND 25000)) + Merge Join Operator [MERGEJOIN_56] (rows=22000000 width=1014) + Output:["_col0","_col4","_col6","_col12"],keys:{"0":"_col2","1":"_col0"} + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=20000000 width=1014) + Output:["_col0","_col1"] + Filter Operator [FIL_52] (rows=20000000 width=1014) + predicate:((((ca_state) IN ('KY', 'GA', 'NM') or (ca_state) IN ('MT', 'OR', 'IN') or (ca_state) IN ('WI', 'MO', 'WV')) and (ca_country = 'United States')) and ca_address_sk is not null) + TableScan [TS_9] (rows=40000000 width=1014) + default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_state","ca_country"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_55] (rows=5445 width=362) + Output:["_col0","_col2","_col4","_col6"],keys:{"0":"_col1","1":"_col0"} + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=4950 width=362) + Output:["_col0"] + Filter Operator [FIL_51] (rows=4950 width=362) + predicate:(((cd_education_status = '4 yr Degree') and (cd_marital_status = 'M')) and cd_demo_sk is not null) + TableScan [TS_6] (rows=19800 width=362) + default@customer_demographics,customer_demographics,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_marital_status","cd_education_status"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_54] (rows=1874 width=1911) + Output:["_col0","_col1","_col2","_col4","_col6"],keys:{"0":"_col3","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col3 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col6"] + Filter Operator [FIL_49] (rows=1 width=0) + predicate:((((((ss_net_profit BETWEEN 0 AND 2000 or ss_net_profit BETWEEN 150 AND 3000 or ss_net_profit BETWEEN 50 AND 25000) and ss_store_sk is not null) and (ss_sales_price BETWEEN 100.0 AND 150.0 or ss_sales_price BETWEEN 50.0 AND 100.0 or ss_sales_price BETWEEN 150.0 AND 200.0)) and ss_cdemo_sk is not null) and ss_addr_sk is not null) and ss_sold_date_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_cdemo_sk","ss_addr_sk","ss_store_sk","ss_quantity","ss_sales_price","ss_net_profit"] + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=1704 width=1910) + Output:["_col0"] + Filter Operator [FIL_50] (rows=1704 width=1910) + predicate:s_store_sk is not null + TableScan [TS_3] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk"] diff --git a/ql/src/test/results/clientpositive/perf/query50.q.out b/ql/src/test/results/clientpositive/perf/query50.q.out index 8b41d05..0980ea2 100644 --- a/ql/src/test/results/clientpositive/perf/query50.q.out +++ b/ql/src/test/results/clientpositive/perf/query50.q.out @@ -125,163 +125,86 @@ Reducer 6 <- Reducer 5 (SIMPLE_EDGE) Reducer 7 <- Reducer 6 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 7 - File Output Operator [FS_36] - compressed:false - Statistics:Num rows: 100 Data size: 111900 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_35] - Number of rows:100 - Statistics:Num rows: 100 Data size: 111900 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_34] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14"] - | Statistics:Num rows: 44194 Data size: 49453809 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_33] - key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: string), _col7 (type: string), _col8 (type: string), _col9 (type: string) - sort order:++++++++++ - Statistics:Num rows: 44194 Data size: 49453809 Basic stats: COMPLETE Column stats: NONE - value expressions:_col10 (type: bigint), _col11 (type: bigint), _col12 (type: bigint), _col13 (type: bigint), _col14 (type: bigint) - Group By Operator [GBY_31] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)","sum(VALUE._col3)","sum(VALUE._col4)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: string), KEY._col3 (type: string), KEY._col4 (type: string), KEY._col5 (type: string), KEY._col6 (type: string), KEY._col7 (type: string), KEY._col8 (type: string), KEY._col9 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14"] - | Statistics:Num rows: 44194 Data size: 49453809 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_30] - key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: string), _col7 (type: string), _col8 (type: string), _col9 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: string), _col7 (type: string), _col8 (type: string), _col9 (type: string) - sort order:++++++++++ - Statistics:Num rows: 88388 Data size: 98907619 Basic stats: COMPLETE Column stats: NONE - value expressions:_col10 (type: bigint), _col11 (type: bigint), _col12 (type: bigint), _col13 (type: bigint), _col14 (type: bigint) - Group By Operator [GBY_29] - aggregations:["sum(_col10)","sum(_col11)","sum(_col12)","sum(_col13)","sum(_col14)"] - keys:_col0 (type: string), _col1 (type: int), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: string), _col7 (type: string), _col8 (type: string), _col9 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14"] - Statistics:Num rows: 88388 Data size: 98907619 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_27] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14"] - Statistics:Num rows: 88388 Data size: 98907619 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_59] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col5 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col5","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19"] - | Statistics:Num rows: 88388 Data size: 98907619 Basic stats: COMPLETE Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_25] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_14] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_55] - | predicate:(((d_year = 2000) and d_date_sk is not null) and (d_moy = 9)) (type: boolean) - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_12] - | alias:d1 - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_24] - key expressions:_col5 (type: int) - Map-reduce partition columns:_col5 (type: int) - sort order:+ - Statistics:Num rows: 80353 Data size: 89916016 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col10 (type: string), _col11 (type: int), _col12 (type: string), _col13 (type: string), _col14 (type: string), _col15 (type: string), _col16 (type: string), _col17 (type: string), _col18 (type: string), _col19 (type: string) - Merge Join Operator [MERGEJOIN_58] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col5","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19"] - | Statistics:Num rows: 80353 Data size: 89916016 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_22] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_11] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_54] - | predicate:d_date_sk is not null (type: boolean) - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:d1 - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_21] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1874 Data size: 3581903 Basic stats: COMPLETE Column stats: NONE - value expressions:_col5 (type: int), _col10 (type: string), _col11 (type: int), _col12 (type: string), _col13 (type: string), _col14 (type: string), _col15 (type: string), _col16 (type: string), _col17 (type: string), _col18 (type: string), _col19 (type: string) - Merge Join Operator [MERGEJOIN_57] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col5","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19"] - | Statistics:Num rows: 1874 Data size: 3581903 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: int), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: string), _col7 (type: string), _col8 (type: string), _col9 (type: string), _col10 (type: string) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10"] - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_53] - | predicate:s_store_sk is not null (type: boolean) - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:store - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col3 (type: int) - Map-reduce partition columns:_col3 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col0 (type: int), _col5 (type: int) - Merge Join Operator [MERGEJOIN_56] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col4 (type: int), _col1 (type: int), _col2 (type: int)","1":"_col3 (type: int), _col1 (type: int), _col2 (type: int)"} - | outputColumnNames:["_col0","_col3","_col5"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_15] - | key expressions:_col4 (type: int), _col1 (type: int), _col2 (type: int) - | Map-reduce partition columns:_col4 (type: int), _col1 (type: int), _col2 (type: int) - | sort order:+++ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col3 (type: int) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_51] - | predicate:((((ss_ticket_number is not null and ss_customer_sk is not null) and ss_item_sk is not null) and ss_store_sk is not null) and ss_sold_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_16] - key expressions:_col3 (type: int), _col1 (type: int), _col2 (type: int) - Map-reduce partition columns:_col3 (type: int), _col1 (type: int), _col2 (type: int) - sort order:+++ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col0 (type: int) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_52] - predicate:(((sr_ticket_number is not null and sr_customer_sk is not null) and sr_item_sk is not null) and sr_returned_date_sk is not null) (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_3] - alias:store_returns - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 7 + File Output Operator [FS_36] + Limit [LIM_35] (rows=100 width=1119) + Number of rows:100 + Select Operator [SEL_34] (rows=44194 width=1119) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_33] + Group By Operator [GBY_31] (rows=44194 width=1119) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)","sum(VALUE._col3)","sum(VALUE._col4)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4, KEY._col5, KEY._col6, KEY._col7, KEY._col8, KEY._col9 + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_30] + PartitionCols:_col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9 + Group By Operator [GBY_29] (rows=88388 width=1119) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14"],aggregations:["sum(_col10)","sum(_col11)","sum(_col12)","sum(_col13)","sum(_col14)"],keys:_col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9 + Select Operator [SEL_27] (rows=88388 width=1119) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14"] + Merge Join Operator [MERGEJOIN_59] (rows=88388 width=1119) + Output:["_col0","_col5","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19"],keys:{"0":"_col5","1":"_col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col0 + Select Operator [SEL_14] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_55] (rows=18262 width=1119) + predicate:(((d_year = 2000) and d_date_sk is not null) and (d_moy = 9)) + TableScan [TS_12] (rows=73049 width=1119) + default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_24] + PartitionCols:_col5 + Merge Join Operator [MERGEJOIN_58] (rows=80353 width=1119) + Output:["_col0","_col5","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19"],keys:{"0":"_col0","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_22] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=73049 width=1119) + Output:["_col0"] + Filter Operator [FIL_54] (rows=73049 width=1119) + predicate:d_date_sk is not null + TableScan [TS_9] (rows=73049 width=1119) + default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_21] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_57] (rows=1874 width=1911) + Output:["_col0","_col5","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19"],keys:{"0":"_col3","1":"_col0"} + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=1704 width=1910) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10"] + Filter Operator [FIL_53] (rows=1704 width=1910) + predicate:s_store_sk is not null + TableScan [TS_6] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_store_name","s_company_id","s_street_number","s_street_name","s_street_type","s_suite_number","s_city","s_county","s_state","s_zip"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_56] (rows=1 width=0) + Output:["_col0","_col3","_col5"],keys:{"0":"_col4, _col1, _col2","1":"_col3, _col1, _col2"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col4, _col1, _col2 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_51] (rows=1 width=0) + predicate:((((ss_ticket_number is not null and ss_customer_sk is not null) and ss_item_sk is not null) and ss_store_sk is not null) and ss_sold_date_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_customer_sk","ss_store_sk","ss_ticket_number"] + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col3, _col1, _col2 + Select Operator [SEL_5] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_52] (rows=1 width=0) + predicate:(((sr_ticket_number is not null and sr_customer_sk is not null) and sr_item_sk is not null) and sr_returned_date_sk is not null) + TableScan [TS_3] (rows=1 width=0) + default@store_returns,store_returns,Tbl:PARTIAL,Col:NONE,Output:["sr_returned_date_sk","sr_item_sk","sr_customer_sk","sr_ticket_number"] diff --git a/ql/src/test/results/clientpositive/perf/query51.q.out b/ql/src/test/results/clientpositive/perf/query51.q.out index efd95f2..54d7208 100644 --- a/ql/src/test/results/clientpositive/perf/query51.q.out +++ b/ql/src/test/results/clientpositive/perf/query51.q.out @@ -96,188 +96,100 @@ Reducer 6 <- Reducer 5 (SIMPLE_EDGE) Reducer 9 <- Map 11 (SIMPLE_EDGE), Map 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 6 - File Output Operator [FS_51] - compressed:false - Statistics:Num rows: 100 Data size: 111900 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_50] - Number of rows:100 - Statistics:Num rows: 100 Data size: 111900 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_49] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 7365 Data size: 8241815 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_48] - key expressions:_col0 (type: int), _col1 (type: string) - sort order:++ - Statistics:Num rows: 7365 Data size: 8241815 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: decimal(27,2)), _col3 (type: decimal(27,2)), _col4 (type: decimal(27,2)), _col5 (type: decimal(27,2)) - Select Operator [SEL_44] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 7365 Data size: 8241815 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_56] - predicate:(max_window_0 > max_window_1) (type: boolean) - Statistics:Num rows: 7365 Data size: 8241815 Basic stats: COMPLETE Column stats: NONE - PTF Operator [PTF_43] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"CASE WHEN (_col1 is not null) THEN (_col1) ELSE (_col4) END","partition by:":"CASE WHEN (_col0 is not null) THEN (_col0) ELSE (_col3) END"}] - Statistics:Num rows: 22096 Data size: 24726566 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_42] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 22096 Data size: 24726566 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_41] - key expressions:CASE WHEN (_col0 is not null) THEN (_col0) ELSE (_col3) END (type: int), CASE WHEN (_col1 is not null) THEN (_col1) ELSE (_col4) END (type: string) - Map-reduce partition columns:CASE WHEN (_col0 is not null) THEN (_col0) ELSE (_col3) END (type: int) - sort order:++ - Statistics:Num rows: 22096 Data size: 24726566 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col1 (type: string), _col2 (type: decimal(27,2)), _col3 (type: int), _col4 (type: string), _col5 (type: decimal(27,2)) - Merge Join Operator [MERGEJOIN_65] - | condition map:[{"":"Outer Join 0 to 1"}] - | keys:{"0":"_col0 (type: int), _col1 (type: string)","1":"_col0 (type: int), _col1 (type: string)"} - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 22096 Data size: 24726566 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_39] - | key expressions:_col0 (type: int), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: int), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col2 (type: decimal(27,2)) - | Select Operator [SEL_35] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | PTF Operator [PTF_34] - | Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col0"}] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_31] - | | aggregations:["sum(VALUE._col0)"] - | | keys:KEY._col0 (type: int), KEY._col1 (type: string) - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_30] - | key expressions:_col0 (type: int), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: int) - | sort order:++ - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col2 (type: decimal(17,2)) - | Group By Operator [GBY_29] - | aggregations:["sum(_col2)"] - | keys:_col1 (type: int), _col4 (type: string) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_28] - | outputColumnNames:["_col1","_col4","_col2"] - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_64] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col2","_col4"] - | | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | |<-Map 11 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_26] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: string) - | | Select Operator [SEL_24] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_60] - | | predicate:(d_month_seq BETWEEN 1193 AND 1204 and d_date_sk is not null) (type: boolean) - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_22] - | | alias:date_dim - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | |<-Map 8 [SIMPLE_EDGE] - | Reduce Output Operator [RS_25] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: decimal(7,2)) - | Select Operator [SEL_21] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_59] - | predicate:(ss_item_sk is not null and ss_sold_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_19] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_38] - key expressions:_col0 (type: int), _col1 (type: string) - Map-reduce partition columns:_col0 (type: int), _col1 (type: string) - sort order:++ - Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: decimal(27,2)) - Select Operator [SEL_16] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - PTF Operator [PTF_15] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col0"}] - Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_12] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: int), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_11] - key expressions:_col0 (type: int), _col1 (type: string) - Map-reduce partition columns:_col0 (type: int) - sort order:++ - Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: decimal(17,2)) - Group By Operator [GBY_10] - aggregations:["sum(_col2)"] - keys:_col1 (type: int), _col4 (type: string) - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_9] - outputColumnNames:["_col1","_col4","_col2"] - Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_63] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col4"] - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_6] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_57] - | predicate:(ws_item_sk is not null and ws_sold_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:web_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_7] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_58] - predicate:(d_month_seq BETWEEN 1193 AND 1204 and d_date_sk is not null) (type: boolean) - Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:date_dim - Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 6 + File Output Operator [FS_51] + Limit [LIM_50] (rows=100 width=1119) + Number of rows:100 + Select Operator [SEL_49] (rows=7365 width=1119) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_48] + Select Operator [SEL_44] (rows=7365 width=1119) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Filter Operator [FIL_56] (rows=7365 width=1119) + predicate:(max_window_0 > max_window_1) + PTF Operator [PTF_43] (rows=22096 width=1119) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"CASE WHEN (_col1 is not null) THEN (_col1) ELSE (_col4) END","partition by:":"CASE WHEN (_col0 is not null) THEN (_col0) ELSE (_col3) END"}] + Select Operator [SEL_42] (rows=22096 width=1119) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_41] + PartitionCols:CASE WHEN (_col0 is not null) THEN (_col0) ELSE (_col3) END + Merge Join Operator [MERGEJOIN_65] (rows=22096 width=1119) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],keys:{"0":"_col0, _col1","1":"_col0, _col1"} + <-Reducer 10 [SIMPLE_EDGE] + SHUFFLE [RS_39] + PartitionCols:_col0, _col1 + Select Operator [SEL_35] (rows=20088 width=1119) + Output:["_col0","_col1","_col2"] + PTF Operator [PTF_34] (rows=20088 width=1119) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col0"}] + Group By Operator [GBY_31] (rows=20088 width=1119) + Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1 + <-Reducer 9 [SIMPLE_EDGE] + SHUFFLE [RS_30] + PartitionCols:_col0 + Group By Operator [GBY_29] (rows=40176 width=1119) + Output:["_col0","_col1","_col2"],aggregations:["sum(_col2)"],keys:_col1, _col4 + Select Operator [SEL_28] (rows=40176 width=1119) + Output:["_col1","_col4","_col2"] + Merge Join Operator [MERGEJOIN_64] (rows=40176 width=1119) + Output:["_col1","_col2","_col4"],keys:{"0":"_col0","1":"_col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_26] + PartitionCols:_col0 + Select Operator [SEL_24] (rows=36524 width=1119) + Output:["_col0","_col1"] + Filter Operator [FIL_60] (rows=36524 width=1119) + predicate:(d_month_seq BETWEEN 1193 AND 1204 and d_date_sk is not null) + TableScan [TS_22] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date","d_month_seq"] + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col0 + Select Operator [SEL_21] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_59] (rows=1 width=0) + predicate:(ss_item_sk is not null and ss_sold_date_sk is not null) + TableScan [TS_19] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_sales_price"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_38] + PartitionCols:_col0, _col1 + Select Operator [SEL_16] (rows=20088 width=1119) + Output:["_col0","_col1","_col2"] + PTF Operator [PTF_15] (rows=20088 width=1119) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col0"}] + Group By Operator [GBY_12] (rows=20088 width=1119) + Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1 + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_11] + PartitionCols:_col0 + Group By Operator [GBY_10] (rows=40176 width=1119) + Output:["_col0","_col1","_col2"],aggregations:["sum(_col2)"],keys:_col1, _col4 + Select Operator [SEL_9] (rows=40176 width=1119) + Output:["_col1","_col4","_col2"] + Merge Join Operator [MERGEJOIN_63] (rows=40176 width=1119) + Output:["_col1","_col2","_col4"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_6] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_57] (rows=1 width=0) + predicate:(ws_item_sk is not null and ws_sold_date_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@web_sales,web_sales,Tbl:PARTIAL,Col:NONE,Output:["ws_sold_date_sk","ws_item_sk","ws_sales_price"] + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_7] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=36524 width=1119) + Output:["_col0","_col1"] + Filter Operator [FIL_58] (rows=36524 width=1119) + predicate:(d_month_seq BETWEEN 1193 AND 1204 and d_date_sk is not null) + TableScan [TS_3] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date","d_month_seq"] diff --git a/ql/src/test/results/clientpositive/perf/query52.q.out b/ql/src/test/results/clientpositive/perf/query52.q.out index b4f46cc..4670f6b 100644 --- a/ql/src/test/results/clientpositive/perf/query52.q.out +++ b/ql/src/test/results/clientpositive/perf/query52.q.out @@ -11,111 +11,60 @@ Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 5 - File Output Operator [FS_24] - compressed:false - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_23] - Number of rows:100 - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_22] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 127050 Data size: 182479129 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_21] - key expressions:1998 (type: int), _col3 (type: decimal(17,2)), _col1 (type: int) - sort order:+-+ - Statistics:Num rows: 127050 Data size: 182479129 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: string) - Select Operator [SEL_20] - outputColumnNames:["_col1","_col2","_col3"] - Statistics:Num rows: 127050 Data size: 182479129 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_19] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: int), KEY._col1 (type: string), KEY._col2 (type: int) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 127050 Data size: 182479129 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col0 (type: int), _col1 (type: string), _col2 (type: int) - Map-reduce partition columns:_col0 (type: int), _col1 (type: string), _col2 (type: int) - sort order:+++ - Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: decimal(17,2)) - Group By Operator [GBY_17] - aggregations:["sum(_col3)"] - keys:1998 (type: int), _col1 (type: string), _col2 (type: int) - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_15] - outputColumnNames:["_col1","_col2","_col3"] - Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_34] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col4 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col5","_col7","_col8"] - | Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - | Reduce Output Operator [RS_13] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: string) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_32] - | predicate:((i_manager_id = 1) and i_item_sk is not null) (type: boolean) - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_12] - key expressions:_col4 (type: int) - Map-reduce partition columns:_col4 (type: int) - sort order:+ - Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - value expressions:_col5 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_33] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col4","_col5"] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_9] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_2] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_30] - | predicate:(((d_year = 1998) and (d_moy = 12)) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:dt - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Map 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col1 (type: int), _col2 (type: decimal(7,2)) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_31] - predicate:(ss_sold_date_sk is not null and ss_item_sk is not null) (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_3] - alias:store_sales - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 5 + File Output Operator [FS_24] + Limit [LIM_23] (rows=100 width=1436) + Number of rows:100 + Select Operator [SEL_22] (rows=127050 width=1436) + Output:["_col0","_col1","_col2","_col3"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_21] + Select Operator [SEL_20] (rows=127050 width=1436) + Output:["_col1","_col2","_col3"] + Group By Operator [GBY_19] (rows=127050 width=1436) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_17] (rows=254100 width=1436) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(_col3)"],keys:1998, _col1, _col2 + Select Operator [SEL_15] (rows=254100 width=1436) + Output:["_col1","_col2","_col3"] + Merge Join Operator [MERGEJOIN_34] (rows=254100 width=1436) + Output:["_col5","_col7","_col8"],keys:{"0":"_col4","1":"_col0"} + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=231000 width=1436) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_32] (rows=231000 width=1436) + predicate:((i_manager_id = 1) and i_item_sk is not null) + TableScan [TS_6] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_brand_id","i_brand","i_manager_id"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col4 + Merge Join Operator [MERGEJOIN_33] (rows=20088 width=1119) + Output:["_col4","_col5"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_30] (rows=18262 width=1119) + predicate:(((d_year = 1998) and (d_moy = 12)) and d_date_sk is not null) + TableScan [TS_0] (rows=73049 width=1119) + default@date_dim,dt,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"] + <-Map 6 [SIMPLE_EDGE] + SHUFFLE [RS_10] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_31] (rows=1 width=0) + predicate:(ss_sold_date_sk is not null and ss_item_sk is not null) + TableScan [TS_3] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_ext_sales_price"] diff --git a/ql/src/test/results/clientpositive/perf/query54.q.out b/ql/src/test/results/clientpositive/perf/query54.q.out index 56c70b7..2184419 100644 --- a/ql/src/test/results/clientpositive/perf/query54.q.out +++ b/ql/src/test/results/clientpositive/perf/query54.q.out @@ -20,295 +20,154 @@ Reducer 8 <- Map 19 (SIMPLE_EDGE), Reducer 7 (SIMPLE_EDGE) Reducer 9 <- Map 20 (SIMPLE_EDGE), Reducer 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 13 - File Output Operator [FS_68] - compressed:false - Statistics:Num rows: 100 Data size: 86000 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_67] - Number of rows:100 - Statistics:Num rows: 100 Data size: 86000 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_66] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 16105101 Data size: 13850712636 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 12 [SIMPLE_EDGE] - Reduce Output Operator [RS_65] - key expressions:_col0 (type: int), _col1 (type: bigint) - sort order:++ - Statistics:Num rows: 16105101 Data size: 13850712636 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: int) - Select Operator [SEL_64] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 16105101 Data size: 13850712636 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_63] - | aggregations:["count(VALUE._col0)"] - | keys:KEY._col0 (type: int) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 16105101 Data size: 13850712636 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 11 [SIMPLE_EDGE] - Reduce Output Operator [RS_62] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 32210202 Data size: 27701425272 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: bigint) - Group By Operator [GBY_61] - aggregations:["count()"] - keys:_col0 (type: int) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 32210202 Data size: 27701425272 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_59] - outputColumnNames:["_col0"] - Statistics:Num rows: 32210202 Data size: 27701425272 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_58] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: int) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 32210202 Data size: 27701425272 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 10 [SIMPLE_EDGE] - Reduce Output Operator [RS_57] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 64420404 Data size: 55402850544 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: decimal(17,2)) - Group By Operator [GBY_56] - aggregations:["sum(_col4)"] - keys:_col0 (type: int) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 64420404 Data size: 55402850544 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_126] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col4"] - | Statistics:Num rows: 64420404 Data size: 55402850544 Basic stats: COMPLETE Column stats: NONE - |<-Map 21 [SIMPLE_EDGE] - | Reduce Output Operator [RS_53] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_42] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_119] - | predicate:(d_month_seq BETWEEN 1203 AND 1205 and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_40] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 9 [SIMPLE_EDGE] - Reduce Output Operator [RS_52] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 58564003 Data size: 50366226676 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col4 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_125] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col6 (type: string), _col7 (type: string)","1":"_col0 (type: string), _col1 (type: string)"} - | outputColumnNames:["_col0","_col2","_col4"] - | Statistics:Num rows: 58564003 Data size: 50366226676 Basic stats: COMPLETE Column stats: NONE - |<-Map 20 [SIMPLE_EDGE] - | Reduce Output Operator [RS_50] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_39] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_118] - | predicate:(s_county is not null and s_state is not null) (type: boolean) - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_37] - | alias:store - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_49] - key expressions:_col6 (type: string), _col7 (type: string) - Map-reduce partition columns:_col6 (type: string), _col7 (type: string) - sort order:++ - Statistics:Num rows: 53240002 Data size: 45787477804 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col2 (type: int), _col4 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_124] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2","_col4","_col6","_col7"] - | Statistics:Num rows: 53240002 Data size: 45787477804 Basic stats: COMPLETE Column stats: NONE - |<-Map 19 [SIMPLE_EDGE] - | Reduce Output Operator [RS_47] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string) - | Select Operator [SEL_36] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_117] - | predicate:((ca_address_sk is not null and ca_state is not null) and ca_county is not null) (type: boolean) - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_34] - | alias:customer_address - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_46] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 48400001 Data size: 41624978920 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col2 (type: int), _col4 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_123] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col1 (type: int)"} - | outputColumnNames:["_col0","_col1","_col2","_col4"] - | Statistics:Num rows: 48400001 Data size: 41624978920 Basic stats: COMPLETE Column stats: NONE - |<-Map 18 [SIMPLE_EDGE] - | Reduce Output Operator [RS_44] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col2 (type: decimal(7,2)) - | Select Operator [SEL_33] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_116] - | predicate:(ss_customer_sk is not null and ss_sold_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_31] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_43] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 44000000 Data size: 37840889108 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int) - Group By Operator [GBY_29] - | keys:KEY._col0 (type: int), KEY._col1 (type: int) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 44000000 Data size: 37840889108 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_28] - key expressions:_col0 (type: int), _col1 (type: int) - Map-reduce partition columns:_col0 (type: int), _col1 (type: int) - sort order:++ - Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_27] - keys:_col9 (type: int), _col10 (type: int) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_122] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col9","_col10"] - | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - |<-Map 17 [SIMPLE_EDGE] - | Reduce Output Operator [RS_24] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int) - | Select Operator [SEL_16] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_115] - | predicate:(c_customer_sk is not null and c_current_addr_sk is not null) (type: boolean) - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_14] - | alias:customer - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_23] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_121] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1"] - | Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - |<-Map 16 [SIMPLE_EDGE] - | Reduce Output Operator [RS_21] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_13] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_114] - | predicate:(((d_year = 2000) and (d_moy = 3)) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_11] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_20] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 127050 Data size: 182479129 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int) - Merge Join Operator [MERGEJOIN_120] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 127050 Data size: 182479129 Basic stats: COMPLETE Column stats: NONE - |<-Map 15 [SIMPLE_EDGE] - | Reduce Output Operator [RS_18] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 115500 Data size: 165890114 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_10] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 115500 Data size: 165890114 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_113] - | predicate:(((i_category = 'Jewelry') and (i_class = 'football')) and i_item_sk is not null) (type: boolean) - | Statistics:Num rows: 115500 Data size: 165890114 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_8] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Union 2 [SIMPLE_EDGE] - |<-Map 1 [CONTAINS] - | Reduce Output Operator [RS_17] - | key expressions:_col2 (type: int) - | Map-reduce partition columns:_col2 (type: int) - | sort order:+ - | Statistics:Num rows: 2 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col1 (type: int) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_111] - | predicate:((cs_item_sk is not null and cs_sold_date_sk is not null) and cs_bill_customer_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:catalog_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 14 [CONTAINS] - Reduce Output Operator [RS_17] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 2 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col0 (type: int), _col1 (type: int) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_112] - predicate:((ws_item_sk is not null and ws_sold_date_sk is not null) and ws_bill_customer_sk is not null) (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_3] - alias:web_sales - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 13 + File Output Operator [FS_68] + Limit [LIM_67] (rows=100 width=860) + Number of rows:100 + Select Operator [SEL_66] (rows=16105101 width=860) + Output:["_col0","_col1","_col2"] + <-Reducer 12 [SIMPLE_EDGE] + SHUFFLE [RS_65] + Select Operator [SEL_64] (rows=16105101 width=860) + Output:["_col0","_col1","_col2"] + Group By Operator [GBY_63] (rows=16105101 width=860) + Output:["_col0","_col1"],aggregations:["count(VALUE._col0)"],keys:KEY._col0 + <-Reducer 11 [SIMPLE_EDGE] + SHUFFLE [RS_62] + PartitionCols:_col0 + Group By Operator [GBY_61] (rows=32210202 width=860) + Output:["_col0","_col1"],aggregations:["count()"],keys:_col0 + Select Operator [SEL_59] (rows=32210202 width=860) + Output:["_col0"] + Group By Operator [GBY_58] (rows=32210202 width=860) + Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0 + <-Reducer 10 [SIMPLE_EDGE] + SHUFFLE [RS_57] + PartitionCols:_col0 + Group By Operator [GBY_56] (rows=64420404 width=860) + Output:["_col0","_col1"],aggregations:["sum(_col4)"],keys:_col0 + Merge Join Operator [MERGEJOIN_126] (rows=64420404 width=860) + Output:["_col0","_col4"],keys:{"0":"_col2","1":"_col0"} + <-Map 21 [SIMPLE_EDGE] + SHUFFLE [RS_53] + PartitionCols:_col0 + Select Operator [SEL_42] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_119] (rows=36524 width=1119) + predicate:(d_month_seq BETWEEN 1203 AND 1205 and d_date_sk is not null) + TableScan [TS_40] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_month_seq"] + <-Reducer 9 [SIMPLE_EDGE] + SHUFFLE [RS_52] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_125] (rows=58564003 width=860) + Output:["_col0","_col2","_col4"],keys:{"0":"_col6, _col7","1":"_col0, _col1"} + <-Map 20 [SIMPLE_EDGE] + SHUFFLE [RS_50] + PartitionCols:_col0, _col1 + Select Operator [SEL_39] (rows=1704 width=1910) + Output:["_col0","_col1"] + Filter Operator [FIL_118] (rows=1704 width=1910) + predicate:(s_county is not null and s_state is not null) + TableScan [TS_37] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_county","s_state"] + <-Reducer 8 [SIMPLE_EDGE] + SHUFFLE [RS_49] + PartitionCols:_col6, _col7 + Merge Join Operator [MERGEJOIN_124] (rows=53240002 width=860) + Output:["_col0","_col2","_col4","_col6","_col7"],keys:{"0":"_col1","1":"_col0"} + <-Map 19 [SIMPLE_EDGE] + SHUFFLE [RS_47] + PartitionCols:_col0 + Select Operator [SEL_36] (rows=40000000 width=1014) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_117] (rows=40000000 width=1014) + predicate:((ca_address_sk is not null and ca_state is not null) and ca_county is not null) + TableScan [TS_34] (rows=40000000 width=1014) + default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_county","ca_state"] + <-Reducer 7 [SIMPLE_EDGE] + SHUFFLE [RS_46] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_123] (rows=48400001 width=860) + Output:["_col0","_col1","_col2","_col4"],keys:{"0":"_col0","1":"_col1"} + <-Map 18 [SIMPLE_EDGE] + SHUFFLE [RS_44] + PartitionCols:_col1 + Select Operator [SEL_33] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_116] (rows=1 width=0) + predicate:(ss_customer_sk is not null and ss_sold_date_sk is not null) + TableScan [TS_31] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_customer_sk","ss_ext_sales_price"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_43] + PartitionCols:_col0 + Group By Operator [GBY_29] (rows=44000000 width=860) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_28] + PartitionCols:_col0, _col1 + Group By Operator [GBY_27] (rows=88000001 width=860) + Output:["_col0","_col1"],keys:_col9, _col10 + Merge Join Operator [MERGEJOIN_122] (rows=88000001 width=860) + Output:["_col9","_col10"],keys:{"0":"_col1","1":"_col0"} + <-Map 17 [SIMPLE_EDGE] + SHUFFLE [RS_24] + PartitionCols:_col0 + Select Operator [SEL_16] (rows=80000000 width=860) + Output:["_col0","_col1"] + Filter Operator [FIL_115] (rows=80000000 width=860) + predicate:(c_customer_sk is not null and c_current_addr_sk is not null) + TableScan [TS_14] (rows=80000000 width=860) + default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_current_addr_sk"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_23] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_121] (rows=139755 width=1436) + Output:["_col1"],keys:{"0":"_col0","1":"_col0"} + <-Map 16 [SIMPLE_EDGE] + SHUFFLE [RS_21] + PartitionCols:_col0 + Select Operator [SEL_13] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_114] (rows=18262 width=1119) + predicate:(((d_year = 2000) and (d_moy = 3)) and d_date_sk is not null) + TableScan [TS_11] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_20] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_120] (rows=127050 width=1436) + Output:["_col0","_col1"],keys:{"0":"_col2","1":"_col0"} + <-Map 15 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col0 + Select Operator [SEL_10] (rows=115500 width=1436) + Output:["_col0"] + Filter Operator [FIL_113] (rows=115500 width=1436) + predicate:(((i_category = 'Jewelry') and (i_class = 'football')) and i_item_sk is not null) + TableScan [TS_8] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_class","i_category"] + <-Union 2 [SIMPLE_EDGE] + <-Map 1 [CONTAINS] + Reduce Output Operator [RS_17] + PartitionCols:_col2 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_111] (rows=1 width=0) + predicate:((cs_item_sk is not null and cs_sold_date_sk is not null) and cs_bill_customer_sk is not null) + TableScan [TS_0] (rows=1 width=0) + Output:["cs_sold_date_sk","cs_bill_customer_sk","cs_item_sk"] + <-Map 14 [CONTAINS] + Reduce Output Operator [RS_17] + PartitionCols:_col2 + Select Operator [SEL_5] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_112] (rows=1 width=0) + predicate:((ws_item_sk is not null and ws_sold_date_sk is not null) and ws_bill_customer_sk is not null) + TableScan [TS_3] (rows=1 width=0) + Output:["ws_sold_date_sk","ws_item_sk","ws_bill_customer_sk"] diff --git a/ql/src/test/results/clientpositive/perf/query55.q.out b/ql/src/test/results/clientpositive/perf/query55.q.out index d36f378..e35cda4 100644 --- a/ql/src/test/results/clientpositive/perf/query55.q.out +++ b/ql/src/test/results/clientpositive/perf/query55.q.out @@ -11,108 +11,58 @@ Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 5 - File Output Operator [FS_24] - compressed:false - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_23] - Number of rows:100 - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_22] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 127050 Data size: 182479129 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_21] - key expressions:_col2 (type: decimal(17,2)), _col0 (type: int) - sort order:-+ - Statistics:Num rows: 127050 Data size: 182479129 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string) - Group By Operator [GBY_18] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: int), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 127050 Data size: 182479129 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_17] - key expressions:_col0 (type: int), _col1 (type: string) - Map-reduce partition columns:_col0 (type: int), _col1 (type: string) - sort order:++ - Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: decimal(17,2)) - Group By Operator [GBY_16] - aggregations:["sum(_col5)"] - keys:_col7 (type: int), _col8 (type: string) - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_15] - outputColumnNames:["_col7","_col8","_col5"] - Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_34] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col4 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col5","_col7","_col8"] - | Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - | Reduce Output Operator [RS_13] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: string) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_32] - | predicate:((i_manager_id = 36) and i_item_sk is not null) (type: boolean) - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_12] - key expressions:_col4 (type: int) - Map-reduce partition columns:_col4 (type: int) - sort order:+ - Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - value expressions:_col5 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_33] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col4","_col5"] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_9] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_2] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_30] - | predicate:(((d_moy = 12) and d_date_sk is not null) and (d_year = 2001)) (type: boolean) - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Map 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col1 (type: int), _col2 (type: decimal(7,2)) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_31] - predicate:(ss_sold_date_sk is not null and ss_item_sk is not null) (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_3] - alias:store_sales - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 5 + File Output Operator [FS_24] + Limit [LIM_23] (rows=100 width=1436) + Number of rows:100 + Select Operator [SEL_22] (rows=127050 width=1436) + Output:["_col0","_col1","_col2"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_21] + Group By Operator [GBY_18] (rows=127050 width=1436) + Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1 + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_17] + PartitionCols:_col0, _col1 + Group By Operator [GBY_16] (rows=254100 width=1436) + Output:["_col0","_col1","_col2"],aggregations:["sum(_col5)"],keys:_col7, _col8 + Select Operator [SEL_15] (rows=254100 width=1436) + Output:["_col7","_col8","_col5"] + Merge Join Operator [MERGEJOIN_34] (rows=254100 width=1436) + Output:["_col5","_col7","_col8"],keys:{"0":"_col4","1":"_col0"} + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=231000 width=1436) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_32] (rows=231000 width=1436) + predicate:((i_manager_id = 36) and i_item_sk is not null) + TableScan [TS_6] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_brand_id","i_brand","i_manager_id"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col4 + Merge Join Operator [MERGEJOIN_33] (rows=20088 width=1119) + Output:["_col4","_col5"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_30] (rows=18262 width=1119) + predicate:(((d_moy = 12) and d_date_sk is not null) and (d_year = 2001)) + TableScan [TS_0] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"] + <-Map 6 [SIMPLE_EDGE] + SHUFFLE [RS_10] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_31] (rows=1 width=0) + predicate:(ss_sold_date_sk is not null and ss_item_sk is not null) + TableScan [TS_3] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_ext_sales_price"] diff --git a/ql/src/test/results/clientpositive/perf/query58.q.out b/ql/src/test/results/clientpositive/perf/query58.q.out index c2f7189..5e21730 100644 --- a/ql/src/test/results/clientpositive/perf/query58.q.out +++ b/ql/src/test/results/clientpositive/perf/query58.q.out @@ -115,488 +115,250 @@ Reducer 7 <- Reducer 28 (SIMPLE_EDGE), Reducer 6 (SIMPLE_EDGE) Reducer 8 <- Reducer 7 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 8 - File Output Operator [FS_112] - compressed:false - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_111] - Number of rows:100 - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_110] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - | Statistics:Num rows: 21137 Data size: 30358620 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_109] - key expressions:_col0 (type: string), _col1 (type: decimal(17,2)) - sort order:++ - Statistics:Num rows: 21137 Data size: 30358620 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: decimal(38,21)), _col3 (type: decimal(17,2)), _col4 (type: decimal(38,21)), _col5 (type: decimal(17,2)), _col6 (type: decimal(38,21)), _col7 (type: decimal(23,6)) - Select Operator [SEL_108] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - Statistics:Num rows: 21137 Data size: 30358620 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_107] - predicate:(_col1 BETWEEN (0.9 * UDFToDouble(_col5)) AND (1.1 * UDFToDouble(_col5)) and _col3 BETWEEN (0.9 * UDFToDouble(_col5)) AND (1.1 * UDFToDouble(_col5)) and _col5 BETWEEN (0.9 * UDFToDouble(_col1)) AND (1.1 * UDFToDouble(_col1)) and _col5 BETWEEN (0.9 * UDFToDouble(_col3)) AND (1.1 * UDFToDouble(_col3))) (type: boolean) - Statistics:Num rows: 21137 Data size: 30358620 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_202] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col0","_col1","_col3","_col5"] - | Statistics:Num rows: 338207 Data size: 485759473 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 28 [SIMPLE_EDGE] - | Reduce Output Operator [RS_105] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 307461 Data size: 441599512 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: decimal(17,2)) - | Group By Operator [GBY_102] - | | aggregations:["sum(VALUE._col0)"] - | | keys:KEY._col0 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 307461 Data size: 441599512 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 27 [SIMPLE_EDGE] - | Reduce Output Operator [RS_101] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 614922 Data size: 883199024 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: decimal(17,2)) - | Group By Operator [GBY_100] - | aggregations:["sum(_col2)"] - | keys:_col4 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 614922 Data size: 883199024 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_99] - | outputColumnNames:["_col4","_col2"] - | Statistics:Num rows: 614922 Data size: 883199024 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_200] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col6 (type: string)","1":"_col0 (type: string)"} - | | outputColumnNames:["_col2","_col4"] - | | Statistics:Num rows: 614922 Data size: 883199024 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 26 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_96] - | | key expressions:_col6 (type: string) - | | Map-reduce partition columns:_col6 (type: string) - | | sort order:+ - | | Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col2 (type: decimal(7,2)), _col4 (type: string) - | | Merge Join Operator [MERGEJOIN_196] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | | outputColumnNames:["_col2","_col4","_col6"] - | | | Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 30 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_94] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col1 (type: string) - | | | Select Operator [SEL_79] - | | | outputColumnNames:["_col0","_col1"] - | | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_186] - | | | predicate:(d_date_sk is not null and d_date is not null) (type: boolean) - | | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_77] - | | | alias:date_dim - | | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 25 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_93] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col2 (type: decimal(7,2)), _col4 (type: string) - | | Merge Join Operator [MERGEJOIN_195] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | | outputColumnNames:["_col0","_col2","_col4"] - | | | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 24 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_90] - | | | key expressions:_col1 (type: int) - | | | Map-reduce partition columns:_col1 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | value expressions:_col0 (type: int), _col2 (type: decimal(7,2)) - | | | Select Operator [SEL_73] - | | | outputColumnNames:["_col0","_col1","_col2"] - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | Filter Operator [FIL_184] - | | | predicate:(ws_item_sk is not null and ws_sold_date_sk is not null) (type: boolean) - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | TableScan [TS_71] - | | | alias:web_sales - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | |<-Map 29 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_91] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: string) - | | Select Operator [SEL_76] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_185] - | | predicate:(i_item_sk is not null and i_item_id is not null) (type: boolean) - | | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_74] - | | alias:item - | | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 32 [SIMPLE_EDGE] - | Reduce Output Operator [RS_97] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 80353 Data size: 89916016 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_197] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: int)","1":"_col1 (type: int)"} - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 80353 Data size: 89916016 Basic stats: COMPLETE Column stats: NONE - | |<-Map 31 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_86] - | | key expressions:_col1 (type: int) - | | Map-reduce partition columns:_col1 (type: int) - | | sort order:+ - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: string) - | | Select Operator [SEL_82] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_187] - | | predicate:(d_week_seq is not null and d_date is not null) (type: boolean) - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_80] - | | alias:date_dim - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | |<-Map 33 [SIMPLE_EDGE] - | Reduce Output Operator [RS_87] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_85] - | outputColumnNames:["_col1"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_188] - | predicate:((d_date = '1998-08-04') and d_week_seq is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_83] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_104] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 84551 Data size: 121438791 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: decimal(17,2)), _col3 (type: decimal(17,2)) - Filter Operator [FIL_69] - predicate:(_col3 BETWEEN (0.9 * UDFToDouble(_col1)) AND (1.1 * UDFToDouble(_col1)) and _col1 BETWEEN (0.9 * UDFToDouble(_col3)) AND (1.1 * UDFToDouble(_col3))) (type: boolean) - Statistics:Num rows: 84551 Data size: 121438791 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_201] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col0","_col1","_col3"] - | Statistics:Num rows: 338207 Data size: 485759473 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 18 [SIMPLE_EDGE] - | Reduce Output Operator [RS_67] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 307461 Data size: 441599512 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: decimal(17,2)) - | Group By Operator [GBY_64] - | | aggregations:["sum(VALUE._col0)"] - | | keys:KEY._col0 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 307461 Data size: 441599512 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 17 [SIMPLE_EDGE] - | Reduce Output Operator [RS_63] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 614922 Data size: 883199024 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: decimal(17,2)) - | Group By Operator [GBY_62] - | aggregations:["sum(_col2)"] - | keys:_col4 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 614922 Data size: 883199024 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_61] - | outputColumnNames:["_col4","_col2"] - | Statistics:Num rows: 614922 Data size: 883199024 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_199] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col6 (type: string)","1":"_col0 (type: string)"} - | | outputColumnNames:["_col2","_col4"] - | | Statistics:Num rows: 614922 Data size: 883199024 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 16 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_58] - | | key expressions:_col6 (type: string) - | | Map-reduce partition columns:_col6 (type: string) - | | sort order:+ - | | Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col2 (type: decimal(7,2)), _col4 (type: string) - | | Merge Join Operator [MERGEJOIN_193] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | | outputColumnNames:["_col2","_col4","_col6"] - | | | Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 20 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_56] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col1 (type: string) - | | | Select Operator [SEL_41] - | | | outputColumnNames:["_col0","_col1"] - | | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_181] - | | | predicate:(d_date_sk is not null and d_date is not null) (type: boolean) - | | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_39] - | | | alias:date_dim - | | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 15 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_55] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col2 (type: decimal(7,2)), _col4 (type: string) - | | Merge Join Operator [MERGEJOIN_192] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | | outputColumnNames:["_col0","_col2","_col4"] - | | | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 14 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_52] - | | | key expressions:_col1 (type: int) - | | | Map-reduce partition columns:_col1 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | value expressions:_col0 (type: int), _col2 (type: decimal(7,2)) - | | | Select Operator [SEL_35] - | | | outputColumnNames:["_col0","_col1","_col2"] - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | Filter Operator [FIL_179] - | | | predicate:(cs_item_sk is not null and cs_sold_date_sk is not null) (type: boolean) - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | TableScan [TS_33] - | | | alias:catalog_sales - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | |<-Map 19 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_53] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: string) - | | Select Operator [SEL_38] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_180] - | | predicate:(i_item_sk is not null and i_item_id is not null) (type: boolean) - | | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_36] - | | alias:item - | | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 22 [SIMPLE_EDGE] - | Reduce Output Operator [RS_59] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 80353 Data size: 89916016 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_194] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: int)","1":"_col1 (type: int)"} - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 80353 Data size: 89916016 Basic stats: COMPLETE Column stats: NONE - | |<-Map 21 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_48] - | | key expressions:_col1 (type: int) - | | Map-reduce partition columns:_col1 (type: int) - | | sort order:+ - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: string) - | | Select Operator [SEL_44] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_182] - | | predicate:(d_week_seq is not null and d_date is not null) (type: boolean) - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_42] - | | alias:date_dim - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | |<-Map 23 [SIMPLE_EDGE] - | Reduce Output Operator [RS_49] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_47] - | outputColumnNames:["_col1"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_183] - | predicate:((d_date = '1998-08-04') and d_week_seq is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_45] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_66] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 307461 Data size: 441599512 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: decimal(17,2)) - Group By Operator [GBY_31] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 307461 Data size: 441599512 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_30] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 614922 Data size: 883199024 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: decimal(17,2)) - Group By Operator [GBY_29] - aggregations:["sum(_col2)"] - keys:_col4 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 614922 Data size: 883199024 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_28] - outputColumnNames:["_col4","_col2"] - Statistics:Num rows: 614922 Data size: 883199024 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_198] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col6 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col2","_col4"] - | Statistics:Num rows: 614922 Data size: 883199024 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 12 [SIMPLE_EDGE] - | Reduce Output Operator [RS_26] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 80353 Data size: 89916016 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_191] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: int)","1":"_col1 (type: int)"} - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 80353 Data size: 89916016 Basic stats: COMPLETE Column stats: NONE - | |<-Map 11 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_15] - | | key expressions:_col1 (type: int) - | | Map-reduce partition columns:_col1 (type: int) - | | sort order:+ - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: string) - | | Select Operator [SEL_11] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_177] - | | predicate:(d_week_seq is not null and d_date is not null) (type: boolean) - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_9] - | | alias:date_dim - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | |<-Map 13 [SIMPLE_EDGE] - | Reduce Output Operator [RS_16] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_14] - | outputColumnNames:["_col1"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_178] - | predicate:((d_date = '1998-08-04') and d_week_seq is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_12] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_25] - key expressions:_col6 (type: string) - Map-reduce partition columns:_col6 (type: string) - sort order:+ - Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: decimal(7,2)), _col4 (type: string) - Merge Join Operator [MERGEJOIN_190] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col2","_col4","_col6"] - | Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_23] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_176] - | predicate:(d_date_sk is not null and d_date is not null) (type: boolean) - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_22] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: decimal(7,2)), _col4 (type: string) - Merge Join Operator [MERGEJOIN_189] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2","_col4"] - | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col2 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_174] - | predicate:(ss_item_sk is not null and ss_sold_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - Reduce Output Operator [RS_20] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_175] - predicate:(i_item_sk is not null and i_item_id is not null) (type: boolean) - Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:item - Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 8 + File Output Operator [FS_112] + Limit [LIM_111] (rows=100 width=1436) + Number of rows:100 + Select Operator [SEL_110] (rows=21137 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] + <-Reducer 7 [SIMPLE_EDGE] + SHUFFLE [RS_109] + Select Operator [SEL_108] (rows=21137 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] + Filter Operator [FIL_107] (rows=21137 width=1436) + predicate:(_col1 BETWEEN (0.9 * UDFToDouble(_col5)) AND (1.1 * UDFToDouble(_col5)) and _col3 BETWEEN (0.9 * UDFToDouble(_col5)) AND (1.1 * UDFToDouble(_col5)) and _col5 BETWEEN (0.9 * UDFToDouble(_col1)) AND (1.1 * UDFToDouble(_col1)) and _col5 BETWEEN (0.9 * UDFToDouble(_col3)) AND (1.1 * UDFToDouble(_col3))) + Merge Join Operator [MERGEJOIN_202] (rows=338207 width=1436) + Output:["_col0","_col1","_col3","_col5"],keys:{"0":"_col0","1":"_col0"} + <-Reducer 28 [SIMPLE_EDGE] + SHUFFLE [RS_105] + PartitionCols:_col0 + Group By Operator [GBY_102] (rows=307461 width=1436) + Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0 + <-Reducer 27 [SIMPLE_EDGE] + SHUFFLE [RS_101] + PartitionCols:_col0 + Group By Operator [GBY_100] (rows=614922 width=1436) + Output:["_col0","_col1"],aggregations:["sum(_col2)"],keys:_col4 + Select Operator [SEL_99] (rows=614922 width=1436) + Output:["_col4","_col2"] + Merge Join Operator [MERGEJOIN_200] (rows=614922 width=1436) + Output:["_col2","_col4"],keys:{"0":"_col6","1":"_col0"} + <-Reducer 26 [SIMPLE_EDGE] + SHUFFLE [RS_96] + PartitionCols:_col6 + Merge Join Operator [MERGEJOIN_196] (rows=559020 width=1436) + Output:["_col2","_col4","_col6"],keys:{"0":"_col0","1":"_col0"} + <-Map 30 [SIMPLE_EDGE] + SHUFFLE [RS_94] + PartitionCols:_col0 + Select Operator [SEL_79] (rows=73049 width=1119) + Output:["_col0","_col1"] + Filter Operator [FIL_186] (rows=73049 width=1119) + predicate:(d_date_sk is not null and d_date is not null) + TableScan [TS_77] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date"] + <-Reducer 25 [SIMPLE_EDGE] + SHUFFLE [RS_93] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_195] (rows=508200 width=1436) + Output:["_col0","_col2","_col4"],keys:{"0":"_col1","1":"_col0"} + <-Map 24 [SIMPLE_EDGE] + SHUFFLE [RS_90] + PartitionCols:_col1 + Select Operator [SEL_73] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_184] (rows=1 width=0) + predicate:(ws_item_sk is not null and ws_sold_date_sk is not null) + TableScan [TS_71] (rows=1 width=0) + default@web_sales,web_sales,Tbl:PARTIAL,Col:NONE,Output:["ws_sold_date_sk","ws_item_sk","ws_ext_sales_price"] + <-Map 29 [SIMPLE_EDGE] + SHUFFLE [RS_91] + PartitionCols:_col0 + Select Operator [SEL_76] (rows=462000 width=1436) + Output:["_col0","_col1"] + Filter Operator [FIL_185] (rows=462000 width=1436) + predicate:(i_item_sk is not null and i_item_id is not null) + TableScan [TS_74] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id"] + <-Reducer 32 [SIMPLE_EDGE] + SHUFFLE [RS_97] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_197] (rows=80353 width=1119) + Output:["_col0"],keys:{"0":"_col1","1":"_col1"} + <-Map 31 [SIMPLE_EDGE] + SHUFFLE [RS_86] + PartitionCols:_col1 + Select Operator [SEL_82] (rows=73049 width=1119) + Output:["_col0","_col1"] + Filter Operator [FIL_187] (rows=73049 width=1119) + predicate:(d_week_seq is not null and d_date is not null) + TableScan [TS_80] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date","d_week_seq"] + <-Map 33 [SIMPLE_EDGE] + SHUFFLE [RS_87] + PartitionCols:_col1 + Select Operator [SEL_85] (rows=36524 width=1119) + Output:["_col1"] + Filter Operator [FIL_188] (rows=36524 width=1119) + predicate:((d_date = '1998-08-04') and d_week_seq is not null) + TableScan [TS_83] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date","d_week_seq"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_104] + PartitionCols:_col0 + Filter Operator [FIL_69] (rows=84551 width=1436) + predicate:(_col3 BETWEEN (0.9 * UDFToDouble(_col1)) AND (1.1 * UDFToDouble(_col1)) and _col1 BETWEEN (0.9 * UDFToDouble(_col3)) AND (1.1 * UDFToDouble(_col3))) + Merge Join Operator [MERGEJOIN_201] (rows=338207 width=1436) + Output:["_col0","_col1","_col3"],keys:{"0":"_col0","1":"_col0"} + <-Reducer 18 [SIMPLE_EDGE] + SHUFFLE [RS_67] + PartitionCols:_col0 + Group By Operator [GBY_64] (rows=307461 width=1436) + Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0 + <-Reducer 17 [SIMPLE_EDGE] + SHUFFLE [RS_63] + PartitionCols:_col0 + Group By Operator [GBY_62] (rows=614922 width=1436) + Output:["_col0","_col1"],aggregations:["sum(_col2)"],keys:_col4 + Select Operator [SEL_61] (rows=614922 width=1436) + Output:["_col4","_col2"] + Merge Join Operator [MERGEJOIN_199] (rows=614922 width=1436) + Output:["_col2","_col4"],keys:{"0":"_col6","1":"_col0"} + <-Reducer 16 [SIMPLE_EDGE] + SHUFFLE [RS_58] + PartitionCols:_col6 + Merge Join Operator [MERGEJOIN_193] (rows=559020 width=1436) + Output:["_col2","_col4","_col6"],keys:{"0":"_col0","1":"_col0"} + <-Map 20 [SIMPLE_EDGE] + SHUFFLE [RS_56] + PartitionCols:_col0 + Select Operator [SEL_41] (rows=73049 width=1119) + Output:["_col0","_col1"] + Filter Operator [FIL_181] (rows=73049 width=1119) + predicate:(d_date_sk is not null and d_date is not null) + TableScan [TS_39] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date"] + <-Reducer 15 [SIMPLE_EDGE] + SHUFFLE [RS_55] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_192] (rows=508200 width=1436) + Output:["_col0","_col2","_col4"],keys:{"0":"_col1","1":"_col0"} + <-Map 14 [SIMPLE_EDGE] + SHUFFLE [RS_52] + PartitionCols:_col1 + Select Operator [SEL_35] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_179] (rows=1 width=0) + predicate:(cs_item_sk is not null and cs_sold_date_sk is not null) + TableScan [TS_33] (rows=1 width=0) + default@catalog_sales,catalog_sales,Tbl:PARTIAL,Col:NONE,Output:["cs_sold_date_sk","cs_item_sk","cs_ext_sales_price"] + <-Map 19 [SIMPLE_EDGE] + SHUFFLE [RS_53] + PartitionCols:_col0 + Select Operator [SEL_38] (rows=462000 width=1436) + Output:["_col0","_col1"] + Filter Operator [FIL_180] (rows=462000 width=1436) + predicate:(i_item_sk is not null and i_item_id is not null) + TableScan [TS_36] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id"] + <-Reducer 22 [SIMPLE_EDGE] + SHUFFLE [RS_59] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_194] (rows=80353 width=1119) + Output:["_col0"],keys:{"0":"_col1","1":"_col1"} + <-Map 21 [SIMPLE_EDGE] + SHUFFLE [RS_48] + PartitionCols:_col1 + Select Operator [SEL_44] (rows=73049 width=1119) + Output:["_col0","_col1"] + Filter Operator [FIL_182] (rows=73049 width=1119) + predicate:(d_week_seq is not null and d_date is not null) + TableScan [TS_42] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date","d_week_seq"] + <-Map 23 [SIMPLE_EDGE] + SHUFFLE [RS_49] + PartitionCols:_col1 + Select Operator [SEL_47] (rows=36524 width=1119) + Output:["_col1"] + Filter Operator [FIL_183] (rows=36524 width=1119) + predicate:((d_date = '1998-08-04') and d_week_seq is not null) + TableScan [TS_45] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date","d_week_seq"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_66] + PartitionCols:_col0 + Group By Operator [GBY_31] (rows=307461 width=1436) + Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0 + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_30] + PartitionCols:_col0 + Group By Operator [GBY_29] (rows=614922 width=1436) + Output:["_col0","_col1"],aggregations:["sum(_col2)"],keys:_col4 + Select Operator [SEL_28] (rows=614922 width=1436) + Output:["_col4","_col2"] + Merge Join Operator [MERGEJOIN_198] (rows=614922 width=1436) + Output:["_col2","_col4"],keys:{"0":"_col6","1":"_col0"} + <-Reducer 12 [SIMPLE_EDGE] + SHUFFLE [RS_26] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_191] (rows=80353 width=1119) + Output:["_col0"],keys:{"0":"_col1","1":"_col1"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col1 + Select Operator [SEL_11] (rows=73049 width=1119) + Output:["_col0","_col1"] + Filter Operator [FIL_177] (rows=73049 width=1119) + predicate:(d_week_seq is not null and d_date is not null) + TableScan [TS_9] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date","d_week_seq"] + <-Map 13 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col1 + Select Operator [SEL_14] (rows=36524 width=1119) + Output:["_col1"] + Filter Operator [FIL_178] (rows=36524 width=1119) + predicate:((d_date = '1998-08-04') and d_week_seq is not null) + TableScan [TS_12] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date","d_week_seq"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col6 + Merge Join Operator [MERGEJOIN_190] (rows=559020 width=1436) + Output:["_col2","_col4","_col6"],keys:{"0":"_col0","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_23] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=73049 width=1119) + Output:["_col0","_col1"] + Filter Operator [FIL_176] (rows=73049 width=1119) + predicate:(d_date_sk is not null and d_date is not null) + TableScan [TS_6] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_22] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_189] (rows=508200 width=1436) + Output:["_col0","_col2","_col4"],keys:{"0":"_col1","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col1 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_174] (rows=1 width=0) + predicate:(ss_item_sk is not null and ss_sold_date_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_ext_sales_price"] + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_20] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=462000 width=1436) + Output:["_col0","_col1"] + Filter Operator [FIL_175] (rows=462000 width=1436) + predicate:(i_item_sk is not null and i_item_id is not null) + TableScan [TS_3] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id"] diff --git a/ql/src/test/results/clientpositive/perf/query64.q.out b/ql/src/test/results/clientpositive/perf/query64.q.out index 68730e7..afa818d 100644 --- a/ql/src/test/results/clientpositive/perf/query64.q.out +++ b/ql/src/test/results/clientpositive/perf/query64.q.out @@ -47,1146 +47,587 @@ Reducer 8 <- Map 27 (SIMPLE_EDGE), Reducer 7 (SIMPLE_EDGE) Reducer 9 <- Map 28 (SIMPLE_EDGE), Reducer 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 20 - File Output Operator [FS_254] - compressed:false - Statistics:Num rows: 122532649 Data size: 105380558466 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_253] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20"] - | Statistics:Num rows: 122532649 Data size: 105380558466 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 19 [SIMPLE_EDGE] - Reduce Output Operator [RS_252] - key expressions:_col0 (type: string), _col1 (type: string), _col20 (type: bigint) - sort order:+++ - Statistics:Num rows: 122532649 Data size: 105380558466 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: string), _col7 (type: string), _col8 (type: string), _col9 (type: string), _col10 (type: string), _col12 (type: bigint), _col13 (type: decimal(17,2)), _col14 (type: decimal(17,2)), _col15 (type: decimal(17,2)), _col16 (type: decimal(17,2)), _col17 (type: decimal(17,2)), _col18 (type: decimal(17,2)), _col19 (type: int) - Select Operator [SEL_251] - outputColumnNames:["_col0","_col1","_col10","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col2","_col20","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] - Statistics:Num rows: 122532649 Data size: 105380558466 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_250] - predicate:(_col34 <= _col15) (type: boolean) - Statistics:Num rows: 122532649 Data size: 105380558466 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_715] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int), _col2 (type: string), _col3 (type: string)","1":"_col1 (type: int), _col2 (type: string), _col3 (type: string)"} - | outputColumnNames:["_col0","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col15","_col16","_col17","_col18","_col31","_col34","_col35","_col36","_col37"] - | Statistics:Num rows: 367597947 Data size: 316141675400 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 18 [SIMPLE_EDGE] - | Reduce Output Operator [RS_247] - | key expressions:_col1 (type: int), _col2 (type: string), _col3 (type: string) - | Map-reduce partition columns:_col1 (type: int), _col2 (type: string), _col3 (type: string) - | sort order:+++ - | Statistics:Num rows: 334179945 Data size: 287401516862 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: string), _col7 (type: string), _col8 (type: string), _col9 (type: string), _col10 (type: string), _col11 (type: string), _col15 (type: bigint), _col16 (type: decimal(17,2)), _col17 (type: decimal(17,2)), _col18 (type: decimal(17,2)) - | Select Operator [SEL_123] - | outputColumnNames:["_col0","_col1","_col10","_col11","_col15","_col16","_col17","_col18","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] - | Statistics:Num rows: 334179945 Data size: 287401516862 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_122] - | | aggregations:["count(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)","sum(VALUE._col3)"] - | | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: string), KEY._col3 (type: string), KEY._col4 (type: string), KEY._col5 (type: string), KEY._col6 (type: string), KEY._col7 (type: string), KEY._col8 (type: string), KEY._col9 (type: string), KEY._col10 (type: string), KEY._col11 (type: string), KEY._col12 (type: int), KEY._col13 (type: int), KEY._col14 (type: int) - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18"] - | | Statistics:Num rows: 334179945 Data size: 287401516862 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 17 [SIMPLE_EDGE] - | Reduce Output Operator [RS_121] - | key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: string), _col7 (type: string), _col8 (type: string), _col9 (type: string), _col10 (type: string), _col11 (type: string), _col12 (type: int), _col13 (type: int), _col14 (type: int) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: string), _col7 (type: string), _col8 (type: string), _col9 (type: string), _col10 (type: string), _col11 (type: string), _col12 (type: int), _col13 (type: int), _col14 (type: int) - | sort order:+++++++++++++++ - | Statistics:Num rows: 668359891 Data size: 574803034585 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col15 (type: bigint), _col16 (type: decimal(17,2)), _col17 (type: decimal(17,2)), _col18 (type: decimal(17,2)) - | Group By Operator [GBY_120] - | aggregations:["count()","sum(_col15)","sum(_col16)","sum(_col17)"] - | keys:_col0 (type: string), _col1 (type: int), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: string), _col7 (type: string), _col8 (type: string), _col9 (type: string), _col10 (type: string), _col11 (type: string), 2000 (type: int), _col13 (type: int), _col14 (type: int) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18"] - | Statistics:Num rows: 668359891 Data size: 574803034585 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_118] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col13","_col14","_col15","_col16","_col17"] - | Statistics:Num rows: 668359891 Data size: 574803034585 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_697] - | | condition map:[{"":"Inner Join 0 to 1"},{"":"Inner Join 0 to 2"}] - | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)","2":"_col0 (type: int)"} - | | outputColumnNames:["_col9","_col10","_col11","_col23","_col25","_col27","_col28","_col39","_col40","_col41","_col42","_col44","_col45","_col46","_col47","_col50","_col53"] - | | Statistics:Num rows: 668359891 Data size: 574803034585 Basic stats: COMPLETE Column stats: NONE - | |<-Map 36 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_115] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 57750 Data size: 82945057 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col3 (type: string) - | | Select Operator [SEL_76] - | | outputColumnNames:["_col0","_col3"] - | | Statistics:Num rows: 57750 Data size: 82945057 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_659] - | | predicate:((((i_color) IN ('maroon', 'burnished', 'dim', 'steel', 'navajo', 'chocolate') and i_current_price BETWEEN 35 AND 45) and i_current_price BETWEEN 36 AND 50) and i_item_sk is not null) (type: boolean) - | | Statistics:Num rows: 57750 Data size: 82945057 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_74] - | | alias:item - | | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 16 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_114] - | | key expressions:_col1 (type: int) - | | Map-reduce partition columns:_col1 (type: int) - | | sort order:+ - | | Statistics:Num rows: 303799944 Data size: 261274100967 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col23 (type: int), _col25 (type: int), _col27 (type: string), _col28 (type: string), _col39 (type: string), _col40 (type: string), _col41 (type: string), _col42 (type: string), _col44 (type: string), _col45 (type: string), _col46 (type: string), _col47 (type: string) - | | Merge Join Operator [MERGEJOIN_695] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col37 (type: int)","1":"_col0 (type: int)"} - | | | outputColumnNames:["_col1","_col9","_col10","_col11","_col23","_col25","_col27","_col28","_col39","_col40","_col41","_col42","_col44","_col45","_col46","_col47"] - | | | Statistics:Num rows: 303799944 Data size: 261274100967 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 35 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_112] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 20 Data size: 240 Basic stats: COMPLETE Column stats: NONE - | | | Select Operator [SEL_73] - | | | outputColumnNames:["_col0"] - | | | Statistics:Num rows: 20 Data size: 240 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_658] - | | | predicate:ib_income_band_sk is not null (type: boolean) - | | | Statistics:Num rows: 20 Data size: 240 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_71] - | | | alias:ib1 - | | | Statistics:Num rows: 20 Data size: 240 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 15 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_111] - | | key expressions:_col37 (type: int) - | | Map-reduce partition columns:_col37 (type: int) - | | sort order:+ - | | Statistics:Num rows: 276181762 Data size: 237521904822 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col23 (type: int), _col25 (type: int), _col27 (type: string), _col28 (type: string), _col39 (type: string), _col40 (type: string), _col41 (type: string), _col42 (type: string), _col44 (type: string), _col45 (type: string), _col46 (type: string), _col47 (type: string) - | | Merge Join Operator [MERGEJOIN_694] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col35 (type: int)","1":"_col0 (type: int)"} - | | | outputColumnNames:["_col1","_col9","_col10","_col11","_col23","_col25","_col27","_col28","_col37","_col39","_col40","_col41","_col42","_col44","_col45","_col46","_col47"] - | | | Statistics:Num rows: 276181762 Data size: 237521904822 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 34 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_109] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 20 Data size: 240 Basic stats: COMPLETE Column stats: NONE - | | | Select Operator [SEL_70] - | | | outputColumnNames:["_col0"] - | | | Statistics:Num rows: 20 Data size: 240 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_657] - | | | predicate:ib_income_band_sk is not null (type: boolean) - | | | Statistics:Num rows: 20 Data size: 240 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_68] - | | | alias:ib1 - | | | Statistics:Num rows: 20 Data size: 240 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 14 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_108] - | | key expressions:_col35 (type: int) - | | Map-reduce partition columns:_col35 (type: int) - | | sort order:+ - | | Statistics:Num rows: 251074324 Data size: 215928999704 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col23 (type: int), _col25 (type: int), _col27 (type: string), _col28 (type: string), _col37 (type: int), _col39 (type: string), _col40 (type: string), _col41 (type: string), _col42 (type: string), _col44 (type: string), _col45 (type: string), _col46 (type: string), _col47 (type: string) - | | Merge Join Operator [MERGEJOIN_693] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col17 (type: int)","1":"_col0 (type: int)"} - | | | outputColumnNames:["_col1","_col9","_col10","_col11","_col23","_col25","_col27","_col28","_col35","_col37","_col39","_col40","_col41","_col42","_col44","_col45","_col46","_col47"] - | | | Statistics:Num rows: 251074324 Data size: 215928999704 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 33 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_106] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string) - | | | Select Operator [SEL_67] - | | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_656] - | | | predicate:ca_address_sk is not null (type: boolean) - | | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_65] - | | | alias:ad1 - | | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 13 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_105] - | | key expressions:_col17 (type: int) - | | Map-reduce partition columns:_col17 (type: int) - | | sort order:+ - | | Statistics:Num rows: 228249381 Data size: 196299086386 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col23 (type: int), _col25 (type: int), _col27 (type: string), _col28 (type: string), _col35 (type: int), _col37 (type: int), _col39 (type: string), _col40 (type: string), _col41 (type: string), _col42 (type: string) - | | Merge Join Operator [MERGEJOIN_692] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col5 (type: int)","1":"_col0 (type: int)"} - | | | outputColumnNames:["_col1","_col9","_col10","_col11","_col17","_col23","_col25","_col27","_col28","_col35","_col37","_col39","_col40","_col41","_col42"] - | | | Statistics:Num rows: 228249381 Data size: 196299086386 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 32 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_103] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string) - | | | Select Operator [SEL_64] - | | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_655] - | | | predicate:ca_address_sk is not null (type: boolean) - | | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_62] - | | | alias:ad1 - | | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 12 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_102] - | | key expressions:_col5 (type: int) - | | Map-reduce partition columns:_col5 (type: int) - | | sort order:+ - | | Statistics:Num rows: 207499433 Data size: 178453711029 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col17 (type: int), _col23 (type: int), _col25 (type: int), _col27 (type: string), _col28 (type: string), _col35 (type: int), _col37 (type: int) - | | Merge Join Operator [MERGEJOIN_691] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col16 (type: int)","1":"_col0 (type: int)"} - | | | outputColumnNames:["_col1","_col5","_col9","_col10","_col11","_col17","_col23","_col25","_col27","_col28","_col35","_col37"] - | | | Statistics:Num rows: 207499433 Data size: 178453711029 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 31 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_100] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col1 (type: int) - | | | Select Operator [SEL_61] - | | | outputColumnNames:["_col0","_col1"] - | | | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_654] - | | | predicate:(hd_demo_sk is not null and hd_income_band_sk is not null) (type: boolean) - | | | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_59] - | | | alias:hd1 - | | | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 11 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_99] - | | key expressions:_col16 (type: int) - | | Map-reduce partition columns:_col16 (type: int) - | | sort order:+ - | | Statistics:Num rows: 188635845 Data size: 162230642874 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: int), _col5 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col17 (type: int), _col23 (type: int), _col25 (type: int), _col27 (type: string), _col28 (type: string), _col35 (type: int) - | | Merge Join Operator [MERGEJOIN_690] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col4 (type: int)","1":"_col0 (type: int)"} - | | | outputColumnNames:["_col1","_col5","_col9","_col10","_col11","_col16","_col17","_col23","_col25","_col27","_col28","_col35"] - | | | Statistics:Num rows: 188635845 Data size: 162230642874 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 30 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_97] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col1 (type: int) - | | | Select Operator [SEL_58] - | | | outputColumnNames:["_col0","_col1"] - | | | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_653] - | | | predicate:(hd_demo_sk is not null and hd_income_band_sk is not null) (type: boolean) - | | | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_56] - | | | alias:hd1 - | | | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 10 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_96] - | | key expressions:_col4 (type: int) - | | Map-reduce partition columns:_col4 (type: int) - | | sort order:+ - | | Statistics:Num rows: 171487129 Data size: 147482399417 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: int), _col5 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col16 (type: int), _col17 (type: int), _col23 (type: int), _col25 (type: int), _col27 (type: string), _col28 (type: string) - | | Merge Join Operator [MERGEJOIN_689] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col7 (type: int)","1":"_col0 (type: int)"} - | | | outputColumnNames:["_col1","_col4","_col5","_col9","_col10","_col11","_col16","_col17","_col23","_col25","_col27","_col28"] - | | | Statistics:Num rows: 171487129 Data size: 147482399417 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 29 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_94] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 2300 Data size: 2713420 Basic stats: COMPLETE Column stats: NONE - | | | Select Operator [SEL_55] - | | | outputColumnNames:["_col0"] - | | | Statistics:Num rows: 2300 Data size: 2713420 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_652] - | | | predicate:p_promo_sk is not null (type: boolean) - | | | Statistics:Num rows: 2300 Data size: 2713420 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_53] - | | | alias:promotion - | | | Statistics:Num rows: 2300 Data size: 2713420 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 9 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_93] - | | key expressions:_col7 (type: int) - | | Map-reduce partition columns:_col7 (type: int) - | | sort order:+ - | | Statistics:Num rows: 155897387 Data size: 134074905655 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: int), _col4 (type: int), _col5 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col16 (type: int), _col17 (type: int), _col23 (type: int), _col25 (type: int), _col27 (type: string), _col28 (type: string) - | | Select Operator [SEL_52] - | | outputColumnNames:["_col1","_col10","_col11","_col16","_col17","_col23","_col25","_col27","_col28","_col4","_col5","_col7","_col9"] - | | Statistics:Num rows: 155897387 Data size: 134074905655 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_51] - | | predicate:(_col30 <> _col32) (type: boolean) - | | Statistics:Num rows: 155897387 Data size: 134074905655 Basic stats: COMPLETE Column stats: NONE - | | Merge Join Operator [MERGEJOIN_688] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col15 (type: int)","1":"_col0 (type: int)"} - | | | outputColumnNames:["_col1","_col4","_col5","_col7","_col9","_col10","_col11","_col16","_col17","_col23","_col25","_col27","_col28","_col30","_col32"] - | | | Statistics:Num rows: 155897387 Data size: 134074905655 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 28 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_49] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col1 (type: string) - | | | Select Operator [SEL_26] - | | | outputColumnNames:["_col0","_col1"] - | | | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_651] - | | | predicate:cd_demo_sk is not null (type: boolean) - | | | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_24] - | | | alias:cd1 - | | | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 8 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_48] - | | key expressions:_col15 (type: int) - | | Map-reduce partition columns:_col15 (type: int) - | | sort order:+ - | | Statistics:Num rows: 141724895 Data size: 121886275227 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: int), _col4 (type: int), _col5 (type: int), _col7 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col16 (type: int), _col17 (type: int), _col23 (type: int), _col25 (type: int), _col27 (type: string), _col28 (type: string), _col30 (type: string) - | | Merge Join Operator [MERGEJOIN_687] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | | | outputColumnNames:["_col1","_col4","_col5","_col7","_col9","_col10","_col11","_col15","_col16","_col17","_col23","_col25","_col27","_col28","_col30"] - | | | Statistics:Num rows: 141724895 Data size: 121886275227 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 27 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_46] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col1 (type: string) - | | | Select Operator [SEL_23] - | | | outputColumnNames:["_col0","_col1"] - | | | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_650] - | | | predicate:cd_demo_sk is not null (type: boolean) - | | | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_21] - | | | alias:cd1 - | | | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 7 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_45] - | | key expressions:_col3 (type: int) - | | Map-reduce partition columns:_col3 (type: int) - | | sort order:+ - | | Statistics:Num rows: 128840811 Data size: 110805702351 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: int), _col4 (type: int), _col5 (type: int), _col7 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col15 (type: int), _col16 (type: int), _col17 (type: int), _col23 (type: int), _col25 (type: int), _col27 (type: string), _col28 (type: string) - | | Merge Join Operator [MERGEJOIN_686] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col6 (type: int)","1":"_col0 (type: int)"} - | | | outputColumnNames:["_col1","_col3","_col4","_col5","_col7","_col9","_col10","_col11","_col15","_col16","_col17","_col23","_col25","_col27","_col28"] - | | | Statistics:Num rows: 128840811 Data size: 110805702351 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 26 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_43] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col1 (type: string), _col2 (type: string) - | | | Select Operator [SEL_20] - | | | outputColumnNames:["_col0","_col1","_col2"] - | | | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_649] - | | | predicate:((s_store_sk is not null and s_zip is not null) and s_store_name is not null) (type: boolean) - | | | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_18] - | | | alias:store - | | | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 6 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_42] - | | key expressions:_col6 (type: int) - | | Map-reduce partition columns:_col6 (type: int) - | | sort order:+ - | | Statistics:Num rows: 117128008 Data size: 100732454500 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: int), _col7 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col15 (type: int), _col16 (type: int), _col17 (type: int), _col23 (type: int), _col25 (type: int) - | | Merge Join Operator [MERGEJOIN_685] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col18 (type: int)","1":"_col0 (type: int)"} - | | | outputColumnNames:["_col1","_col3","_col4","_col5","_col6","_col7","_col9","_col10","_col11","_col15","_col16","_col17","_col23","_col25"] - | | | Statistics:Num rows: 117128008 Data size: 100732454500 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 25 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_40] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col1 (type: int) - | | | Select Operator [SEL_17] - | | | outputColumnNames:["_col0","_col1"] - | | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_648] - | | | predicate:d_date_sk is not null (type: boolean) - | | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_15] - | | | alias:d1 - | | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 5 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_39] - | | key expressions:_col18 (type: int) - | | Map-reduce partition columns:_col18 (type: int) - | | sort order:+ - | | Statistics:Num rows: 106480005 Data size: 91574956652 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: int), _col6 (type: int), _col7 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col15 (type: int), _col16 (type: int), _col17 (type: int), _col23 (type: int) - | | Merge Join Operator [MERGEJOIN_684] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col19 (type: int)","1":"_col0 (type: int)"} - | | | outputColumnNames:["_col1","_col3","_col4","_col5","_col6","_col7","_col9","_col10","_col11","_col15","_col16","_col17","_col18","_col23"] - | | | Statistics:Num rows: 106480005 Data size: 91574956652 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 24 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_37] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col1 (type: int) - | | | Select Operator [SEL_14] - | | | outputColumnNames:["_col0","_col1"] - | | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_647] - | | | predicate:d_date_sk is not null (type: boolean) - | | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_12] - | | | alias:d1 - | | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 4 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_36] - | | key expressions:_col19 (type: int) - | | Map-reduce partition columns:_col19 (type: int) - | | sort order:+ - | | Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: int), _col6 (type: int), _col7 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col15 (type: int), _col16 (type: int), _col17 (type: int), _col18 (type: int) - | | Merge Join Operator [MERGEJOIN_683] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | | outputColumnNames:["_col1","_col3","_col4","_col5","_col6","_col7","_col9","_col10","_col11","_col15","_col16","_col17","_col18","_col19"] - | | | Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 23 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_34] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | | Select Operator [SEL_11] - | | | outputColumnNames:["_col0"] - | | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_646] - | | | predicate:((d_year = 2000) and d_date_sk is not null) (type: boolean) - | | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_9] - | | | alias:d1 - | | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 3 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_33] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: int), _col6 (type: int), _col7 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col15 (type: int), _col16 (type: int), _col17 (type: int), _col18 (type: int), _col19 (type: int) - | | Merge Join Operator [MERGEJOIN_682] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | | | outputColumnNames:["_col0","_col1","_col3","_col4","_col5","_col6","_col7","_col9","_col10","_col11","_col15","_col16","_col17","_col18","_col19"] - | | | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 22 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_31] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: int) - | | | Select Operator [SEL_8] - | | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | | | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_645] - | | | predicate:(((((c_customer_sk is not null and c_first_sales_date_sk is not null) and c_first_shipto_date_sk is not null) and c_current_cdemo_sk is not null) and c_current_hdemo_sk is not null) and c_current_addr_sk is not null) (type: boolean) - | | | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_6] - | | | alias:customer - | | | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 2 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_30] - | | key expressions:_col2 (type: int) - | | Map-reduce partition columns:_col2 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col0 (type: int), _col1 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: int), _col6 (type: int), _col7 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)) - | | Merge Join Operator [MERGEJOIN_681] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col1 (type: int), _col8 (type: int)","1":"_col0 (type: int), _col1 (type: int)"} - | | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col9","_col10","_col11"] - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | |<-Map 1 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_27] - | | | key expressions:_col1 (type: int), _col8 (type: int) - | | | Map-reduce partition columns:_col1 (type: int), _col8 (type: int) - | | | sort order:++ - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | value expressions:_col0 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: int), _col6 (type: int), _col7 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)) - | | | Select Operator [SEL_2] - | | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11"] - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | Filter Operator [FIL_643] - | | | predicate:((((((((ss_ticket_number is not null and ss_item_sk is not null) and ss_customer_sk is not null) and ss_sold_date_sk is not null) and ss_store_sk is not null) and ss_cdemo_sk is not null) and ss_promo_sk is not null) and ss_hdemo_sk is not null) and ss_addr_sk is not null) (type: boolean) - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | TableScan [TS_0] - | | | alias:store_sales - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | |<-Map 21 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_28] - | | key expressions:_col0 (type: int), _col1 (type: int) - | | Map-reduce partition columns:_col0 (type: int), _col1 (type: int) - | | sort order:++ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Select Operator [SEL_5] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_644] - | | predicate:(sr_ticket_number is not null and sr_item_sk is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_3] - | | alias:store_returns - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Reducer 39 [SIMPLE_EDGE] - | Reduce Output Operator [RS_116] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Select Operator [SEL_92] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_91] - | predicate:(_col1 > (2 * _col2)) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Group By Operator [GBY_90] - | | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] - | | keys:KEY._col0 (type: int) - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Reducer 38 [SIMPLE_EDGE] - | Reduce Output Operator [RS_89] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col1 (type: decimal(17,2)), _col2 (type: decimal(19,2)) - | Group By Operator [GBY_88] - | aggregations:["sum(_col1)","sum(_col2)"] - | keys:_col0 (type: int) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Select Operator [SEL_86] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Merge Join Operator [MERGEJOIN_696] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int), _col1 (type: int)","1":"_col0 (type: int), _col1 (type: int)"} - | | outputColumnNames:["_col0","_col2","_col5","_col6","_col7"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 37 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_83] - | | key expressions:_col0 (type: int), _col1 (type: int) - | | Map-reduce partition columns:_col0 (type: int), _col1 (type: int) - | | sort order:++ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col2 (type: decimal(7,2)) - | | Select Operator [SEL_79] - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_660] - | | predicate:(cs_item_sk is not null and cs_order_number is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_77] - | | alias:catalog_sales - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 40 [SIMPLE_EDGE] - | Reduce Output Operator [RS_84] - | key expressions:_col0 (type: int), _col1 (type: int) - | Map-reduce partition columns:_col0 (type: int), _col1 (type: int) - | sort order:++ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col2 (type: decimal(7,2)), _col3 (type: decimal(7,2)), _col4 (type: decimal(7,2)) - | Select Operator [SEL_82] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_661] - | predicate:(cr_item_sk is not null and cr_order_number is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_80] - | alias:catalog_returns - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Reducer 58 [SIMPLE_EDGE] - Reduce Output Operator [RS_248] - key expressions:_col1 (type: int), _col2 (type: string), _col3 (type: string) - Map-reduce partition columns:_col1 (type: int), _col2 (type: string), _col3 (type: string) - sort order:+++ - Statistics:Num rows: 334179945 Data size: 287401516862 Basic stats: COMPLETE Column stats: NONE - value expressions:_col12 (type: int), _col15 (type: bigint), _col16 (type: decimal(17,2)), _col17 (type: decimal(17,2)), _col18 (type: decimal(17,2)) - Select Operator [SEL_246] - outputColumnNames:["_col1","_col12","_col15","_col16","_col17","_col18","_col2","_col3"] - Statistics:Num rows: 334179945 Data size: 287401516862 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_245] - | aggregations:["count(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)","sum(VALUE._col3)"] - | keys:KEY._col0 (type: int), KEY._col1 (type: int), KEY._col2 (type: int), KEY._col3 (type: string), KEY._col4 (type: string), KEY._col5 (type: string), KEY._col6 (type: string), KEY._col7 (type: string), KEY._col8 (type: string), KEY._col9 (type: string), KEY._col10 (type: string), KEY._col11 (type: string), KEY._col12 (type: string), KEY._col13 (type: int), KEY._col14 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18"] - | Statistics:Num rows: 334179945 Data size: 287401516862 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 57 [SIMPLE_EDGE] - Reduce Output Operator [RS_244] - key expressions:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: string), _col7 (type: string), _col8 (type: string), _col9 (type: string), _col10 (type: string), _col11 (type: string), _col12 (type: string), _col13 (type: int), _col14 (type: string) - Map-reduce partition columns:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: string), _col7 (type: string), _col8 (type: string), _col9 (type: string), _col10 (type: string), _col11 (type: string), _col12 (type: string), _col13 (type: int), _col14 (type: string) - sort order:+++++++++++++++ - Statistics:Num rows: 668359891 Data size: 574803034585 Basic stats: COMPLETE Column stats: NONE - value expressions:_col15 (type: bigint), _col16 (type: decimal(17,2)), _col17 (type: decimal(17,2)), _col18 (type: decimal(17,2)) - Group By Operator [GBY_243] - aggregations:["count()","sum(_col9)","sum(_col10)","sum(_col11)"] - keys:_col21 (type: int), _col23 (type: int), _col25 (type: int), _col27 (type: string), _col28 (type: string), _col39 (type: string), _col40 (type: string), _col41 (type: string), _col42 (type: string), _col44 (type: string), _col45 (type: string), _col46 (type: string), _col47 (type: string), _col50 (type: int), _col53 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18"] - Statistics:Num rows: 668359891 Data size: 574803034585 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_242] - outputColumnNames:["_col21","_col23","_col25","_col27","_col28","_col39","_col40","_col41","_col42","_col44","_col45","_col46","_col47","_col50","_col53","_col9","_col10","_col11"] - Statistics:Num rows: 668359891 Data size: 574803034585 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_714] - | condition map:[{"":"Inner Join 0 to 1"},{"":"Inner Join 0 to 2"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)","2":"_col0 (type: int)"} - | outputColumnNames:["_col9","_col10","_col11","_col23","_col25","_col27","_col28","_col39","_col40","_col41","_col42","_col44","_col45","_col46","_col47","_col50","_col53"] - | Statistics:Num rows: 668359891 Data size: 574803034585 Basic stats: COMPLETE Column stats: NONE - |<-Map 74 [SIMPLE_EDGE] - | Reduce Output Operator [RS_239] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 57750 Data size: 82945057 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: string) - | Select Operator [SEL_200] - | outputColumnNames:["_col0","_col3"] - | Statistics:Num rows: 57750 Data size: 82945057 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_678] - | predicate:((((i_color) IN ('maroon', 'burnished', 'dim', 'steel', 'navajo', 'chocolate') and i_current_price BETWEEN 35 AND 45) and i_current_price BETWEEN 36 AND 50) and i_item_sk is not null) (type: boolean) - | Statistics:Num rows: 57750 Data size: 82945057 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_198] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 56 [SIMPLE_EDGE] - | Reduce Output Operator [RS_238] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 303799944 Data size: 261274100967 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col23 (type: int), _col25 (type: int), _col27 (type: string), _col28 (type: string), _col39 (type: string), _col40 (type: string), _col41 (type: string), _col42 (type: string), _col44 (type: string), _col45 (type: string), _col46 (type: string), _col47 (type: string) - | Merge Join Operator [MERGEJOIN_712] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col37 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col9","_col10","_col11","_col23","_col25","_col27","_col28","_col39","_col40","_col41","_col42","_col44","_col45","_col46","_col47"] - | | Statistics:Num rows: 303799944 Data size: 261274100967 Basic stats: COMPLETE Column stats: NONE - | |<-Map 73 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_236] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 20 Data size: 240 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_197] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 20 Data size: 240 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_677] - | | predicate:ib_income_band_sk is not null (type: boolean) - | | Statistics:Num rows: 20 Data size: 240 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_195] - | | alias:ib1 - | | Statistics:Num rows: 20 Data size: 240 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 55 [SIMPLE_EDGE] - | Reduce Output Operator [RS_235] - | key expressions:_col37 (type: int) - | Map-reduce partition columns:_col37 (type: int) - | sort order:+ - | Statistics:Num rows: 276181762 Data size: 237521904822 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col23 (type: int), _col25 (type: int), _col27 (type: string), _col28 (type: string), _col39 (type: string), _col40 (type: string), _col41 (type: string), _col42 (type: string), _col44 (type: string), _col45 (type: string), _col46 (type: string), _col47 (type: string) - | Merge Join Operator [MERGEJOIN_711] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col35 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col9","_col10","_col11","_col23","_col25","_col27","_col28","_col37","_col39","_col40","_col41","_col42","_col44","_col45","_col46","_col47"] - | | Statistics:Num rows: 276181762 Data size: 237521904822 Basic stats: COMPLETE Column stats: NONE - | |<-Map 72 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_233] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 20 Data size: 240 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_194] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 20 Data size: 240 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_676] - | | predicate:ib_income_band_sk is not null (type: boolean) - | | Statistics:Num rows: 20 Data size: 240 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_192] - | | alias:ib1 - | | Statistics:Num rows: 20 Data size: 240 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 54 [SIMPLE_EDGE] - | Reduce Output Operator [RS_232] - | key expressions:_col35 (type: int) - | Map-reduce partition columns:_col35 (type: int) - | sort order:+ - | Statistics:Num rows: 251074324 Data size: 215928999704 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col23 (type: int), _col25 (type: int), _col27 (type: string), _col28 (type: string), _col37 (type: int), _col39 (type: string), _col40 (type: string), _col41 (type: string), _col42 (type: string), _col44 (type: string), _col45 (type: string), _col46 (type: string), _col47 (type: string) - | Merge Join Operator [MERGEJOIN_710] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col17 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col9","_col10","_col11","_col23","_col25","_col27","_col28","_col35","_col37","_col39","_col40","_col41","_col42","_col44","_col45","_col46","_col47"] - | | Statistics:Num rows: 251074324 Data size: 215928999704 Basic stats: COMPLETE Column stats: NONE - | |<-Map 71 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_230] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string) - | | Select Operator [SEL_191] - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_675] - | | predicate:ca_address_sk is not null (type: boolean) - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_189] - | | alias:ad1 - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 53 [SIMPLE_EDGE] - | Reduce Output Operator [RS_229] - | key expressions:_col17 (type: int) - | Map-reduce partition columns:_col17 (type: int) - | sort order:+ - | Statistics:Num rows: 228249381 Data size: 196299086386 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col23 (type: int), _col25 (type: int), _col27 (type: string), _col28 (type: string), _col35 (type: int), _col37 (type: int), _col39 (type: string), _col40 (type: string), _col41 (type: string), _col42 (type: string) - | Merge Join Operator [MERGEJOIN_709] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col5 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col9","_col10","_col11","_col17","_col23","_col25","_col27","_col28","_col35","_col37","_col39","_col40","_col41","_col42"] - | | Statistics:Num rows: 228249381 Data size: 196299086386 Basic stats: COMPLETE Column stats: NONE - | |<-Map 70 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_227] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string) - | | Select Operator [SEL_188] - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_674] - | | predicate:ca_address_sk is not null (type: boolean) - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_186] - | | alias:ad1 - | | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 52 [SIMPLE_EDGE] - | Reduce Output Operator [RS_226] - | key expressions:_col5 (type: int) - | Map-reduce partition columns:_col5 (type: int) - | sort order:+ - | Statistics:Num rows: 207499433 Data size: 178453711029 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col17 (type: int), _col23 (type: int), _col25 (type: int), _col27 (type: string), _col28 (type: string), _col35 (type: int), _col37 (type: int) - | Merge Join Operator [MERGEJOIN_708] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col16 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col5","_col9","_col10","_col11","_col17","_col23","_col25","_col27","_col28","_col35","_col37"] - | | Statistics:Num rows: 207499433 Data size: 178453711029 Basic stats: COMPLETE Column stats: NONE - | |<-Map 69 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_224] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: int) - | | Select Operator [SEL_185] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_673] - | | predicate:(hd_demo_sk is not null and hd_income_band_sk is not null) (type: boolean) - | | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_183] - | | alias:hd1 - | | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 51 [SIMPLE_EDGE] - | Reduce Output Operator [RS_223] - | key expressions:_col16 (type: int) - | Map-reduce partition columns:_col16 (type: int) - | sort order:+ - | Statistics:Num rows: 188635845 Data size: 162230642874 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col5 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col17 (type: int), _col23 (type: int), _col25 (type: int), _col27 (type: string), _col28 (type: string), _col35 (type: int) - | Merge Join Operator [MERGEJOIN_707] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col4 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col5","_col9","_col10","_col11","_col16","_col17","_col23","_col25","_col27","_col28","_col35"] - | | Statistics:Num rows: 188635845 Data size: 162230642874 Basic stats: COMPLETE Column stats: NONE - | |<-Map 68 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_221] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: int) - | | Select Operator [SEL_182] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_672] - | | predicate:(hd_demo_sk is not null and hd_income_band_sk is not null) (type: boolean) - | | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_180] - | | alias:hd1 - | | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 50 [SIMPLE_EDGE] - | Reduce Output Operator [RS_220] - | key expressions:_col4 (type: int) - | Map-reduce partition columns:_col4 (type: int) - | sort order:+ - | Statistics:Num rows: 171487129 Data size: 147482399417 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col5 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col16 (type: int), _col17 (type: int), _col23 (type: int), _col25 (type: int), _col27 (type: string), _col28 (type: string) - | Merge Join Operator [MERGEJOIN_706] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col7 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col4","_col5","_col9","_col10","_col11","_col16","_col17","_col23","_col25","_col27","_col28"] - | | Statistics:Num rows: 171487129 Data size: 147482399417 Basic stats: COMPLETE Column stats: NONE - | |<-Map 67 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_218] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 2300 Data size: 2713420 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_179] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 2300 Data size: 2713420 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_671] - | | predicate:p_promo_sk is not null (type: boolean) - | | Statistics:Num rows: 2300 Data size: 2713420 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_177] - | | alias:promotion - | | Statistics:Num rows: 2300 Data size: 2713420 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 49 [SIMPLE_EDGE] - | Reduce Output Operator [RS_217] - | key expressions:_col7 (type: int) - | Map-reduce partition columns:_col7 (type: int) - | sort order:+ - | Statistics:Num rows: 155897387 Data size: 134074905655 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col4 (type: int), _col5 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col16 (type: int), _col17 (type: int), _col23 (type: int), _col25 (type: int), _col27 (type: string), _col28 (type: string) - | Select Operator [SEL_176] - | outputColumnNames:["_col1","_col10","_col11","_col16","_col17","_col23","_col25","_col27","_col28","_col4","_col5","_col7","_col9"] - | Statistics:Num rows: 155897387 Data size: 134074905655 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_175] - | predicate:(_col30 <> _col32) (type: boolean) - | Statistics:Num rows: 155897387 Data size: 134074905655 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_705] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col15 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col4","_col5","_col7","_col9","_col10","_col11","_col16","_col17","_col23","_col25","_col27","_col28","_col30","_col32"] - | | Statistics:Num rows: 155897387 Data size: 134074905655 Basic stats: COMPLETE Column stats: NONE - | |<-Map 66 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_173] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: string) - | | Select Operator [SEL_150] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_670] - | | predicate:cd_demo_sk is not null (type: boolean) - | | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_148] - | | alias:cd1 - | | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 48 [SIMPLE_EDGE] - | Reduce Output Operator [RS_172] - | key expressions:_col15 (type: int) - | Map-reduce partition columns:_col15 (type: int) - | sort order:+ - | Statistics:Num rows: 141724895 Data size: 121886275227 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col4 (type: int), _col5 (type: int), _col7 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col16 (type: int), _col17 (type: int), _col23 (type: int), _col25 (type: int), _col27 (type: string), _col28 (type: string), _col30 (type: string) - | Merge Join Operator [MERGEJOIN_704] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col4","_col5","_col7","_col9","_col10","_col11","_col15","_col16","_col17","_col23","_col25","_col27","_col28","_col30"] - | | Statistics:Num rows: 141724895 Data size: 121886275227 Basic stats: COMPLETE Column stats: NONE - | |<-Map 65 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_170] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: string) - | | Select Operator [SEL_147] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_669] - | | predicate:cd_demo_sk is not null (type: boolean) - | | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_145] - | | alias:cd1 - | | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 47 [SIMPLE_EDGE] - | Reduce Output Operator [RS_169] - | key expressions:_col3 (type: int) - | Map-reduce partition columns:_col3 (type: int) - | sort order:+ - | Statistics:Num rows: 128840811 Data size: 110805702351 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col4 (type: int), _col5 (type: int), _col7 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col15 (type: int), _col16 (type: int), _col17 (type: int), _col23 (type: int), _col25 (type: int), _col27 (type: string), _col28 (type: string) - | Merge Join Operator [MERGEJOIN_703] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col6 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col3","_col4","_col5","_col7","_col9","_col10","_col11","_col15","_col16","_col17","_col23","_col25","_col27","_col28"] - | | Statistics:Num rows: 128840811 Data size: 110805702351 Basic stats: COMPLETE Column stats: NONE - | |<-Map 64 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_167] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: string), _col2 (type: string) - | | Select Operator [SEL_144] - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_668] - | | predicate:((s_store_sk is not null and s_zip is not null) and s_store_name is not null) (type: boolean) - | | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_142] - | | alias:store - | | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 46 [SIMPLE_EDGE] - | Reduce Output Operator [RS_166] - | key expressions:_col6 (type: int) - | Map-reduce partition columns:_col6 (type: int) - | sort order:+ - | Statistics:Num rows: 117128008 Data size: 100732454500 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: int), _col7 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col15 (type: int), _col16 (type: int), _col17 (type: int), _col23 (type: int), _col25 (type: int) - | Merge Join Operator [MERGEJOIN_702] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col18 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col3","_col4","_col5","_col6","_col7","_col9","_col10","_col11","_col15","_col16","_col17","_col23","_col25"] - | | Statistics:Num rows: 117128008 Data size: 100732454500 Basic stats: COMPLETE Column stats: NONE - | |<-Map 63 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_164] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: int) - | | Select Operator [SEL_141] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_667] - | | predicate:d_date_sk is not null (type: boolean) - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_139] - | | alias:d1 - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 45 [SIMPLE_EDGE] - | Reduce Output Operator [RS_163] - | key expressions:_col18 (type: int) - | Map-reduce partition columns:_col18 (type: int) - | sort order:+ - | Statistics:Num rows: 106480005 Data size: 91574956652 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: int), _col6 (type: int), _col7 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col15 (type: int), _col16 (type: int), _col17 (type: int), _col23 (type: int) - | Merge Join Operator [MERGEJOIN_701] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col19 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col3","_col4","_col5","_col6","_col7","_col9","_col10","_col11","_col15","_col16","_col17","_col18","_col23"] - | | Statistics:Num rows: 106480005 Data size: 91574956652 Basic stats: COMPLETE Column stats: NONE - | |<-Map 62 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_161] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: int) - | | Select Operator [SEL_138] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_666] - | | predicate:d_date_sk is not null (type: boolean) - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_136] - | | alias:d1 - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 44 [SIMPLE_EDGE] - | Reduce Output Operator [RS_160] - | key expressions:_col19 (type: int) - | Map-reduce partition columns:_col19 (type: int) - | sort order:+ - | Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: int), _col6 (type: int), _col7 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col15 (type: int), _col16 (type: int), _col17 (type: int), _col18 (type: int) - | Merge Join Operator [MERGEJOIN_700] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col3","_col4","_col5","_col6","_col7","_col9","_col10","_col11","_col15","_col16","_col17","_col18","_col19"] - | | Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - | |<-Map 61 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_158] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_135] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_665] - | | predicate:((d_year = 2001) and d_date_sk is not null) (type: boolean) - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_133] - | | alias:d1 - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 43 [SIMPLE_EDGE] - | Reduce Output Operator [RS_157] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: int), _col6 (type: int), _col7 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)), _col15 (type: int), _col16 (type: int), _col17 (type: int), _col18 (type: int), _col19 (type: int) - | Merge Join Operator [MERGEJOIN_699] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col0","_col1","_col3","_col4","_col5","_col6","_col7","_col9","_col10","_col11","_col15","_col16","_col17","_col18","_col19"] - | | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - | |<-Map 60 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_155] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: int) - | | Select Operator [SEL_132] - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_664] - | | predicate:(((((c_customer_sk is not null and c_first_sales_date_sk is not null) and c_first_shipto_date_sk is not null) and c_current_cdemo_sk is not null) and c_current_hdemo_sk is not null) and c_current_addr_sk is not null) (type: boolean) - | | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_130] - | | alias:customer - | | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 42 [SIMPLE_EDGE] - | Reduce Output Operator [RS_154] - | key expressions:_col2 (type: int) - | Map-reduce partition columns:_col2 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col1 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: int), _col6 (type: int), _col7 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)) - | Merge Join Operator [MERGEJOIN_698] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: int), _col8 (type: int)","1":"_col0 (type: int), _col1 (type: int)"} - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col9","_col10","_col11"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 41 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_151] - | | key expressions:_col1 (type: int), _col8 (type: int) - | | Map-reduce partition columns:_col1 (type: int), _col8 (type: int) - | | sort order:++ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col0 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: int), _col6 (type: int), _col7 (type: int), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: decimal(7,2)) - | | Select Operator [SEL_126] - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_662] - | | predicate:((((((((ss_ticket_number is not null and ss_item_sk is not null) and ss_customer_sk is not null) and ss_sold_date_sk is not null) and ss_store_sk is not null) and ss_cdemo_sk is not null) and ss_promo_sk is not null) and ss_hdemo_sk is not null) and ss_addr_sk is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_124] - | | alias:store_sales - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 59 [SIMPLE_EDGE] - | Reduce Output Operator [RS_152] - | key expressions:_col0 (type: int), _col1 (type: int) - | Map-reduce partition columns:_col0 (type: int), _col1 (type: int) - | sort order:++ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Select Operator [SEL_129] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_663] - | predicate:(sr_ticket_number is not null and sr_item_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_127] - | alias:store_returns - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Reducer 77 [SIMPLE_EDGE] - Reduce Output Operator [RS_240] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Select Operator [SEL_216] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_215] - predicate:(_col1 > (2 * _col2)) (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Group By Operator [GBY_214] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] - | keys:KEY._col0 (type: int) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Reducer 76 [SIMPLE_EDGE] - Reduce Output Operator [RS_213] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col1 (type: decimal(17,2)), _col2 (type: decimal(19,2)) - Group By Operator [GBY_212] - aggregations:["sum(_col1)","sum(_col2)"] - keys:_col0 (type: int) - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Select Operator [SEL_210] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Merge Join Operator [MERGEJOIN_713] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int), _col1 (type: int)","1":"_col0 (type: int), _col1 (type: int)"} - | outputColumnNames:["_col0","_col2","_col5","_col6","_col7"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 75 [SIMPLE_EDGE] - | Reduce Output Operator [RS_207] - | key expressions:_col0 (type: int), _col1 (type: int) - | Map-reduce partition columns:_col0 (type: int), _col1 (type: int) - | sort order:++ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col2 (type: decimal(7,2)) - | Select Operator [SEL_203] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_679] - | predicate:(cs_item_sk is not null and cs_order_number is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_201] - | alias:catalog_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 78 [SIMPLE_EDGE] - Reduce Output Operator [RS_208] - key expressions:_col0 (type: int), _col1 (type: int) - Map-reduce partition columns:_col0 (type: int), _col1 (type: int) - sort order:++ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col2 (type: decimal(7,2)), _col3 (type: decimal(7,2)), _col4 (type: decimal(7,2)) - Select Operator [SEL_206] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_680] - predicate:(cr_item_sk is not null and cr_order_number is not null) (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_204] - alias:catalog_returns - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 20 + File Output Operator [FS_254] + Select Operator [SEL_253] (rows=122532649 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20"] + <-Reducer 19 [SIMPLE_EDGE] + SHUFFLE [RS_252] + Select Operator [SEL_251] (rows=122532649 width=860) + Output:["_col0","_col1","_col10","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col2","_col20","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] + Filter Operator [FIL_250] (rows=122532649 width=860) + predicate:(_col34 <= _col15) + Merge Join Operator [MERGEJOIN_715] (rows=367597947 width=860) + Output:["_col0","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col15","_col16","_col17","_col18","_col31","_col34","_col35","_col36","_col37"],keys:{"0":"_col1, _col2, _col3","1":"_col1, _col2, _col3"} + <-Reducer 18 [SIMPLE_EDGE] + SHUFFLE [RS_247] + PartitionCols:_col1, _col2, _col3 + Select Operator [SEL_123] (rows=334179945 width=860) + Output:["_col0","_col1","_col10","_col11","_col15","_col16","_col17","_col18","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] + Group By Operator [GBY_122] (rows=334179945 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18"],aggregations:["count(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)","sum(VALUE._col3)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4, KEY._col5, KEY._col6, KEY._col7, KEY._col8, KEY._col9, KEY._col10, KEY._col11, KEY._col12, KEY._col13, KEY._col14 + <-Reducer 17 [SIMPLE_EDGE] + SHUFFLE [RS_121] + PartitionCols:_col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14 + Group By Operator [GBY_120] (rows=668359891 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18"],aggregations:["count()","sum(_col15)","sum(_col16)","sum(_col17)"],keys:_col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, 2000, _col13, _col14 + Select Operator [SEL_118] (rows=668359891 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col13","_col14","_col15","_col16","_col17"] + Merge Join Operator [MERGEJOIN_697] (rows=668359891 width=860) + Output:["_col9","_col10","_col11","_col23","_col25","_col27","_col28","_col39","_col40","_col41","_col42","_col44","_col45","_col46","_col47","_col50","_col53"],keys:{"0":"_col1","1":"_col0","2":"_col0"} + <-Map 36 [SIMPLE_EDGE] + SHUFFLE [RS_115] + PartitionCols:_col0 + Select Operator [SEL_76] (rows=57750 width=1436) + Output:["_col0","_col3"] + Filter Operator [FIL_659] (rows=57750 width=1436) + predicate:((((i_color) IN ('maroon', 'burnished', 'dim', 'steel', 'navajo', 'chocolate') and i_current_price BETWEEN 35 AND 45) and i_current_price BETWEEN 36 AND 50) and i_item_sk is not null) + TableScan [TS_74] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_current_price","i_color","i_product_name"] + <-Reducer 16 [SIMPLE_EDGE] + SHUFFLE [RS_114] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_695] (rows=303799944 width=860) + Output:["_col1","_col9","_col10","_col11","_col23","_col25","_col27","_col28","_col39","_col40","_col41","_col42","_col44","_col45","_col46","_col47"],keys:{"0":"_col37","1":"_col0"} + <-Map 35 [SIMPLE_EDGE] + SHUFFLE [RS_112] + PartitionCols:_col0 + Select Operator [SEL_73] (rows=20 width=12) + Output:["_col0"] + Filter Operator [FIL_658] (rows=20 width=12) + predicate:ib_income_band_sk is not null + TableScan [TS_71] (rows=20 width=12) + default@income_band,ib1,Tbl:COMPLETE,Col:NONE,Output:["ib_income_band_sk"] + <-Reducer 15 [SIMPLE_EDGE] + SHUFFLE [RS_111] + PartitionCols:_col37 + Merge Join Operator [MERGEJOIN_694] (rows=276181762 width=860) + Output:["_col1","_col9","_col10","_col11","_col23","_col25","_col27","_col28","_col37","_col39","_col40","_col41","_col42","_col44","_col45","_col46","_col47"],keys:{"0":"_col35","1":"_col0"} + <-Map 34 [SIMPLE_EDGE] + SHUFFLE [RS_109] + PartitionCols:_col0 + Select Operator [SEL_70] (rows=20 width=12) + Output:["_col0"] + Filter Operator [FIL_657] (rows=20 width=12) + predicate:ib_income_band_sk is not null + TableScan [TS_68] (rows=20 width=12) + default@income_band,ib1,Tbl:COMPLETE,Col:NONE,Output:["ib_income_band_sk"] + <-Reducer 14 [SIMPLE_EDGE] + SHUFFLE [RS_108] + PartitionCols:_col35 + Merge Join Operator [MERGEJOIN_693] (rows=251074324 width=860) + Output:["_col1","_col9","_col10","_col11","_col23","_col25","_col27","_col28","_col35","_col37","_col39","_col40","_col41","_col42","_col44","_col45","_col46","_col47"],keys:{"0":"_col17","1":"_col0"} + <-Map 33 [SIMPLE_EDGE] + SHUFFLE [RS_106] + PartitionCols:_col0 + Select Operator [SEL_67] (rows=40000000 width=1014) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_656] (rows=40000000 width=1014) + predicate:ca_address_sk is not null + TableScan [TS_65] (rows=40000000 width=1014) + default@customer_address,ad1,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_street_number","ca_street_name","ca_city","ca_zip"] + <-Reducer 13 [SIMPLE_EDGE] + SHUFFLE [RS_105] + PartitionCols:_col17 + Merge Join Operator [MERGEJOIN_692] (rows=228249381 width=860) + Output:["_col1","_col9","_col10","_col11","_col17","_col23","_col25","_col27","_col28","_col35","_col37","_col39","_col40","_col41","_col42"],keys:{"0":"_col5","1":"_col0"} + <-Map 32 [SIMPLE_EDGE] + SHUFFLE [RS_103] + PartitionCols:_col0 + Select Operator [SEL_64] (rows=40000000 width=1014) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_655] (rows=40000000 width=1014) + predicate:ca_address_sk is not null + TableScan [TS_62] (rows=40000000 width=1014) + default@customer_address,ad1,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_street_number","ca_street_name","ca_city","ca_zip"] + <-Reducer 12 [SIMPLE_EDGE] + SHUFFLE [RS_102] + PartitionCols:_col5 + Merge Join Operator [MERGEJOIN_691] (rows=207499433 width=860) + Output:["_col1","_col5","_col9","_col10","_col11","_col17","_col23","_col25","_col27","_col28","_col35","_col37"],keys:{"0":"_col16","1":"_col0"} + <-Map 31 [SIMPLE_EDGE] + SHUFFLE [RS_100] + PartitionCols:_col0 + Select Operator [SEL_61] (rows=7200 width=107) + Output:["_col0","_col1"] + Filter Operator [FIL_654] (rows=7200 width=107) + predicate:(hd_demo_sk is not null and hd_income_band_sk is not null) + TableScan [TS_59] (rows=7200 width=107) + default@household_demographics,hd1,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_income_band_sk"] + <-Reducer 11 [SIMPLE_EDGE] + SHUFFLE [RS_99] + PartitionCols:_col16 + Merge Join Operator [MERGEJOIN_690] (rows=188635845 width=860) + Output:["_col1","_col5","_col9","_col10","_col11","_col16","_col17","_col23","_col25","_col27","_col28","_col35"],keys:{"0":"_col4","1":"_col0"} + <-Map 30 [SIMPLE_EDGE] + SHUFFLE [RS_97] + PartitionCols:_col0 + Select Operator [SEL_58] (rows=7200 width=107) + Output:["_col0","_col1"] + Filter Operator [FIL_653] (rows=7200 width=107) + predicate:(hd_demo_sk is not null and hd_income_band_sk is not null) + TableScan [TS_56] (rows=7200 width=107) + default@household_demographics,hd1,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_income_band_sk"] + <-Reducer 10 [SIMPLE_EDGE] + SHUFFLE [RS_96] + PartitionCols:_col4 + Merge Join Operator [MERGEJOIN_689] (rows=171487129 width=860) + Output:["_col1","_col4","_col5","_col9","_col10","_col11","_col16","_col17","_col23","_col25","_col27","_col28"],keys:{"0":"_col7","1":"_col0"} + <-Map 29 [SIMPLE_EDGE] + SHUFFLE [RS_94] + PartitionCols:_col0 + Select Operator [SEL_55] (rows=2300 width=1179) + Output:["_col0"] + Filter Operator [FIL_652] (rows=2300 width=1179) + predicate:p_promo_sk is not null + TableScan [TS_53] (rows=2300 width=1179) + default@promotion,promotion,Tbl:COMPLETE,Col:NONE,Output:["p_promo_sk"] + <-Reducer 9 [SIMPLE_EDGE] + SHUFFLE [RS_93] + PartitionCols:_col7 + Select Operator [SEL_52] (rows=155897387 width=860) + Output:["_col1","_col10","_col11","_col16","_col17","_col23","_col25","_col27","_col28","_col4","_col5","_col7","_col9"] + Filter Operator [FIL_51] (rows=155897387 width=860) + predicate:(_col30 <> _col32) + Merge Join Operator [MERGEJOIN_688] (rows=155897387 width=860) + Output:["_col1","_col4","_col5","_col7","_col9","_col10","_col11","_col16","_col17","_col23","_col25","_col27","_col28","_col30","_col32"],keys:{"0":"_col15","1":"_col0"} + <-Map 28 [SIMPLE_EDGE] + SHUFFLE [RS_49] + PartitionCols:_col0 + Select Operator [SEL_26] (rows=19800 width=362) + Output:["_col0","_col1"] + Filter Operator [FIL_651] (rows=19800 width=362) + predicate:cd_demo_sk is not null + TableScan [TS_24] (rows=19800 width=362) + default@customer_demographics,cd1,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_marital_status"] + <-Reducer 8 [SIMPLE_EDGE] + SHUFFLE [RS_48] + PartitionCols:_col15 + Merge Join Operator [MERGEJOIN_687] (rows=141724895 width=860) + Output:["_col1","_col4","_col5","_col7","_col9","_col10","_col11","_col15","_col16","_col17","_col23","_col25","_col27","_col28","_col30"],keys:{"0":"_col3","1":"_col0"} + <-Map 27 [SIMPLE_EDGE] + SHUFFLE [RS_46] + PartitionCols:_col0 + Select Operator [SEL_23] (rows=19800 width=362) + Output:["_col0","_col1"] + Filter Operator [FIL_650] (rows=19800 width=362) + predicate:cd_demo_sk is not null + TableScan [TS_21] (rows=19800 width=362) + default@customer_demographics,cd1,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_marital_status"] + <-Reducer 7 [SIMPLE_EDGE] + SHUFFLE [RS_45] + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_686] (rows=128840811 width=860) + Output:["_col1","_col3","_col4","_col5","_col7","_col9","_col10","_col11","_col15","_col16","_col17","_col23","_col25","_col27","_col28"],keys:{"0":"_col6","1":"_col0"} + <-Map 26 [SIMPLE_EDGE] + SHUFFLE [RS_43] + PartitionCols:_col0 + Select Operator [SEL_20] (rows=1704 width=1910) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_649] (rows=1704 width=1910) + predicate:((s_store_sk is not null and s_zip is not null) and s_store_name is not null) + TableScan [TS_18] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_store_name","s_zip"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_42] + PartitionCols:_col6 + Merge Join Operator [MERGEJOIN_685] (rows=117128008 width=860) + Output:["_col1","_col3","_col4","_col5","_col6","_col7","_col9","_col10","_col11","_col15","_col16","_col17","_col23","_col25"],keys:{"0":"_col18","1":"_col0"} + <-Map 25 [SIMPLE_EDGE] + SHUFFLE [RS_40] + PartitionCols:_col0 + Select Operator [SEL_17] (rows=73049 width=1119) + Output:["_col0","_col1"] + Filter Operator [FIL_648] (rows=73049 width=1119) + predicate:d_date_sk is not null + TableScan [TS_15] (rows=73049 width=1119) + default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_39] + PartitionCols:_col18 + Merge Join Operator [MERGEJOIN_684] (rows=106480005 width=860) + Output:["_col1","_col3","_col4","_col5","_col6","_col7","_col9","_col10","_col11","_col15","_col16","_col17","_col18","_col23"],keys:{"0":"_col19","1":"_col0"} + <-Map 24 [SIMPLE_EDGE] + SHUFFLE [RS_37] + PartitionCols:_col0 + Select Operator [SEL_14] (rows=73049 width=1119) + Output:["_col0","_col1"] + Filter Operator [FIL_647] (rows=73049 width=1119) + predicate:d_date_sk is not null + TableScan [TS_12] (rows=73049 width=1119) + default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_36] + PartitionCols:_col19 + Merge Join Operator [MERGEJOIN_683] (rows=96800003 width=860) + Output:["_col1","_col3","_col4","_col5","_col6","_col7","_col9","_col10","_col11","_col15","_col16","_col17","_col18","_col19"],keys:{"0":"_col0","1":"_col0"} + <-Map 23 [SIMPLE_EDGE] + SHUFFLE [RS_34] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_646] (rows=36524 width=1119) + predicate:((d_year = 2000) and d_date_sk is not null) + TableScan [TS_9] (rows=73049 width=1119) + default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_33] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_682] (rows=88000001 width=860) + Output:["_col0","_col1","_col3","_col4","_col5","_col6","_col7","_col9","_col10","_col11","_col15","_col16","_col17","_col18","_col19"],keys:{"0":"_col2","1":"_col0"} + <-Map 22 [SIMPLE_EDGE] + SHUFFLE [RS_31] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=80000000 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Filter Operator [FIL_645] (rows=80000000 width=860) + predicate:(((((c_customer_sk is not null and c_first_sales_date_sk is not null) and c_first_shipto_date_sk is not null) and c_current_cdemo_sk is not null) and c_current_hdemo_sk is not null) and c_current_addr_sk is not null) + TableScan [TS_6] (rows=80000000 width=860) + default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_current_cdemo_sk","c_current_hdemo_sk","c_current_addr_sk","c_first_shipto_date_sk","c_first_sales_date_sk"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_30] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_681] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col9","_col10","_col11"],keys:{"0":"_col1, _col8","1":"_col0, _col1"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_27] + PartitionCols:_col1, _col8 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11"] + Filter Operator [FIL_643] (rows=1 width=0) + predicate:((((((((ss_ticket_number is not null and ss_item_sk is not null) and ss_customer_sk is not null) and ss_sold_date_sk is not null) and ss_store_sk is not null) and ss_cdemo_sk is not null) and ss_promo_sk is not null) and ss_hdemo_sk is not null) and ss_addr_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_customer_sk","ss_cdemo_sk","ss_hdemo_sk","ss_addr_sk","ss_store_sk","ss_promo_sk","ss_ticket_number","ss_wholesale_cost","ss_list_price","ss_coupon_amt"] + <-Map 21 [SIMPLE_EDGE] + SHUFFLE [RS_28] + PartitionCols:_col0, _col1 + Select Operator [SEL_5] (rows=1 width=0) + Output:["_col0","_col1"] + Filter Operator [FIL_644] (rows=1 width=0) + predicate:(sr_ticket_number is not null and sr_item_sk is not null) + TableScan [TS_3] (rows=1 width=0) + default@store_returns,store_returns,Tbl:PARTIAL,Col:NONE,Output:["sr_item_sk","sr_ticket_number"] + <-Reducer 39 [SIMPLE_EDGE] + SHUFFLE [RS_116] + PartitionCols:_col0 + Select Operator [SEL_92] (rows=1 width=0) + Output:["_col0"] + Filter Operator [FIL_91] (rows=1 width=0) + predicate:(_col1 > (2 * _col2)) + Group By Operator [GBY_90] (rows=1 width=0) + Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"],keys:KEY._col0 + <-Reducer 38 [SIMPLE_EDGE] + SHUFFLE [RS_89] + PartitionCols:_col0 + Group By Operator [GBY_88] (rows=1 width=0) + Output:["_col0","_col1","_col2"],aggregations:["sum(_col1)","sum(_col2)"],keys:_col0 + Select Operator [SEL_86] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Merge Join Operator [MERGEJOIN_696] (rows=1 width=0) + Output:["_col0","_col2","_col5","_col6","_col7"],keys:{"0":"_col0, _col1","1":"_col0, _col1"} + <-Map 37 [SIMPLE_EDGE] + SHUFFLE [RS_83] + PartitionCols:_col0, _col1 + Select Operator [SEL_79] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_660] (rows=1 width=0) + predicate:(cs_item_sk is not null and cs_order_number is not null) + TableScan [TS_77] (rows=1 width=0) + default@catalog_sales,catalog_sales,Tbl:PARTIAL,Col:NONE,Output:["cs_item_sk","cs_order_number","cs_ext_list_price"] + <-Map 40 [SIMPLE_EDGE] + SHUFFLE [RS_84] + PartitionCols:_col0, _col1 + Select Operator [SEL_82] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_661] (rows=1 width=0) + predicate:(cr_item_sk is not null and cr_order_number is not null) + TableScan [TS_80] (rows=1 width=0) + default@catalog_returns,catalog_returns,Tbl:PARTIAL,Col:NONE,Output:["cr_item_sk","cr_order_number","cr_refunded_cash","cr_reversed_charge","cr_store_credit"] + <-Reducer 58 [SIMPLE_EDGE] + SHUFFLE [RS_248] + PartitionCols:_col1, _col2, _col3 + Select Operator [SEL_246] (rows=334179945 width=860) + Output:["_col1","_col12","_col15","_col16","_col17","_col18","_col2","_col3"] + Group By Operator [GBY_245] (rows=334179945 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18"],aggregations:["count(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)","sum(VALUE._col3)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4, KEY._col5, KEY._col6, KEY._col7, KEY._col8, KEY._col9, KEY._col10, KEY._col11, KEY._col12, KEY._col13, KEY._col14 + <-Reducer 57 [SIMPLE_EDGE] + SHUFFLE [RS_244] + PartitionCols:_col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14 + Group By Operator [GBY_243] (rows=668359891 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18"],aggregations:["count()","sum(_col9)","sum(_col10)","sum(_col11)"],keys:_col21, _col23, _col25, _col27, _col28, _col39, _col40, _col41, _col42, _col44, _col45, _col46, _col47, _col50, _col53 + Select Operator [SEL_242] (rows=668359891 width=860) + Output:["_col21","_col23","_col25","_col27","_col28","_col39","_col40","_col41","_col42","_col44","_col45","_col46","_col47","_col50","_col53","_col9","_col10","_col11"] + Merge Join Operator [MERGEJOIN_714] (rows=668359891 width=860) + Output:["_col9","_col10","_col11","_col23","_col25","_col27","_col28","_col39","_col40","_col41","_col42","_col44","_col45","_col46","_col47","_col50","_col53"],keys:{"0":"_col1","1":"_col0","2":"_col0"} + <-Map 74 [SIMPLE_EDGE] + SHUFFLE [RS_239] + PartitionCols:_col0 + Select Operator [SEL_200] (rows=57750 width=1436) + Output:["_col0","_col3"] + Filter Operator [FIL_678] (rows=57750 width=1436) + predicate:((((i_color) IN ('maroon', 'burnished', 'dim', 'steel', 'navajo', 'chocolate') and i_current_price BETWEEN 35 AND 45) and i_current_price BETWEEN 36 AND 50) and i_item_sk is not null) + TableScan [TS_198] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_current_price","i_color","i_product_name"] + <-Reducer 56 [SIMPLE_EDGE] + SHUFFLE [RS_238] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_712] (rows=303799944 width=860) + Output:["_col1","_col9","_col10","_col11","_col23","_col25","_col27","_col28","_col39","_col40","_col41","_col42","_col44","_col45","_col46","_col47"],keys:{"0":"_col37","1":"_col0"} + <-Map 73 [SIMPLE_EDGE] + SHUFFLE [RS_236] + PartitionCols:_col0 + Select Operator [SEL_197] (rows=20 width=12) + Output:["_col0"] + Filter Operator [FIL_677] (rows=20 width=12) + predicate:ib_income_band_sk is not null + TableScan [TS_195] (rows=20 width=12) + default@income_band,ib1,Tbl:COMPLETE,Col:NONE,Output:["ib_income_band_sk"] + <-Reducer 55 [SIMPLE_EDGE] + SHUFFLE [RS_235] + PartitionCols:_col37 + Merge Join Operator [MERGEJOIN_711] (rows=276181762 width=860) + Output:["_col1","_col9","_col10","_col11","_col23","_col25","_col27","_col28","_col37","_col39","_col40","_col41","_col42","_col44","_col45","_col46","_col47"],keys:{"0":"_col35","1":"_col0"} + <-Map 72 [SIMPLE_EDGE] + SHUFFLE [RS_233] + PartitionCols:_col0 + Select Operator [SEL_194] (rows=20 width=12) + Output:["_col0"] + Filter Operator [FIL_676] (rows=20 width=12) + predicate:ib_income_band_sk is not null + TableScan [TS_192] (rows=20 width=12) + default@income_band,ib1,Tbl:COMPLETE,Col:NONE,Output:["ib_income_band_sk"] + <-Reducer 54 [SIMPLE_EDGE] + SHUFFLE [RS_232] + PartitionCols:_col35 + Merge Join Operator [MERGEJOIN_710] (rows=251074324 width=860) + Output:["_col1","_col9","_col10","_col11","_col23","_col25","_col27","_col28","_col35","_col37","_col39","_col40","_col41","_col42","_col44","_col45","_col46","_col47"],keys:{"0":"_col17","1":"_col0"} + <-Map 71 [SIMPLE_EDGE] + SHUFFLE [RS_230] + PartitionCols:_col0 + Select Operator [SEL_191] (rows=40000000 width=1014) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_675] (rows=40000000 width=1014) + predicate:ca_address_sk is not null + TableScan [TS_189] (rows=40000000 width=1014) + default@customer_address,ad1,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_street_number","ca_street_name","ca_city","ca_zip"] + <-Reducer 53 [SIMPLE_EDGE] + SHUFFLE [RS_229] + PartitionCols:_col17 + Merge Join Operator [MERGEJOIN_709] (rows=228249381 width=860) + Output:["_col1","_col9","_col10","_col11","_col17","_col23","_col25","_col27","_col28","_col35","_col37","_col39","_col40","_col41","_col42"],keys:{"0":"_col5","1":"_col0"} + <-Map 70 [SIMPLE_EDGE] + SHUFFLE [RS_227] + PartitionCols:_col0 + Select Operator [SEL_188] (rows=40000000 width=1014) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_674] (rows=40000000 width=1014) + predicate:ca_address_sk is not null + TableScan [TS_186] (rows=40000000 width=1014) + default@customer_address,ad1,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_street_number","ca_street_name","ca_city","ca_zip"] + <-Reducer 52 [SIMPLE_EDGE] + SHUFFLE [RS_226] + PartitionCols:_col5 + Merge Join Operator [MERGEJOIN_708] (rows=207499433 width=860) + Output:["_col1","_col5","_col9","_col10","_col11","_col17","_col23","_col25","_col27","_col28","_col35","_col37"],keys:{"0":"_col16","1":"_col0"} + <-Map 69 [SIMPLE_EDGE] + SHUFFLE [RS_224] + PartitionCols:_col0 + Select Operator [SEL_185] (rows=7200 width=107) + Output:["_col0","_col1"] + Filter Operator [FIL_673] (rows=7200 width=107) + predicate:(hd_demo_sk is not null and hd_income_band_sk is not null) + TableScan [TS_183] (rows=7200 width=107) + default@household_demographics,hd1,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_income_band_sk"] + <-Reducer 51 [SIMPLE_EDGE] + SHUFFLE [RS_223] + PartitionCols:_col16 + Merge Join Operator [MERGEJOIN_707] (rows=188635845 width=860) + Output:["_col1","_col5","_col9","_col10","_col11","_col16","_col17","_col23","_col25","_col27","_col28","_col35"],keys:{"0":"_col4","1":"_col0"} + <-Map 68 [SIMPLE_EDGE] + SHUFFLE [RS_221] + PartitionCols:_col0 + Select Operator [SEL_182] (rows=7200 width=107) + Output:["_col0","_col1"] + Filter Operator [FIL_672] (rows=7200 width=107) + predicate:(hd_demo_sk is not null and hd_income_band_sk is not null) + TableScan [TS_180] (rows=7200 width=107) + default@household_demographics,hd1,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_income_band_sk"] + <-Reducer 50 [SIMPLE_EDGE] + SHUFFLE [RS_220] + PartitionCols:_col4 + Merge Join Operator [MERGEJOIN_706] (rows=171487129 width=860) + Output:["_col1","_col4","_col5","_col9","_col10","_col11","_col16","_col17","_col23","_col25","_col27","_col28"],keys:{"0":"_col7","1":"_col0"} + <-Map 67 [SIMPLE_EDGE] + SHUFFLE [RS_218] + PartitionCols:_col0 + Select Operator [SEL_179] (rows=2300 width=1179) + Output:["_col0"] + Filter Operator [FIL_671] (rows=2300 width=1179) + predicate:p_promo_sk is not null + TableScan [TS_177] (rows=2300 width=1179) + default@promotion,promotion,Tbl:COMPLETE,Col:NONE,Output:["p_promo_sk"] + <-Reducer 49 [SIMPLE_EDGE] + SHUFFLE [RS_217] + PartitionCols:_col7 + Select Operator [SEL_176] (rows=155897387 width=860) + Output:["_col1","_col10","_col11","_col16","_col17","_col23","_col25","_col27","_col28","_col4","_col5","_col7","_col9"] + Filter Operator [FIL_175] (rows=155897387 width=860) + predicate:(_col30 <> _col32) + Merge Join Operator [MERGEJOIN_705] (rows=155897387 width=860) + Output:["_col1","_col4","_col5","_col7","_col9","_col10","_col11","_col16","_col17","_col23","_col25","_col27","_col28","_col30","_col32"],keys:{"0":"_col15","1":"_col0"} + <-Map 66 [SIMPLE_EDGE] + SHUFFLE [RS_173] + PartitionCols:_col0 + Select Operator [SEL_150] (rows=19800 width=362) + Output:["_col0","_col1"] + Filter Operator [FIL_670] (rows=19800 width=362) + predicate:cd_demo_sk is not null + TableScan [TS_148] (rows=19800 width=362) + default@customer_demographics,cd1,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_marital_status"] + <-Reducer 48 [SIMPLE_EDGE] + SHUFFLE [RS_172] + PartitionCols:_col15 + Merge Join Operator [MERGEJOIN_704] (rows=141724895 width=860) + Output:["_col1","_col4","_col5","_col7","_col9","_col10","_col11","_col15","_col16","_col17","_col23","_col25","_col27","_col28","_col30"],keys:{"0":"_col3","1":"_col0"} + <-Map 65 [SIMPLE_EDGE] + SHUFFLE [RS_170] + PartitionCols:_col0 + Select Operator [SEL_147] (rows=19800 width=362) + Output:["_col0","_col1"] + Filter Operator [FIL_669] (rows=19800 width=362) + predicate:cd_demo_sk is not null + TableScan [TS_145] (rows=19800 width=362) + default@customer_demographics,cd1,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_marital_status"] + <-Reducer 47 [SIMPLE_EDGE] + SHUFFLE [RS_169] + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_703] (rows=128840811 width=860) + Output:["_col1","_col3","_col4","_col5","_col7","_col9","_col10","_col11","_col15","_col16","_col17","_col23","_col25","_col27","_col28"],keys:{"0":"_col6","1":"_col0"} + <-Map 64 [SIMPLE_EDGE] + SHUFFLE [RS_167] + PartitionCols:_col0 + Select Operator [SEL_144] (rows=1704 width=1910) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_668] (rows=1704 width=1910) + predicate:((s_store_sk is not null and s_zip is not null) and s_store_name is not null) + TableScan [TS_142] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_store_name","s_zip"] + <-Reducer 46 [SIMPLE_EDGE] + SHUFFLE [RS_166] + PartitionCols:_col6 + Merge Join Operator [MERGEJOIN_702] (rows=117128008 width=860) + Output:["_col1","_col3","_col4","_col5","_col6","_col7","_col9","_col10","_col11","_col15","_col16","_col17","_col23","_col25"],keys:{"0":"_col18","1":"_col0"} + <-Map 63 [SIMPLE_EDGE] + SHUFFLE [RS_164] + PartitionCols:_col0 + Select Operator [SEL_141] (rows=73049 width=1119) + Output:["_col0","_col1"] + Filter Operator [FIL_667] (rows=73049 width=1119) + predicate:d_date_sk is not null + TableScan [TS_139] (rows=73049 width=1119) + default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] + <-Reducer 45 [SIMPLE_EDGE] + SHUFFLE [RS_163] + PartitionCols:_col18 + Merge Join Operator [MERGEJOIN_701] (rows=106480005 width=860) + Output:["_col1","_col3","_col4","_col5","_col6","_col7","_col9","_col10","_col11","_col15","_col16","_col17","_col18","_col23"],keys:{"0":"_col19","1":"_col0"} + <-Map 62 [SIMPLE_EDGE] + SHUFFLE [RS_161] + PartitionCols:_col0 + Select Operator [SEL_138] (rows=73049 width=1119) + Output:["_col0","_col1"] + Filter Operator [FIL_666] (rows=73049 width=1119) + predicate:d_date_sk is not null + TableScan [TS_136] (rows=73049 width=1119) + default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] + <-Reducer 44 [SIMPLE_EDGE] + SHUFFLE [RS_160] + PartitionCols:_col19 + Merge Join Operator [MERGEJOIN_700] (rows=96800003 width=860) + Output:["_col1","_col3","_col4","_col5","_col6","_col7","_col9","_col10","_col11","_col15","_col16","_col17","_col18","_col19"],keys:{"0":"_col0","1":"_col0"} + <-Map 61 [SIMPLE_EDGE] + SHUFFLE [RS_158] + PartitionCols:_col0 + Select Operator [SEL_135] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_665] (rows=36524 width=1119) + predicate:((d_year = 2001) and d_date_sk is not null) + TableScan [TS_133] (rows=73049 width=1119) + default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] + <-Reducer 43 [SIMPLE_EDGE] + SHUFFLE [RS_157] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_699] (rows=88000001 width=860) + Output:["_col0","_col1","_col3","_col4","_col5","_col6","_col7","_col9","_col10","_col11","_col15","_col16","_col17","_col18","_col19"],keys:{"0":"_col2","1":"_col0"} + <-Map 60 [SIMPLE_EDGE] + SHUFFLE [RS_155] + PartitionCols:_col0 + Select Operator [SEL_132] (rows=80000000 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Filter Operator [FIL_664] (rows=80000000 width=860) + predicate:(((((c_customer_sk is not null and c_first_sales_date_sk is not null) and c_first_shipto_date_sk is not null) and c_current_cdemo_sk is not null) and c_current_hdemo_sk is not null) and c_current_addr_sk is not null) + TableScan [TS_130] (rows=80000000 width=860) + default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_current_cdemo_sk","c_current_hdemo_sk","c_current_addr_sk","c_first_shipto_date_sk","c_first_sales_date_sk"] + <-Reducer 42 [SIMPLE_EDGE] + SHUFFLE [RS_154] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_698] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col9","_col10","_col11"],keys:{"0":"_col1, _col8","1":"_col0, _col1"} + <-Map 41 [SIMPLE_EDGE] + SHUFFLE [RS_151] + PartitionCols:_col1, _col8 + Select Operator [SEL_126] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11"] + Filter Operator [FIL_662] (rows=1 width=0) + predicate:((((((((ss_ticket_number is not null and ss_item_sk is not null) and ss_customer_sk is not null) and ss_sold_date_sk is not null) and ss_store_sk is not null) and ss_cdemo_sk is not null) and ss_promo_sk is not null) and ss_hdemo_sk is not null) and ss_addr_sk is not null) + TableScan [TS_124] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_customer_sk","ss_cdemo_sk","ss_hdemo_sk","ss_addr_sk","ss_store_sk","ss_promo_sk","ss_ticket_number","ss_wholesale_cost","ss_list_price","ss_coupon_amt"] + <-Map 59 [SIMPLE_EDGE] + SHUFFLE [RS_152] + PartitionCols:_col0, _col1 + Select Operator [SEL_129] (rows=1 width=0) + Output:["_col0","_col1"] + Filter Operator [FIL_663] (rows=1 width=0) + predicate:(sr_ticket_number is not null and sr_item_sk is not null) + TableScan [TS_127] (rows=1 width=0) + default@store_returns,store_returns,Tbl:PARTIAL,Col:NONE,Output:["sr_item_sk","sr_ticket_number"] + <-Reducer 77 [SIMPLE_EDGE] + SHUFFLE [RS_240] + PartitionCols:_col0 + Select Operator [SEL_216] (rows=1 width=0) + Output:["_col0"] + Filter Operator [FIL_215] (rows=1 width=0) + predicate:(_col1 > (2 * _col2)) + Group By Operator [GBY_214] (rows=1 width=0) + Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"],keys:KEY._col0 + <-Reducer 76 [SIMPLE_EDGE] + SHUFFLE [RS_213] + PartitionCols:_col0 + Group By Operator [GBY_212] (rows=1 width=0) + Output:["_col0","_col1","_col2"],aggregations:["sum(_col1)","sum(_col2)"],keys:_col0 + Select Operator [SEL_210] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Merge Join Operator [MERGEJOIN_713] (rows=1 width=0) + Output:["_col0","_col2","_col5","_col6","_col7"],keys:{"0":"_col0, _col1","1":"_col0, _col1"} + <-Map 75 [SIMPLE_EDGE] + SHUFFLE [RS_207] + PartitionCols:_col0, _col1 + Select Operator [SEL_203] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_679] (rows=1 width=0) + predicate:(cs_item_sk is not null and cs_order_number is not null) + TableScan [TS_201] (rows=1 width=0) + default@catalog_sales,catalog_sales,Tbl:PARTIAL,Col:NONE,Output:["cs_item_sk","cs_order_number","cs_ext_list_price"] + <-Map 78 [SIMPLE_EDGE] + SHUFFLE [RS_208] + PartitionCols:_col0, _col1 + Select Operator [SEL_206] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_680] (rows=1 width=0) + predicate:(cr_item_sk is not null and cr_order_number is not null) + TableScan [TS_204] (rows=1 width=0) + default@catalog_returns,catalog_returns,Tbl:PARTIAL,Col:NONE,Output:["cr_item_sk","cr_order_number","cr_refunded_cash","cr_reversed_charge","cr_store_credit"] diff --git a/ql/src/test/results/clientpositive/perf/query65.q.out b/ql/src/test/results/clientpositive/perf/query65.q.out index 12bdd33..8898e9a 100644 --- a/ql/src/test/results/clientpositive/perf/query65.q.out +++ b/ql/src/test/results/clientpositive/perf/query65.q.out @@ -90,226 +90,116 @@ Reducer 8 <- Map 11 (SIMPLE_EDGE), Map 7 (SIMPLE_EDGE) Reducer 9 <- Reducer 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 5 - File Output Operator [FS_55] - compressed:false - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_54] - Number of rows:100 - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_53] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 204974 Data size: 294399674 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_52] - key expressions:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 204974 Data size: 294399674 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: decimal(17,2)), _col3 (type: decimal(7,2)), _col4 (type: decimal(7,2)), _col5 (type: string) - Select Operator [SEL_51] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 204974 Data size: 294399674 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_50] - predicate:(_col11 <= CAST( (0.1 * UDFToDouble(_col8)) AS decimal(30,15))) (type: boolean) - Statistics:Num rows: 204974 Data size: 294399674 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_76] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col7 (type: int), _col0 (type: int), _col2 (type: int)","1":"_col0 (type: int), _col0 (type: int), _col1 (type: int)"} - | outputColumnNames:["_col1","_col3","_col4","_col5","_col6","_col8","_col11"] - | Statistics:Num rows: 614922 Data size: 883199024 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 14 [SIMPLE_EDGE] - | Reduce Output Operator [RS_48] - | key expressions:_col0 (type: int), _col0 (type: int), _col1 (type: int) - | Map-reduce partition columns:_col0 (type: int), _col0 (type: int), _col1 (type: int) - | sort order:+++ - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col2 (type: decimal(17,2)) - | Select Operator [SEL_38] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_37] - | | aggregations:["sum(VALUE._col0)"] - | | keys:KEY._col0 (type: int), KEY._col1 (type: int) - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 13 [SIMPLE_EDGE] - | Reduce Output Operator [RS_36] - | key expressions:_col0 (type: int), _col1 (type: int) - | Map-reduce partition columns:_col0 (type: int), _col1 (type: int) - | sort order:++ - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col2 (type: decimal(17,2)) - | Group By Operator [GBY_35] - | aggregations:["sum(_col3)"] - | keys:_col1 (type: int), _col2 (type: int) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_74] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col2","_col3"] - | | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | |<-Map 12 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_31] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: decimal(7,2)) - | | Select Operator [SEL_27] - | | outputColumnNames:["_col0","_col1","_col2","_col3"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_70] - | | predicate:((ss_sold_date_sk is not null and ss_item_sk is not null) and ss_store_sk is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_25] - | | alias:store_sales - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 15 [SIMPLE_EDGE] - | Reduce Output Operator [RS_32] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_30] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_71] - | predicate:(d_month_seq BETWEEN 1212 AND 1223 and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_28] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_47] - key expressions:_col7 (type: int), _col0 (type: int), _col2 (type: int) - Map-reduce partition columns:_col7 (type: int), _col0 (type: int), _col2 (type: int) - sort order:+++ - Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string), _col3 (type: string), _col4 (type: decimal(7,2)), _col5 (type: decimal(7,2)), _col6 (type: string), _col8 (type: decimal(21,6)) - Merge Join Operator [MERGEJOIN_75] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{} - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] - | Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_45] - | sort order: - | Statistics:Num rows: 10044 Data size: 11239348 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: int), _col1 (type: decimal(21,6)) - | Group By Operator [GBY_23] - | | aggregations:["avg(VALUE._col0)"] - | | keys:KEY._col0 (type: int) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 10044 Data size: 11239348 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_22] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: struct) - | Group By Operator [GBY_21] - | aggregations:["avg(_col2)"] - | keys:_col1 (type: int) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_19] - | outputColumnNames:["_col1","_col2"] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_18] - | | aggregations:["sum(VALUE._col0)"] - | | keys:KEY._col0 (type: int), KEY._col1 (type: int) - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 8 [SIMPLE_EDGE] - | Reduce Output Operator [RS_17] - | key expressions:_col0 (type: int), _col1 (type: int) - | Map-reduce partition columns:_col0 (type: int), _col1 (type: int) - | sort order:++ - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col2 (type: decimal(17,2)) - | Group By Operator [GBY_16] - | aggregations:["sum(_col3)"] - | keys:_col1 (type: int), _col2 (type: int) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_73] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col2","_col3"] - | | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | |<-Map 11 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_13] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_11] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_69] - | | predicate:(d_month_seq BETWEEN 1212 AND 1223 and d_date_sk is not null) (type: boolean) - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_9] - | | alias:date_dim - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | |<-Map 7 [SIMPLE_EDGE] - | Reduce Output Operator [RS_12] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: decimal(7,2)) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_68] - | predicate:(ss_sold_date_sk is not null and ss_store_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_6] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_44] - sort order: - Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col1 (type: string), _col2 (type: int), _col3 (type: string), _col4 (type: decimal(7,2)), _col5 (type: decimal(7,2)), _col6 (type: string) - Merge Join Operator [MERGEJOIN_72] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{} - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_41] - | sort order: - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: int), _col1 (type: string) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_66] - | predicate:s_store_sk is not null (type: boolean) - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:store - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - |<-Map 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_42] - sort order: - Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col1 (type: string), _col2 (type: decimal(7,2)), _col3 (type: decimal(7,2)), _col4 (type: string) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_67] - predicate:i_item_sk is not null (type: boolean) - Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:item - Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 5 + File Output Operator [FS_55] + Limit [LIM_54] (rows=100 width=1436) + Number of rows:100 + Select Operator [SEL_53] (rows=204974 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_52] + Select Operator [SEL_51] (rows=204974 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Filter Operator [FIL_50] (rows=204974 width=1436) + predicate:(_col11 <= CAST( (0.1 * UDFToDouble(_col8)) AS decimal(30,15))) + Merge Join Operator [MERGEJOIN_76] (rows=614922 width=1436) + Output:["_col1","_col3","_col4","_col5","_col6","_col8","_col11"],keys:{"0":"_col7, _col0, _col2","1":"_col0, _col0, _col1"} + <-Reducer 14 [SIMPLE_EDGE] + SHUFFLE [RS_48] + PartitionCols:_col0, _col0, _col1 + Select Operator [SEL_38] (rows=20088 width=1119) + Output:["_col0","_col1","_col2"] + Group By Operator [GBY_37] (rows=20088 width=1119) + Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1 + <-Reducer 13 [SIMPLE_EDGE] + SHUFFLE [RS_36] + PartitionCols:_col0, _col1 + Group By Operator [GBY_35] (rows=40176 width=1119) + Output:["_col0","_col1","_col2"],aggregations:["sum(_col3)"],keys:_col1, _col2 + Merge Join Operator [MERGEJOIN_74] (rows=40176 width=1119) + Output:["_col1","_col2","_col3"],keys:{"0":"_col0","1":"_col0"} + <-Map 12 [SIMPLE_EDGE] + SHUFFLE [RS_31] + PartitionCols:_col0 + Select Operator [SEL_27] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_70] (rows=1 width=0) + predicate:((ss_sold_date_sk is not null and ss_item_sk is not null) and ss_store_sk is not null) + TableScan [TS_25] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_store_sk","ss_sales_price"] + <-Map 15 [SIMPLE_EDGE] + SHUFFLE [RS_32] + PartitionCols:_col0 + Select Operator [SEL_30] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_71] (rows=36524 width=1119) + predicate:(d_month_seq BETWEEN 1212 AND 1223 and d_date_sk is not null) + TableScan [TS_28] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_month_seq"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_47] + PartitionCols:_col7, _col0, _col2 + Merge Join Operator [MERGEJOIN_75] (rows=559020 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"],keys:{} + <-Reducer 10 [SIMPLE_EDGE] + SHUFFLE [RS_45] + Group By Operator [GBY_23] (rows=10044 width=1119) + Output:["_col0","_col1"],aggregations:["avg(VALUE._col0)"],keys:KEY._col0 + <-Reducer 9 [SIMPLE_EDGE] + SHUFFLE [RS_22] + PartitionCols:_col0 + Group By Operator [GBY_21] (rows=20088 width=1119) + Output:["_col0","_col1"],aggregations:["avg(_col2)"],keys:_col1 + Select Operator [SEL_19] (rows=20088 width=1119) + Output:["_col1","_col2"] + Group By Operator [GBY_18] (rows=20088 width=1119) + Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1 + <-Reducer 8 [SIMPLE_EDGE] + SHUFFLE [RS_17] + PartitionCols:_col0, _col1 + Group By Operator [GBY_16] (rows=40176 width=1119) + Output:["_col0","_col1","_col2"],aggregations:["sum(_col3)"],keys:_col1, _col2 + Merge Join Operator [MERGEJOIN_73] (rows=40176 width=1119) + Output:["_col1","_col2","_col3"],keys:{"0":"_col0","1":"_col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_69] (rows=36524 width=1119) + predicate:(d_month_seq BETWEEN 1212 AND 1223 and d_date_sk is not null) + TableScan [TS_9] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_month_seq"] + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_68] (rows=1 width=0) + predicate:(ss_sold_date_sk is not null and ss_store_sk is not null) + TableScan [TS_6] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_store_sk","ss_sales_price"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_44] + Merge Join Operator [MERGEJOIN_72] (rows=508200 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"],keys:{} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_41] + Select Operator [SEL_2] (rows=1704 width=1910) + Output:["_col0","_col1"] + Filter Operator [FIL_66] (rows=1704 width=1910) + predicate:s_store_sk is not null + TableScan [TS_0] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_store_name"] + <-Map 6 [SIMPLE_EDGE] + SHUFFLE [RS_42] + Select Operator [SEL_5] (rows=462000 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_67] (rows=462000 width=1436) + predicate:i_item_sk is not null + TableScan [TS_3] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_desc","i_current_price","i_wholesale_cost","i_brand"] diff --git a/ql/src/test/results/clientpositive/perf/query66.q.out b/ql/src/test/results/clientpositive/perf/query66.q.out index b2e6bf7..3f285e9 100644 --- a/ql/src/test/results/clientpositive/perf/query66.q.out +++ b/ql/src/test/results/clientpositive/perf/query66.q.out @@ -453,347 +453,180 @@ Reducer 8 <- Union 7 (SIMPLE_EDGE) Reducer 9 <- Reducer 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 9 - File Output Operator [FS_76] - compressed:false - Statistics:Num rows: 100 Data size: 47100 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_75] - Number of rows:100 - Statistics:Num rows: 100 Data size: 47100 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_74] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30","_col31","_col32","_col33","_col34","_col35","_col36","_col37","_col38","_col39","_col40","_col41","_col42","_col43"] - | Statistics:Num rows: 26136 Data size: 12310056 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_73] - key expressions:_col0 (type: string) - sort order:+ - Statistics:Num rows: 26136 Data size: 12310056 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: string), _col8 (type: decimal(38,2)), _col9 (type: decimal(38,2)), _col10 (type: decimal(38,2)), _col11 (type: decimal(38,2)), _col12 (type: decimal(38,2)), _col13 (type: decimal(38,2)), _col14 (type: decimal(38,2)), _col15 (type: decimal(38,2)), _col16 (type: decimal(38,2)), _col17 (type: decimal(38,2)), _col18 (type: decimal(38,2)), _col19 (type: decimal(38,2)), _col20 (type: decimal(38,12)), _col21 (type: decimal(38,12)), _col22 (type: decimal(38,12)), _col23 (type: decimal(38,12)), _col24 (type: decimal(38,12)), _col25 (type: decimal(38,12)), _col26 (type: decimal(38,12)), _col27 (type: decimal(38,12)), _col28 (type: decimal(38,12)), _col29 (type: decimal(38,12)), _col30 (type: decimal(38,12)), _col31 (type: decimal(38,12)), _col32 (type: decimal(38,2)), _col33 (type: decimal(38,2)), _col34 (type: decimal(38,2)), _col35 (type: decimal(38,2)), _col36 (type: decimal(38,2)), _col37 (type: decimal(38,2)), _col38 (type: decimal(38,2)), _col39 (type: decimal(38,2)), _col40 (type: decimal(38,2)), _col41 (type: decimal(38,2)), _col42 (type: decimal(38,2)), _col43 (type: decimal(38,2)) - Select Operator [SEL_72] - outputColumnNames:["_col0","_col1","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col2","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col3","_col30","_col31","_col32","_col33","_col34","_col35","_col36","_col37","_col38","_col39","_col4","_col40","_col41","_col42","_col43","_col5","_col6","_col8","_col9"] - Statistics:Num rows: 26136 Data size: 12310056 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_71] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)","sum(VALUE._col3)","sum(VALUE._col4)","sum(VALUE._col5)","sum(VALUE._col6)","sum(VALUE._col7)","sum(VALUE._col8)","sum(VALUE._col9)","sum(VALUE._col10)","sum(VALUE._col11)","sum(VALUE._col12)","sum(VALUE._col13)","sum(VALUE._col14)","sum(VALUE._col15)","sum(VALUE._col16)","sum(VALUE._col17)","sum(VALUE._col18)","sum(VALUE._col19)","sum(VALUE._col20)","sum(VALUE._col21)","sum(VALUE._col22)","sum(VALUE._col23)","sum(VALUE._col24)","sum(VALUE._col25)","sum(VALUE._col26)","sum(VALUE._col27)","sum(VALUE._col28)","sum(VALUE._col29)","sum(VALUE._col30)","sum(VALUE._col31)","sum(VALUE._col32)","sum(VALUE._col33)","sum(VALUE._col34)","sum(VALUE._col35)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: string), KEY._col3 (type: string), KEY._col4 (type: string), KEY._col5 (type: string), KEY._col6 (type: string), KEY._col7 (type: int) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30","_col31","_col32","_col33","_col34","_col35","_col36","_col37","_col38","_col39","_col40","_col41","_col42","_col43"] - | Statistics:Num rows: 26136 Data size: 12310056 Basic stats: COMPLETE Column stats: NONE - |<-Union 7 [SIMPLE_EDGE] - |<-Reducer 19 [CONTAINS] - | Reduce Output Operator [RS_70] - | key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: string), _col7 (type: int) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: string), _col7 (type: int) - | sort order:++++++++ - | Statistics:Num rows: 52272 Data size: 24620112 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col8 (type: decimal(38,2)), _col9 (type: decimal(38,2)), _col10 (type: decimal(38,2)), _col11 (type: decimal(38,2)), _col12 (type: decimal(38,2)), _col13 (type: decimal(38,2)), _col14 (type: decimal(38,2)), _col15 (type: decimal(38,2)), _col16 (type: decimal(38,2)), _col17 (type: decimal(38,2)), _col18 (type: decimal(38,2)), _col19 (type: decimal(38,2)), _col20 (type: decimal(38,12)), _col21 (type: decimal(38,12)), _col22 (type: decimal(38,12)), _col23 (type: decimal(38,12)), _col24 (type: decimal(38,12)), _col25 (type: decimal(38,12)), _col26 (type: decimal(38,12)), _col27 (type: decimal(38,12)), _col28 (type: decimal(38,12)), _col29 (type: decimal(38,12)), _col30 (type: decimal(38,12)), _col31 (type: decimal(38,12)), _col32 (type: decimal(38,2)), _col33 (type: decimal(38,2)), _col34 (type: decimal(38,2)), _col35 (type: decimal(38,2)), _col36 (type: decimal(38,2)), _col37 (type: decimal(38,2)), _col38 (type: decimal(38,2)), _col39 (type: decimal(38,2)), _col40 (type: decimal(38,2)), _col41 (type: decimal(38,2)), _col42 (type: decimal(38,2)), _col43 (type: decimal(38,2)) - | Group By Operator [GBY_69] - | aggregations:["sum(_col8)","sum(_col9)","sum(_col10)","sum(_col11)","sum(_col12)","sum(_col13)","sum(_col14)","sum(_col15)","sum(_col16)","sum(_col17)","sum(_col18)","sum(_col19)","sum(_col20)","sum(_col21)","sum(_col22)","sum(_col23)","sum(_col24)","sum(_col25)","sum(_col26)","sum(_col27)","sum(_col28)","sum(_col29)","sum(_col30)","sum(_col31)","sum(_col32)","sum(_col33)","sum(_col34)","sum(_col35)","sum(_col36)","sum(_col37)","sum(_col38)","sum(_col39)","sum(_col40)","sum(_col41)","sum(_col42)","sum(_col43)"] - | keys:_col0 (type: string), _col1 (type: int), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: string), 2002 (type: int) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30","_col31","_col32","_col33","_col34","_col35","_col36","_col37","_col38","_col39","_col40","_col41","_col42","_col43"] - | Statistics:Num rows: 52272 Data size: 24620112 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_67] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30","_col31","_col32","_col33","_col34","_col35","_col36","_col37","_col38","_col39","_col40","_col41","_col42","_col43"] - | Statistics:Num rows: 52272 Data size: 24620112 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_65] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30"] - | Statistics:Num rows: 26136 Data size: 12310056 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_64] - | | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)","sum(VALUE._col3)","sum(VALUE._col4)","sum(VALUE._col5)","sum(VALUE._col6)","sum(VALUE._col7)","sum(VALUE._col8)","sum(VALUE._col9)","sum(VALUE._col10)","sum(VALUE._col11)","sum(VALUE._col12)","sum(VALUE._col13)","sum(VALUE._col14)","sum(VALUE._col15)","sum(VALUE._col16)","sum(VALUE._col17)","sum(VALUE._col18)","sum(VALUE._col19)","sum(VALUE._col20)","sum(VALUE._col21)","sum(VALUE._col22)","sum(VALUE._col23)"] - | | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: string), KEY._col3 (type: string), KEY._col4 (type: string), KEY._col5 (type: string), KEY._col6 (type: int) - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30"] - | | Statistics:Num rows: 26136 Data size: 12310056 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 18 [SIMPLE_EDGE] - | Reduce Output Operator [RS_63] - | key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: int) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: int) - | sort order:+++++++ - | Statistics:Num rows: 52272 Data size: 24620112 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col7 (type: decimal(28,2)), _col8 (type: decimal(28,2)), _col9 (type: decimal(28,2)), _col10 (type: decimal(28,2)), _col11 (type: decimal(28,2)), _col12 (type: decimal(28,2)), _col13 (type: decimal(28,2)), _col14 (type: decimal(28,2)), _col15 (type: decimal(28,2)), _col16 (type: decimal(28,2)), _col17 (type: decimal(28,2)), _col18 (type: decimal(28,2)), _col19 (type: decimal(28,2)), _col20 (type: decimal(28,2)), _col21 (type: decimal(28,2)), _col22 (type: decimal(28,2)), _col23 (type: decimal(28,2)), _col24 (type: decimal(28,2)), _col25 (type: decimal(28,2)), _col26 (type: decimal(28,2)), _col27 (type: decimal(28,2)), _col28 (type: decimal(28,2)), _col29 (type: decimal(28,2)), _col30 (type: decimal(28,2)) - | Group By Operator [GBY_62] - | aggregations:["sum(_col7)","sum(_col8)","sum(_col9)","sum(_col10)","sum(_col11)","sum(_col12)","sum(_col13)","sum(_col14)","sum(_col15)","sum(_col16)","sum(_col17)","sum(_col18)","sum(_col19)","sum(_col20)","sum(_col21)","sum(_col22)","sum(_col23)","sum(_col24)","sum(_col25)","sum(_col26)","sum(_col27)","sum(_col28)","sum(_col29)","sum(_col30)"] - | keys:_col0 (type: string), _col1 (type: int), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string), 2002 (type: int) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30"] - | Statistics:Num rows: 52272 Data size: 24620112 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_60] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30"] - | Statistics:Num rows: 52272 Data size: 24620112 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_122] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col4","_col5","_col6","_col8","_col9","_col10","_col11","_col12","_col13","_col16"] - | | Statistics:Num rows: 52272 Data size: 24620112 Basic stats: COMPLETE Column stats: NONE - | |<-Map 23 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_58] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Select Operator [SEL_47] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_114] - | | predicate:((sm_carrier) IN ('DIAMOND', 'AIRBORNE') and sm_ship_mode_sk is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_45] - | | alias:ship_mode - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Reducer 17 [SIMPLE_EDGE] - | Reduce Output Operator [RS_57] - | key expressions:_col2 (type: int) - | Map-reduce partition columns:_col2 (type: int) - | sort order:+ - | Statistics:Num rows: 47520 Data size: 22381920 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col8 (type: string), _col9 (type: int), _col10 (type: string), _col11 (type: string), _col12 (type: string), _col13 (type: string), _col16 (type: int) - | Merge Join Operator [MERGEJOIN_121] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col2","_col4","_col5","_col6","_col8","_col9","_col10","_col11","_col12","_col13","_col16"] - | | Statistics:Num rows: 47520 Data size: 22381920 Basic stats: COMPLETE Column stats: NONE - | |<-Map 22 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_55] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 43200 Data size: 20347200 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_44] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 43200 Data size: 20347200 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_113] - | | predicate:(t_time BETWEEN 49530 AND 78330 and t_time_sk is not null) (type: boolean) - | | Statistics:Num rows: 43200 Data size: 20347200 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_42] - | | alias:time_dim - | | Statistics:Num rows: 86400 Data size: 40694400 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 16 [SIMPLE_EDGE] - | Reduce Output Operator [RS_54] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col2 (type: int), _col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col8 (type: string), _col9 (type: int), _col10 (type: string), _col11 (type: string), _col12 (type: string), _col13 (type: string), _col16 (type: int) - | Merge Join Operator [MERGEJOIN_120] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col2","_col4","_col5","_col6","_col8","_col9","_col10","_col11","_col12","_col13","_col16"] - | | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | |<-Map 21 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_52] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col2 (type: int) - | | Select Operator [SEL_41] - | | outputColumnNames:["_col0","_col2"] - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_112] - | | predicate:((d_year = 2002) and d_date_sk is not null) (type: boolean) - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_39] - | | alias:date_dim - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 15 [SIMPLE_EDGE] - | Reduce Output Operator [RS_51] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 29 Data size: 30582 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: int), _col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col8 (type: string), _col9 (type: int), _col10 (type: string), _col11 (type: string), _col12 (type: string), _col13 (type: string) - | Merge Join Operator [MERGEJOIN_119] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col0","_col1","_col2","_col4","_col5","_col6","_col8","_col9","_col10","_col11","_col12","_col13"] - | | Statistics:Num rows: 29 Data size: 30582 Basic stats: COMPLETE Column stats: NONE - | |<-Map 14 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_48] - | | key expressions:_col3 (type: int) - | | Map-reduce partition columns:_col3 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)) - | | Select Operator [SEL_35] - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_110] - | | predicate:(((cs_warehouse_sk is not null and cs_sold_date_sk is not null) and cs_sold_time_sk is not null) and cs_ship_mode_sk is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_33] - | | alias:catalog_sales - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 20 [SIMPLE_EDGE] - | Reduce Output Operator [RS_49] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: int), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: string) - | Select Operator [SEL_38] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_111] - | predicate:w_warehouse_sk is not null (type: boolean) - | Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_36] - | alias:warehouse - | Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [CONTAINS] - Reduce Output Operator [RS_70] - key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: string), _col7 (type: int) - Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: string), _col7 (type: int) - sort order:++++++++ - Statistics:Num rows: 52272 Data size: 24620112 Basic stats: COMPLETE Column stats: NONE - value expressions:_col8 (type: decimal(38,2)), _col9 (type: decimal(38,2)), _col10 (type: decimal(38,2)), _col11 (type: decimal(38,2)), _col12 (type: decimal(38,2)), _col13 (type: decimal(38,2)), _col14 (type: decimal(38,2)), _col15 (type: decimal(38,2)), _col16 (type: decimal(38,2)), _col17 (type: decimal(38,2)), _col18 (type: decimal(38,2)), _col19 (type: decimal(38,2)), _col20 (type: decimal(38,12)), _col21 (type: decimal(38,12)), _col22 (type: decimal(38,12)), _col23 (type: decimal(38,12)), _col24 (type: decimal(38,12)), _col25 (type: decimal(38,12)), _col26 (type: decimal(38,12)), _col27 (type: decimal(38,12)), _col28 (type: decimal(38,12)), _col29 (type: decimal(38,12)), _col30 (type: decimal(38,12)), _col31 (type: decimal(38,12)), _col32 (type: decimal(38,2)), _col33 (type: decimal(38,2)), _col34 (type: decimal(38,2)), _col35 (type: decimal(38,2)), _col36 (type: decimal(38,2)), _col37 (type: decimal(38,2)), _col38 (type: decimal(38,2)), _col39 (type: decimal(38,2)), _col40 (type: decimal(38,2)), _col41 (type: decimal(38,2)), _col42 (type: decimal(38,2)), _col43 (type: decimal(38,2)) - Group By Operator [GBY_69] - aggregations:["sum(_col8)","sum(_col9)","sum(_col10)","sum(_col11)","sum(_col12)","sum(_col13)","sum(_col14)","sum(_col15)","sum(_col16)","sum(_col17)","sum(_col18)","sum(_col19)","sum(_col20)","sum(_col21)","sum(_col22)","sum(_col23)","sum(_col24)","sum(_col25)","sum(_col26)","sum(_col27)","sum(_col28)","sum(_col29)","sum(_col30)","sum(_col31)","sum(_col32)","sum(_col33)","sum(_col34)","sum(_col35)","sum(_col36)","sum(_col37)","sum(_col38)","sum(_col39)","sum(_col40)","sum(_col41)","sum(_col42)","sum(_col43)"] - keys:_col0 (type: string), _col1 (type: int), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: string), 2002 (type: int) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30","_col31","_col32","_col33","_col34","_col35","_col36","_col37","_col38","_col39","_col40","_col41","_col42","_col43"] - Statistics:Num rows: 52272 Data size: 24620112 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_67] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30","_col31","_col32","_col33","_col34","_col35","_col36","_col37","_col38","_col39","_col40","_col41","_col42","_col43"] - Statistics:Num rows: 52272 Data size: 24620112 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_32] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30"] - Statistics:Num rows: 26136 Data size: 12310056 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_31] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)","sum(VALUE._col3)","sum(VALUE._col4)","sum(VALUE._col5)","sum(VALUE._col6)","sum(VALUE._col7)","sum(VALUE._col8)","sum(VALUE._col9)","sum(VALUE._col10)","sum(VALUE._col11)","sum(VALUE._col12)","sum(VALUE._col13)","sum(VALUE._col14)","sum(VALUE._col15)","sum(VALUE._col16)","sum(VALUE._col17)","sum(VALUE._col18)","sum(VALUE._col19)","sum(VALUE._col20)","sum(VALUE._col21)","sum(VALUE._col22)","sum(VALUE._col23)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: string), KEY._col3 (type: string), KEY._col4 (type: string), KEY._col5 (type: string), KEY._col6 (type: int) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30"] - | Statistics:Num rows: 26136 Data size: 12310056 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_30] - key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: int) - Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: int) - sort order:+++++++ - Statistics:Num rows: 52272 Data size: 24620112 Basic stats: COMPLETE Column stats: NONE - value expressions:_col7 (type: decimal(28,2)), _col8 (type: decimal(28,2)), _col9 (type: decimal(28,2)), _col10 (type: decimal(28,2)), _col11 (type: decimal(28,2)), _col12 (type: decimal(28,2)), _col13 (type: decimal(28,2)), _col14 (type: decimal(28,2)), _col15 (type: decimal(28,2)), _col16 (type: decimal(28,2)), _col17 (type: decimal(28,2)), _col18 (type: decimal(28,2)), _col19 (type: decimal(28,2)), _col20 (type: decimal(28,2)), _col21 (type: decimal(28,2)), _col22 (type: decimal(28,2)), _col23 (type: decimal(28,2)), _col24 (type: decimal(28,2)), _col25 (type: decimal(28,2)), _col26 (type: decimal(28,2)), _col27 (type: decimal(28,2)), _col28 (type: decimal(28,2)), _col29 (type: decimal(28,2)), _col30 (type: decimal(28,2)) - Group By Operator [GBY_29] - aggregations:["sum(_col7)","sum(_col8)","sum(_col9)","sum(_col10)","sum(_col11)","sum(_col12)","sum(_col13)","sum(_col14)","sum(_col15)","sum(_col16)","sum(_col17)","sum(_col18)","sum(_col19)","sum(_col20)","sum(_col21)","sum(_col22)","sum(_col23)","sum(_col24)","sum(_col25)","sum(_col26)","sum(_col27)","sum(_col28)","sum(_col29)","sum(_col30)"] - keys:_col0 (type: string), _col1 (type: int), _col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string), 2002 (type: int) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30"] - Statistics:Num rows: 52272 Data size: 24620112 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_27] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30"] - Statistics:Num rows: 52272 Data size: 24620112 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_118] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col4","_col5","_col6","_col8","_col9","_col10","_col11","_col12","_col13","_col16"] - | Statistics:Num rows: 52272 Data size: 24620112 Basic stats: COMPLETE Column stats: NONE - |<-Map 13 [SIMPLE_EDGE] - | Reduce Output Operator [RS_25] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Select Operator [SEL_14] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_109] - | predicate:((sm_carrier) IN ('DIAMOND', 'AIRBORNE') and sm_ship_mode_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_12] - | alias:ship_mode - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_24] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 47520 Data size: 22381920 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col8 (type: string), _col9 (type: int), _col10 (type: string), _col11 (type: string), _col12 (type: string), _col13 (type: string), _col16 (type: int) - Merge Join Operator [MERGEJOIN_117] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col2","_col4","_col5","_col6","_col8","_col9","_col10","_col11","_col12","_col13","_col16"] - | Statistics:Num rows: 47520 Data size: 22381920 Basic stats: COMPLETE Column stats: NONE - |<-Map 12 [SIMPLE_EDGE] - | Reduce Output Operator [RS_22] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 43200 Data size: 20347200 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_11] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 43200 Data size: 20347200 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_108] - | predicate:(t_time BETWEEN 49530 AND 78330 and t_time_sk is not null) (type: boolean) - | Statistics:Num rows: 43200 Data size: 20347200 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:time_dim - | Statistics:Num rows: 86400 Data size: 40694400 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_21] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: int), _col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col8 (type: string), _col9 (type: int), _col10 (type: string), _col11 (type: string), _col12 (type: string), _col13 (type: string), _col16 (type: int) - Merge Join Operator [MERGEJOIN_116] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col4","_col5","_col6","_col8","_col9","_col10","_col11","_col12","_col13","_col16"] - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col2 (type: int) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col2"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_107] - | predicate:((d_year = 2002) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 29 Data size: 30582 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col2 (type: int), _col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col8 (type: string), _col9 (type: int), _col10 (type: string), _col11 (type: string), _col12 (type: string), _col13 (type: string) - Merge Join Operator [MERGEJOIN_115] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col1","_col2","_col4","_col5","_col6","_col8","_col9","_col10","_col11","_col12","_col13"] - | Statistics:Num rows: 29 Data size: 30582 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_15] - | key expressions:_col3 (type: int) - | Map-reduce partition columns:_col3 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_105] - | predicate:(((ws_warehouse_sk is not null and ws_sold_date_sk is not null) and ws_sold_time_sk is not null) and ws_ship_mode_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:web_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - Reduce Output Operator [RS_16] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string), _col2 (type: int), _col3 (type: string), _col4 (type: string), _col5 (type: string), _col6 (type: string) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_106] - predicate:w_warehouse_sk is not null (type: boolean) - Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:warehouse - Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 9 + File Output Operator [FS_76] + Limit [LIM_75] (rows=100 width=471) + Number of rows:100 + Select Operator [SEL_74] (rows=26136 width=471) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30","_col31","_col32","_col33","_col34","_col35","_col36","_col37","_col38","_col39","_col40","_col41","_col42","_col43"] + <-Reducer 8 [SIMPLE_EDGE] + SHUFFLE [RS_73] + Select Operator [SEL_72] (rows=26136 width=471) + Output:["_col0","_col1","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col2","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col3","_col30","_col31","_col32","_col33","_col34","_col35","_col36","_col37","_col38","_col39","_col4","_col40","_col41","_col42","_col43","_col5","_col6","_col8","_col9"] + Group By Operator [GBY_71] (rows=26136 width=471) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30","_col31","_col32","_col33","_col34","_col35","_col36","_col37","_col38","_col39","_col40","_col41","_col42","_col43"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)","sum(VALUE._col3)","sum(VALUE._col4)","sum(VALUE._col5)","sum(VALUE._col6)","sum(VALUE._col7)","sum(VALUE._col8)","sum(VALUE._col9)","sum(VALUE._col10)","sum(VALUE._col11)","sum(VALUE._col12)","sum(VALUE._col13)","sum(VALUE._col14)","sum(VALUE._col15)","sum(VALUE._col16)","sum(VALUE._col17)","sum(VALUE._col18)","sum(VALUE._col19)","sum(VALUE._col20)","sum(VALUE._col21)","sum(VALUE._col22)","sum(VALUE._col23)","sum(VALUE._col24)","sum(VALUE._col25)","sum(VALUE._col26)","sum(VALUE._col27)","sum(VALUE._col28)","sum(VALUE._col29)","sum(VALUE._col30)","sum(VALUE._col31)","sum(VALUE._col32)","sum(VALUE._col33)","sum(VALUE._col34)","sum(VALUE._col35)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4, KEY._col5, KEY._col6, KEY._col7 + <-Union 7 [SIMPLE_EDGE] + <-Reducer 19 [CONTAINS] + Reduce Output Operator [RS_70] + PartitionCols:_col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7 + Group By Operator [GBY_69] (rows=52272 width=471) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30","_col31","_col32","_col33","_col34","_col35","_col36","_col37","_col38","_col39","_col40","_col41","_col42","_col43"],aggregations:["sum(_col8)","sum(_col9)","sum(_col10)","sum(_col11)","sum(_col12)","sum(_col13)","sum(_col14)","sum(_col15)","sum(_col16)","sum(_col17)","sum(_col18)","sum(_col19)","sum(_col20)","sum(_col21)","sum(_col22)","sum(_col23)","sum(_col24)","sum(_col25)","sum(_col26)","sum(_col27)","sum(_col28)","sum(_col29)","sum(_col30)","sum(_col31)","sum(_col32)","sum(_col33)","sum(_col34)","sum(_col35)","sum(_col36)","sum(_col37)","sum(_col38)","sum(_col39)","sum(_col40)","sum(_col41)","sum(_col42)","sum(_col43)"],keys:_col0, _col1, _col2, _col3, _col4, _col5, _col6, 2002 + Select Operator [SEL_67] (rows=52272 width=471) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30","_col31","_col32","_col33","_col34","_col35","_col36","_col37","_col38","_col39","_col40","_col41","_col42","_col43"] + Select Operator [SEL_65] (rows=26136 width=471) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30"] + Group By Operator [GBY_64] (rows=26136 width=471) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)","sum(VALUE._col3)","sum(VALUE._col4)","sum(VALUE._col5)","sum(VALUE._col6)","sum(VALUE._col7)","sum(VALUE._col8)","sum(VALUE._col9)","sum(VALUE._col10)","sum(VALUE._col11)","sum(VALUE._col12)","sum(VALUE._col13)","sum(VALUE._col14)","sum(VALUE._col15)","sum(VALUE._col16)","sum(VALUE._col17)","sum(VALUE._col18)","sum(VALUE._col19)","sum(VALUE._col20)","sum(VALUE._col21)","sum(VALUE._col22)","sum(VALUE._col23)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4, KEY._col5, KEY._col6 + <-Reducer 18 [SIMPLE_EDGE] + SHUFFLE [RS_63] + PartitionCols:_col0, _col1, _col2, _col3, _col4, _col5, _col6 + Group By Operator [GBY_62] (rows=52272 width=471) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30"],aggregations:["sum(_col7)","sum(_col8)","sum(_col9)","sum(_col10)","sum(_col11)","sum(_col12)","sum(_col13)","sum(_col14)","sum(_col15)","sum(_col16)","sum(_col17)","sum(_col18)","sum(_col19)","sum(_col20)","sum(_col21)","sum(_col22)","sum(_col23)","sum(_col24)","sum(_col25)","sum(_col26)","sum(_col27)","sum(_col28)","sum(_col29)","sum(_col30)"],keys:_col0, _col1, _col2, _col3, _col4, _col5, 2002 + Select Operator [SEL_60] (rows=52272 width=471) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30"] + Merge Join Operator [MERGEJOIN_122] (rows=52272 width=471) + Output:["_col4","_col5","_col6","_col8","_col9","_col10","_col11","_col12","_col13","_col16"],keys:{"0":"_col2","1":"_col0"} + <-Map 23 [SIMPLE_EDGE] + SHUFFLE [RS_58] + PartitionCols:_col0 + Select Operator [SEL_47] (rows=1 width=0) + Output:["_col0"] + Filter Operator [FIL_114] (rows=1 width=0) + predicate:((sm_carrier) IN ('DIAMOND', 'AIRBORNE') and sm_ship_mode_sk is not null) + TableScan [TS_45] (rows=1 width=0) + default@ship_mode,ship_mode,Tbl:PARTIAL,Col:NONE,Output:["sm_ship_mode_sk","sm_carrier"] + <-Reducer 17 [SIMPLE_EDGE] + SHUFFLE [RS_57] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_121] (rows=47520 width=471) + Output:["_col2","_col4","_col5","_col6","_col8","_col9","_col10","_col11","_col12","_col13","_col16"],keys:{"0":"_col1","1":"_col0"} + <-Map 22 [SIMPLE_EDGE] + SHUFFLE [RS_55] + PartitionCols:_col0 + Select Operator [SEL_44] (rows=43200 width=471) + Output:["_col0"] + Filter Operator [FIL_113] (rows=43200 width=471) + predicate:(t_time BETWEEN 49530 AND 78330 and t_time_sk is not null) + TableScan [TS_42] (rows=86400 width=471) + default@time_dim,time_dim,Tbl:COMPLETE,Col:NONE,Output:["t_time_sk","t_time"] + <-Reducer 16 [SIMPLE_EDGE] + SHUFFLE [RS_54] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_120] (rows=40176 width=1119) + Output:["_col1","_col2","_col4","_col5","_col6","_col8","_col9","_col10","_col11","_col12","_col13","_col16"],keys:{"0":"_col0","1":"_col0"} + <-Map 21 [SIMPLE_EDGE] + SHUFFLE [RS_52] + PartitionCols:_col0 + Select Operator [SEL_41] (rows=36524 width=1119) + Output:["_col0","_col2"] + Filter Operator [FIL_112] (rows=36524 width=1119) + predicate:((d_year = 2002) and d_date_sk is not null) + TableScan [TS_39] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"] + <-Reducer 15 [SIMPLE_EDGE] + SHUFFLE [RS_51] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_119] (rows=29 width=1054) + Output:["_col0","_col1","_col2","_col4","_col5","_col6","_col8","_col9","_col10","_col11","_col12","_col13"],keys:{"0":"_col3","1":"_col0"} + <-Map 14 [SIMPLE_EDGE] + SHUFFLE [RS_48] + PartitionCols:_col3 + Select Operator [SEL_35] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + Filter Operator [FIL_110] (rows=1 width=0) + predicate:(((cs_warehouse_sk is not null and cs_sold_date_sk is not null) and cs_sold_time_sk is not null) and cs_ship_mode_sk is not null) + TableScan [TS_33] (rows=1 width=0) + default@catalog_sales,catalog_sales,Tbl:PARTIAL,Col:NONE,Output:["cs_sold_date_sk","cs_sold_time_sk","cs_ship_mode_sk","cs_warehouse_sk","cs_quantity","cs_ext_sales_price","cs_net_paid_inc_ship_tax"] + <-Map 20 [SIMPLE_EDGE] + SHUFFLE [RS_49] + PartitionCols:_col0 + Select Operator [SEL_38] (rows=27 width=1029) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + Filter Operator [FIL_111] (rows=27 width=1029) + predicate:w_warehouse_sk is not null + TableScan [TS_36] (rows=27 width=1029) + default@warehouse,warehouse,Tbl:COMPLETE,Col:NONE,Output:["w_warehouse_sk","w_warehouse_name","w_warehouse_sq_ft","w_city","w_county","w_state","w_country"] + <-Reducer 6 [CONTAINS] + Reduce Output Operator [RS_70] + PartitionCols:_col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7 + Group By Operator [GBY_69] (rows=52272 width=471) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30","_col31","_col32","_col33","_col34","_col35","_col36","_col37","_col38","_col39","_col40","_col41","_col42","_col43"],aggregations:["sum(_col8)","sum(_col9)","sum(_col10)","sum(_col11)","sum(_col12)","sum(_col13)","sum(_col14)","sum(_col15)","sum(_col16)","sum(_col17)","sum(_col18)","sum(_col19)","sum(_col20)","sum(_col21)","sum(_col22)","sum(_col23)","sum(_col24)","sum(_col25)","sum(_col26)","sum(_col27)","sum(_col28)","sum(_col29)","sum(_col30)","sum(_col31)","sum(_col32)","sum(_col33)","sum(_col34)","sum(_col35)","sum(_col36)","sum(_col37)","sum(_col38)","sum(_col39)","sum(_col40)","sum(_col41)","sum(_col42)","sum(_col43)"],keys:_col0, _col1, _col2, _col3, _col4, _col5, _col6, 2002 + Select Operator [SEL_67] (rows=52272 width=471) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30","_col31","_col32","_col33","_col34","_col35","_col36","_col37","_col38","_col39","_col40","_col41","_col42","_col43"] + Select Operator [SEL_32] (rows=26136 width=471) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30"] + Group By Operator [GBY_31] (rows=26136 width=471) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)","sum(VALUE._col3)","sum(VALUE._col4)","sum(VALUE._col5)","sum(VALUE._col6)","sum(VALUE._col7)","sum(VALUE._col8)","sum(VALUE._col9)","sum(VALUE._col10)","sum(VALUE._col11)","sum(VALUE._col12)","sum(VALUE._col13)","sum(VALUE._col14)","sum(VALUE._col15)","sum(VALUE._col16)","sum(VALUE._col17)","sum(VALUE._col18)","sum(VALUE._col19)","sum(VALUE._col20)","sum(VALUE._col21)","sum(VALUE._col22)","sum(VALUE._col23)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4, KEY._col5, KEY._col6 + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_30] + PartitionCols:_col0, _col1, _col2, _col3, _col4, _col5, _col6 + Group By Operator [GBY_29] (rows=52272 width=471) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30"],aggregations:["sum(_col7)","sum(_col8)","sum(_col9)","sum(_col10)","sum(_col11)","sum(_col12)","sum(_col13)","sum(_col14)","sum(_col15)","sum(_col16)","sum(_col17)","sum(_col18)","sum(_col19)","sum(_col20)","sum(_col21)","sum(_col22)","sum(_col23)","sum(_col24)","sum(_col25)","sum(_col26)","sum(_col27)","sum(_col28)","sum(_col29)","sum(_col30)"],keys:_col0, _col1, _col2, _col3, _col4, _col5, 2002 + Select Operator [SEL_27] (rows=52272 width=471) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col7","_col8","_col9","_col10","_col11","_col12","_col13","_col14","_col15","_col16","_col17","_col18","_col19","_col20","_col21","_col22","_col23","_col24","_col25","_col26","_col27","_col28","_col29","_col30"] + Merge Join Operator [MERGEJOIN_118] (rows=52272 width=471) + Output:["_col4","_col5","_col6","_col8","_col9","_col10","_col11","_col12","_col13","_col16"],keys:{"0":"_col2","1":"_col0"} + <-Map 13 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col0 + Select Operator [SEL_14] (rows=1 width=0) + Output:["_col0"] + Filter Operator [FIL_109] (rows=1 width=0) + predicate:((sm_carrier) IN ('DIAMOND', 'AIRBORNE') and sm_ship_mode_sk is not null) + TableScan [TS_12] (rows=1 width=0) + default@ship_mode,ship_mode,Tbl:PARTIAL,Col:NONE,Output:["sm_ship_mode_sk","sm_carrier"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_24] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_117] (rows=47520 width=471) + Output:["_col2","_col4","_col5","_col6","_col8","_col9","_col10","_col11","_col12","_col13","_col16"],keys:{"0":"_col1","1":"_col0"} + <-Map 12 [SIMPLE_EDGE] + SHUFFLE [RS_22] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=43200 width=471) + Output:["_col0"] + Filter Operator [FIL_108] (rows=43200 width=471) + predicate:(t_time BETWEEN 49530 AND 78330 and t_time_sk is not null) + TableScan [TS_9] (rows=86400 width=471) + default@time_dim,time_dim,Tbl:COMPLETE,Col:NONE,Output:["t_time_sk","t_time"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_21] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_116] (rows=40176 width=1119) + Output:["_col1","_col2","_col4","_col5","_col6","_col8","_col9","_col10","_col11","_col12","_col13","_col16"],keys:{"0":"_col0","1":"_col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=36524 width=1119) + Output:["_col0","_col2"] + Filter Operator [FIL_107] (rows=36524 width=1119) + predicate:((d_year = 2002) and d_date_sk is not null) + TableScan [TS_6] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_115] (rows=29 width=1054) + Output:["_col0","_col1","_col2","_col4","_col5","_col6","_col8","_col9","_col10","_col11","_col12","_col13"],keys:{"0":"_col3","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col3 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + Filter Operator [FIL_105] (rows=1 width=0) + predicate:(((ws_warehouse_sk is not null and ws_sold_date_sk is not null) and ws_sold_time_sk is not null) and ws_ship_mode_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@web_sales,web_sales,Tbl:PARTIAL,Col:NONE,Output:["ws_sold_date_sk","ws_sold_time_sk","ws_ship_mode_sk","ws_warehouse_sk","ws_quantity","ws_sales_price","ws_net_paid_inc_tax"] + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=27 width=1029) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + Filter Operator [FIL_106] (rows=27 width=1029) + predicate:w_warehouse_sk is not null + TableScan [TS_3] (rows=27 width=1029) + default@warehouse,warehouse,Tbl:COMPLETE,Col:NONE,Output:["w_warehouse_sk","w_warehouse_name","w_warehouse_sq_ft","w_city","w_county","w_state","w_country"] diff --git a/ql/src/test/results/clientpositive/perf/query67.q.out b/ql/src/test/results/clientpositive/perf/query67.q.out index 0a61d0f..be7dc34 100644 --- a/ql/src/test/results/clientpositive/perf/query67.q.out +++ b/ql/src/test/results/clientpositive/perf/query67.q.out @@ -95,155 +95,83 @@ Reducer 6 <- Reducer 5 (SIMPLE_EDGE) Reducer 7 <- Reducer 6 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 7 - File Output Operator [FS_36] - compressed:false - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_35] - Number of rows:100 - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_34] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] - | Statistics:Num rows: 762300 Data size: 1094874777 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_33] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: int), _col5 (type: int), _col6 (type: int), _col7 (type: string), _col8 (type: decimal(28,2)), _col9 (type: int) - sort order:++++++++++ - Statistics:Num rows: 762300 Data size: 1094874777 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_29] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] - Statistics:Num rows: 762300 Data size: 1094874777 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_46] - predicate:(rank_window_0 <= 100) (type: boolean) - Statistics:Num rows: 762300 Data size: 1094874777 Basic stats: COMPLETE Column stats: NONE - PTF Operator [PTF_28] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col9(DESC)","partition by:":"_col0"}] - Statistics:Num rows: 2286900 Data size: 3284624331 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_27] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col9"] - | Statistics:Num rows: 2286900 Data size: 3284624331 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_26] - key expressions:_col0 (type: string), _col9 (type: decimal(28,2)) - Map-reduce partition columns:_col0 (type: string) - sort order:+- - Statistics:Num rows: 2286900 Data size: 3284624331 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: int), _col5 (type: int), _col6 (type: int), _col7 (type: string), _col9 (type: decimal(28,2)) - Group By Operator [GBY_25] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: string), KEY._col3 (type: string), KEY._col4 (type: int), KEY._col5 (type: int), KEY._col6 (type: int), KEY._col7 (type: string), KEY._col8 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col9"] - | Statistics:Num rows: 2286900 Data size: 3284624331 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_24] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: int), _col5 (type: int), _col6 (type: int), _col7 (type: string), _col8 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: int), _col5 (type: int), _col6 (type: int), _col7 (type: string), _col8 (type: string) - sort order:+++++++++ - Statistics:Num rows: 4573800 Data size: 6569248662 Basic stats: COMPLETE Column stats: NONE - value expressions:_col9 (type: decimal(28,2)) - Group By Operator [GBY_23] - aggregations:["sum(_col8)"] - keys:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: int), _col5 (type: int), _col6 (type: int), _col7 (type: string), '0' (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] - Statistics:Num rows: 4573800 Data size: 6569248662 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_21] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] - Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_53] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col3","_col4","_col7","_col8","_col9","_col11","_col13","_col14","_col15","_col16"] - | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string) - | Select Operator [SEL_11] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_50] - | predicate:i_item_sk is not null (type: boolean) - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 44193 Data size: 49453132 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: int), _col4 (type: decimal(7,2)), _col7 (type: int), _col8 (type: int), _col9 (type: int), _col11 (type: string) - Merge Join Operator [MERGEJOIN_52] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col3","_col4","_col7","_col8","_col9","_col11"] - | Statistics:Num rows: 44193 Data size: 49453132 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_16] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_49] - | predicate:s_store_sk is not null (type: boolean) - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:store - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_15] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col3 (type: int), _col4 (type: decimal(7,2)), _col7 (type: int), _col8 (type: int), _col9 (type: int) - Merge Join Operator [MERGEJOIN_51] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3","_col4","_col7","_col8","_col9"] - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_12] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_47] - | predicate:((ss_sold_date_sk is not null and ss_store_sk is not null) and ss_item_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_13] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: int), _col3 (type: int), _col4 (type: int) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col2","_col3","_col4"] - Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_48] - predicate:(d_month_seq BETWEEN 1193 AND 1204 and d_date_sk is not null) (type: boolean) - Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:date_dim - Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 7 + File Output Operator [FS_36] + Limit [LIM_35] (rows=100 width=1436) + Number of rows:100 + Select Operator [SEL_34] (rows=762300 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_33] + Select Operator [SEL_29] (rows=762300 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] + Filter Operator [FIL_46] (rows=762300 width=1436) + predicate:(rank_window_0 <= 100) + PTF Operator [PTF_28] (rows=2286900 width=1436) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col9(DESC)","partition by:":"_col0"}] + Select Operator [SEL_27] (rows=2286900 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col9"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_26] + PartitionCols:_col0 + Group By Operator [GBY_25] (rows=2286900 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col9"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4, KEY._col5, KEY._col6, KEY._col7, KEY._col8 + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_24] + PartitionCols:_col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8 + Group By Operator [GBY_23] (rows=4573800 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"],aggregations:["sum(_col8)"],keys:_col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, '0' + Select Operator [SEL_21] (rows=508200 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] + Merge Join Operator [MERGEJOIN_53] (rows=508200 width=1436) + Output:["_col3","_col4","_col7","_col8","_col9","_col11","_col13","_col14","_col15","_col16"],keys:{"0":"_col1","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=462000 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_50] (rows=462000 width=1436) + predicate:i_item_sk is not null + TableScan [TS_9] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_brand","i_class","i_category","i_product_name"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_52] (rows=44193 width=1119) + Output:["_col1","_col3","_col4","_col7","_col8","_col9","_col11"],keys:{"0":"_col2","1":"_col0"} + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=1704 width=1910) + Output:["_col0","_col1"] + Filter Operator [FIL_49] (rows=1704 width=1910) + predicate:s_store_sk is not null + TableScan [TS_6] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_store_id"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_51] (rows=40176 width=1119) + Output:["_col1","_col2","_col3","_col4","_col7","_col8","_col9"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_47] (rows=1 width=0) + predicate:((ss_sold_date_sk is not null and ss_store_sk is not null) and ss_item_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_store_sk","ss_quantity","ss_sales_price"] + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=36524 width=1119) + Output:["_col0","_col2","_col3","_col4"] + Filter Operator [FIL_48] (rows=36524 width=1119) + predicate:(d_month_seq BETWEEN 1193 AND 1204 and d_date_sk is not null) + TableScan [TS_3] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_month_seq","d_year","d_moy","d_qoy"] diff --git a/ql/src/test/results/clientpositive/perf/query68.q.out b/ql/src/test/results/clientpositive/perf/query68.q.out index 8ecde89..af1d12b 100644 --- a/ql/src/test/results/clientpositive/perf/query68.q.out +++ b/ql/src/test/results/clientpositive/perf/query68.q.out @@ -15,227 +15,120 @@ Reducer 8 <- Map 15 (SIMPLE_EDGE), Reducer 7 (SIMPLE_EDGE) Reducer 9 <- Reducer 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 9 - File Output Operator [FS_50] - compressed:false - Statistics:Num rows: 100 Data size: 86000 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_49] - Number of rows:100 - Statistics:Num rows: 100 Data size: 86000 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_48] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - | Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_47] - key expressions:_col0 (type: string), _col4 (type: int) - sort order:++ - Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string), _col2 (type: string), _col3 (type: string), _col5 (type: decimal(17,2)), _col6 (type: decimal(17,2)), _col7 (type: decimal(17,2)) - Select Operator [SEL_46] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_45] - predicate:(_col11 <> _col2) (type: boolean) - Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_90] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col7 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2","_col3","_col4","_col5","_col8","_col9","_col11"] - | Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - |<-Map 15 [SIMPLE_EDGE] - | Reduce Output Operator [RS_43] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_38] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_84] - | predicate:ca_address_sk is not null (type: boolean) - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_36] - | alias:customer_address - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_42] - key expressions:_col7 (type: int) - Map-reduce partition columns:_col7 (type: int) - sort order:+ - Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col2 (type: string), _col3 (type: decimal(17,2)), _col4 (type: decimal(17,2)), _col5 (type: decimal(17,2)), _col8 (type: string), _col9 (type: string) - Merge Join Operator [MERGEJOIN_89] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2","_col3","_col4","_col5","_col7","_col8","_col9"] - | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - |<-Map 14 [SIMPLE_EDGE] - | Reduce Output Operator [RS_40] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: string), _col3 (type: string) - | Select Operator [SEL_35] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_83] - | predicate:(c_customer_sk is not null and c_current_addr_sk is not null) (type: boolean) - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_33] - | alias:customer - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_39] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col2 (type: string), _col3 (type: decimal(17,2)), _col4 (type: decimal(17,2)), _col5 (type: decimal(17,2)) - Select Operator [SEL_31] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_30] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] - | keys:KEY._col0 (type: int), KEY._col1 (type: int), KEY._col2 (type: int), KEY._col3 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_29] - key expressions:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: string) - Map-reduce partition columns:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: string) - sort order:++++ - Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: decimal(17,2)), _col5 (type: decimal(17,2)), _col6 (type: decimal(17,2)) - Group By Operator [GBY_28] - aggregations:["sum(_col6)","sum(_col7)","sum(_col8)"] - keys:_col1 (type: int), _col3 (type: int), _col5 (type: int), _col18 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_27] - outputColumnNames:["_col1","_col3","_col5","_col18","_col6","_col7","_col8"] - Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_88] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col3","_col5","_col6","_col7","_col8","_col18"] - | Statistics:Num rows: 44000000 Data size: 44654715780 Basic stats: COMPLETE Column stats: NONE - |<-Map 13 [SIMPLE_EDGE] - | Reduce Output Operator [RS_25] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_14] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_82] - | predicate:ca_address_sk is not null (type: boolean) - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_12] - | alias:customer_address - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_24] - key expressions:_col3 (type: int) - Map-reduce partition columns:_col3 (type: int) - sort order:+ - Statistics:Num rows: 24305 Data size: 27199223 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col5 (type: int), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_87] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col3","_col5","_col6","_col7","_col8"] - | Statistics:Num rows: 24305 Data size: 27199223 Basic stats: COMPLETE Column stats: NONE - |<-Map 12 [SIMPLE_EDGE] - | Reduce Output Operator [RS_22] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_11] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_81] - | predicate:(((hd_dep_count = 4) or (hd_vehicle_count = 2)) and hd_demo_sk is not null) (type: boolean) - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:household_demographics - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_21] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 22096 Data size: 24726566 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col3 (type: int), _col5 (type: int), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_86] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col4 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3","_col5","_col6","_col7","_col8"] - | Statistics:Num rows: 22096 Data size: 24726566 Basic stats: COMPLETE Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_8] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_80] - | predicate:((s_city) IN ('Rosedale', 'Bethlehem') and s_store_sk is not null) (type: boolean) - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:store - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col4 (type: int) - Map-reduce partition columns:_col4 (type: int) - sort order:+ - Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col5 (type: int), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_85] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_15] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: int), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_78] - | predicate:((((ss_sold_date_sk is not null and ss_store_sk is not null) and ss_hdemo_sk is not null) and ss_addr_sk is not null) and ss_customer_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - Reduce Output Operator [RS_16] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_79] - predicate:(((d_year) IN (1998, 1999, 2000) and d_dom BETWEEN 1 AND 2) and d_date_sk is not null) (type: boolean) - Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:date_dim - Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 9 + File Output Operator [FS_50] + Limit [LIM_49] (rows=100 width=860) + Number of rows:100 + Select Operator [SEL_48] (rows=96800003 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] + <-Reducer 8 [SIMPLE_EDGE] + SHUFFLE [RS_47] + Select Operator [SEL_46] (rows=96800003 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] + Filter Operator [FIL_45] (rows=96800003 width=860) + predicate:(_col11 <> _col2) + Merge Join Operator [MERGEJOIN_90] (rows=96800003 width=860) + Output:["_col0","_col2","_col3","_col4","_col5","_col8","_col9","_col11"],keys:{"0":"_col7","1":"_col0"} + <-Map 15 [SIMPLE_EDGE] + SHUFFLE [RS_43] + PartitionCols:_col0 + Select Operator [SEL_38] (rows=40000000 width=1014) + Output:["_col0","_col1"] + Filter Operator [FIL_84] (rows=40000000 width=1014) + predicate:ca_address_sk is not null + TableScan [TS_36] (rows=40000000 width=1014) + default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_city"] + <-Reducer 7 [SIMPLE_EDGE] + SHUFFLE [RS_42] + PartitionCols:_col7 + Merge Join Operator [MERGEJOIN_89] (rows=88000001 width=860) + Output:["_col0","_col2","_col3","_col4","_col5","_col7","_col8","_col9"],keys:{"0":"_col1","1":"_col0"} + <-Map 14 [SIMPLE_EDGE] + SHUFFLE [RS_40] + PartitionCols:_col0 + Select Operator [SEL_35] (rows=80000000 width=860) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_83] (rows=80000000 width=860) + predicate:(c_customer_sk is not null and c_current_addr_sk is not null) + TableScan [TS_33] (rows=80000000 width=860) + default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_current_addr_sk","c_first_name","c_last_name"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_39] + PartitionCols:_col1 + Select Operator [SEL_31] (rows=22000000 width=1014) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Group By Operator [GBY_30] (rows=22000000 width=1014) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3 + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_29] + PartitionCols:_col0, _col1, _col2, _col3 + Group By Operator [GBY_28] (rows=44000000 width=1014) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"],aggregations:["sum(_col6)","sum(_col7)","sum(_col8)"],keys:_col1, _col3, _col5, _col18 + Select Operator [SEL_27] (rows=44000000 width=1014) + Output:["_col1","_col3","_col5","_col18","_col6","_col7","_col8"] + Merge Join Operator [MERGEJOIN_88] (rows=44000000 width=1014) + Output:["_col1","_col3","_col5","_col6","_col7","_col8","_col18"],keys:{"0":"_col3","1":"_col0"} + <-Map 13 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col0 + Select Operator [SEL_14] (rows=40000000 width=1014) + Output:["_col0","_col1"] + Filter Operator [FIL_82] (rows=40000000 width=1014) + predicate:ca_address_sk is not null + TableScan [TS_12] (rows=40000000 width=1014) + default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_city"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_24] + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_87] (rows=24305 width=1119) + Output:["_col1","_col3","_col5","_col6","_col7","_col8"],keys:{"0":"_col2","1":"_col0"} + <-Map 12 [SIMPLE_EDGE] + SHUFFLE [RS_22] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=7200 width=107) + Output:["_col0"] + Filter Operator [FIL_81] (rows=7200 width=107) + predicate:(((hd_dep_count = 4) or (hd_vehicle_count = 2)) and hd_demo_sk is not null) + TableScan [TS_9] (rows=7200 width=107) + default@household_demographics,household_demographics,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_dep_count","hd_vehicle_count"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_21] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_86] (rows=22096 width=1119) + Output:["_col1","_col2","_col3","_col5","_col6","_col7","_col8"],keys:{"0":"_col4","1":"_col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=852 width=1910) + Output:["_col0"] + Filter Operator [FIL_80] (rows=852 width=1910) + predicate:((s_city) IN ('Rosedale', 'Bethlehem') and s_store_sk is not null) + TableScan [TS_6] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_city"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col4 + Merge Join Operator [MERGEJOIN_85] (rows=20088 width=1119) + Output:["_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] + Filter Operator [FIL_78] (rows=1 width=0) + predicate:((((ss_sold_date_sk is not null and ss_store_sk is not null) and ss_hdemo_sk is not null) and ss_addr_sk is not null) and ss_customer_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_customer_sk","ss_hdemo_sk","ss_addr_sk","ss_store_sk","ss_ticket_number","ss_ext_sales_price","ss_ext_list_price","ss_ext_tax"] + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_79] (rows=18262 width=1119) + predicate:(((d_year) IN (1998, 1999, 2000) and d_dom BETWEEN 1 AND 2) and d_date_sk is not null) + TableScan [TS_3] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_dom"] diff --git a/ql/src/test/results/clientpositive/perf/query7.q.out b/ql/src/test/results/clientpositive/perf/query7.q.out index a463a8b..f7b9e91 100644 --- a/ql/src/test/results/clientpositive/perf/query7.q.out +++ b/ql/src/test/results/clientpositive/perf/query7.q.out @@ -13,162 +13,86 @@ Reducer 6 <- Reducer 5 (SIMPLE_EDGE) Reducer 7 <- Reducer 6 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 7 - File Output Operator [FS_35] - compressed:false - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_34] - Number of rows:100 - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_33] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 279510 Data size: 401454093 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_32] - key expressions:_col0 (type: string) - sort order:+ - Statistics:Num rows: 279510 Data size: 401454093 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: double), _col2 (type: decimal(11,6)), _col3 (type: decimal(11,6)), _col4 (type: decimal(11,6)) - Group By Operator [GBY_30] - | aggregations:["avg(VALUE._col0)","avg(VALUE._col1)","avg(VALUE._col2)","avg(VALUE._col3)"] - | keys:KEY._col0 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 279510 Data size: 401454093 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_29] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: struct), _col2 (type: struct), _col3 (type: struct), _col4 (type: struct) - Group By Operator [GBY_28] - aggregations:["avg(_col4)","avg(_col5)","avg(_col7)","avg(_col6)"] - keys:_col15 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_27] - outputColumnNames:["_col15","_col4","_col5","_col7","_col6"] - Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_58] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col4","_col5","_col6","_col7","_col15"] - | Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_25] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 2300 Data size: 2713420 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_14] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 2300 Data size: 2713420 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_54] - | predicate:(((p_channel_email = 'N') or (p_channel_event = 'N')) and p_promo_sk is not null) (type: boolean) - | Statistics:Num rows: 2300 Data size: 2713420 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_12] - | alias:promotion - | Statistics:Num rows: 2300 Data size: 2713420 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_24] - key expressions:_col3 (type: int) - Map-reduce partition columns:_col3 (type: int) - sort order:+ - Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)), _col15 (type: string) - Merge Join Operator [MERGEJOIN_57] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col3","_col4","_col5","_col6","_col7","_col15"] - | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_22] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_11] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_53] - | predicate:i_item_sk is not null (type: boolean) - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_21] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: int), _col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_56] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col3","_col4","_col5","_col6","_col7"] - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_8] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_52] - | predicate:((d_year = 1998) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 2722 Data size: 986020 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_55] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col1","_col3","_col4","_col5","_col6","_col7"] - | Statistics:Num rows: 2722 Data size: 986020 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_15] - | key expressions:_col2 (type: int) - | Map-reduce partition columns:_col2 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col1 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_50] - | predicate:(((ss_cdemo_sk is not null and ss_sold_date_sk is not null) and ss_item_sk is not null) and ss_promo_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_16] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 2475 Data size: 896382 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 2475 Data size: 896382 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_51] - predicate:((((cd_gender = 'F') and (cd_marital_status = 'W')) and (cd_education_status = 'Primary')) and cd_demo_sk is not null) (type: boolean) - Statistics:Num rows: 2475 Data size: 896382 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:customer_demographics - Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 7 + File Output Operator [FS_35] + Limit [LIM_34] (rows=100 width=1436) + Number of rows:100 + Select Operator [SEL_33] (rows=279510 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_32] + Group By Operator [GBY_30] (rows=279510 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4"],aggregations:["avg(VALUE._col0)","avg(VALUE._col1)","avg(VALUE._col2)","avg(VALUE._col3)"],keys:KEY._col0 + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_29] + PartitionCols:_col0 + Group By Operator [GBY_28] (rows=559020 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4"],aggregations:["avg(_col4)","avg(_col5)","avg(_col7)","avg(_col6)"],keys:_col15 + Select Operator [SEL_27] (rows=559020 width=1436) + Output:["_col15","_col4","_col5","_col7","_col6"] + Merge Join Operator [MERGEJOIN_58] (rows=559020 width=1436) + Output:["_col4","_col5","_col6","_col7","_col15"],keys:{"0":"_col3","1":"_col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col0 + Select Operator [SEL_14] (rows=2300 width=1179) + Output:["_col0"] + Filter Operator [FIL_54] (rows=2300 width=1179) + predicate:(((p_channel_email = 'N') or (p_channel_event = 'N')) and p_promo_sk is not null) + TableScan [TS_12] (rows=2300 width=1179) + default@promotion,promotion,Tbl:COMPLETE,Col:NONE,Output:["p_promo_sk","p_channel_email","p_channel_event"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_24] + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_57] (rows=508200 width=1436) + Output:["_col3","_col4","_col5","_col6","_col7","_col15"],keys:{"0":"_col1","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_22] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=462000 width=1436) + Output:["_col0","_col1"] + Filter Operator [FIL_53] (rows=462000 width=1436) + predicate:i_item_sk is not null + TableScan [TS_9] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_21] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_56] (rows=40176 width=1119) + Output:["_col1","_col3","_col4","_col5","_col6","_col7"],keys:{"0":"_col0","1":"_col0"} + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_52] (rows=36524 width=1119) + predicate:((d_year = 1998) and d_date_sk is not null) + TableScan [TS_6] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_55] (rows=2722 width=362) + Output:["_col0","_col1","_col3","_col4","_col5","_col6","_col7"],keys:{"0":"_col2","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col2 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] + Filter Operator [FIL_50] (rows=1 width=0) + predicate:(((ss_cdemo_sk is not null and ss_sold_date_sk is not null) and ss_item_sk is not null) and ss_promo_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_cdemo_sk","ss_promo_sk","ss_quantity","ss_list_price","ss_sales_price","ss_coupon_amt"] + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=2475 width=362) + Output:["_col0"] + Filter Operator [FIL_51] (rows=2475 width=362) + predicate:((((cd_gender = 'F') and (cd_marital_status = 'W')) and (cd_education_status = 'Primary')) and cd_demo_sk is not null) + TableScan [TS_3] (rows=19800 width=362) + default@customer_demographics,customer_demographics,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_gender","cd_marital_status","cd_education_status"] diff --git a/ql/src/test/results/clientpositive/perf/query70.q.out b/ql/src/test/results/clientpositive/perf/query70.q.out index d8fd350..668b62e 100644 --- a/ql/src/test/results/clientpositive/perf/query70.q.out +++ b/ql/src/test/results/clientpositive/perf/query70.q.out @@ -17,252 +17,133 @@ Reducer 6 <- Reducer 5 (SIMPLE_EDGE) Reducer 9 <- Map 8 (SIMPLE_EDGE), Reducer 14 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 6 - File Output Operator [FS_61] - compressed:false - Statistics:Num rows: 100 Data size: 111900 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_60] - Number of rows:100 - Statistics:Num rows: 100 Data size: 111900 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_59] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 66289 Data size: 74179138 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_58] - key expressions:_col3 (type: string), CASE WHEN ((_col3 = 0)) THEN (_col1) END (type: string), _col4 (type: int) - sort order:-++ - Statistics:Num rows: 66289 Data size: 74179138 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: decimal(17,2)), _col1 (type: string), _col2 (type: string) - Select Operator [SEL_56] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - Statistics:Num rows: 66289 Data size: 74179138 Basic stats: COMPLETE Column stats: NONE - PTF Operator [PTF_55] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col4","partition by:":"_col5, CASE WHEN ((_col5 = 2)) THEN (_col0) END"}] - Statistics:Num rows: 66289 Data size: 74179138 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_54] - | outputColumnNames:["_col0","_col1","_col4","_col5"] - | Statistics:Num rows: 66289 Data size: 74179138 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_53] - key expressions:_col5 (type: string), CASE WHEN ((_col5 = 2)) THEN (_col0) END (type: string), _col4 (type: decimal(17,2)) - Map-reduce partition columns:_col5 (type: string), CASE WHEN ((_col5 = 2)) THEN (_col0) END (type: string) - sort order:+++ - Statistics:Num rows: 66289 Data size: 74179138 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: string), _col1 (type: string) - Select Operator [SEL_52] - outputColumnNames:["_col0","_col1","_col4","_col5"] - Statistics:Num rows: 66289 Data size: 74179138 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_51] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 66289 Data size: 74179138 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_50] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: string) - sort order:+++ - Statistics:Num rows: 132579 Data size: 148359396 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: decimal(17,2)) - Group By Operator [GBY_49] - aggregations:["sum(_col2)"] - keys:_col6 (type: string), _col7 (type: string), '0' (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 132579 Data size: 148359396 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_48] - outputColumnNames:["_col6","_col7","_col2"] - Statistics:Num rows: 44193 Data size: 49453132 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_90] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col2","_col6","_col7"] - | Statistics:Num rows: 44193 Data size: 49453132 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - | Reduce Output Operator [RS_45] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col2 (type: decimal(7,2)) - | Merge Join Operator [MERGEJOIN_86] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col2"] - | | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | |<-Map 1 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_42] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col1 (type: int), _col2 (type: decimal(7,2)) - | | Select Operator [SEL_2] - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_79] - | | predicate:(ss_sold_date_sk is not null and ss_store_sk is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_0] - | | alias:ss - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 7 [SIMPLE_EDGE] - | Reduce Output Operator [RS_43] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_5] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_80] - | predicate:(d_month_seq BETWEEN 1193 AND 1204 and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_3] - | alias:d1 - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 9 [SIMPLE_EDGE] - Reduce Output Operator [RS_46] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 7365 Data size: 8242187 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string), _col2 (type: string) - Merge Join Operator [MERGEJOIN_89] - | condition map:[{"":"Left Semi Join 0 to 1"}] - | keys:{"0":"_col2 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 7365 Data size: 8242187 Basic stats: COMPLETE Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - | Reduce Output Operator [RS_38] - | key expressions:_col2 (type: string) - | Map-reduce partition columns:_col2 (type: string) - | sort order:+ - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: int), _col1 (type: string) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_81] - | predicate:(s_store_sk is not null and s_state is not null) (type: boolean) - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:s - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 14 [SIMPLE_EDGE] - Reduce Output Operator [RS_39] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 6696 Data size: 7492898 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_37] - keys:_col0 (type: string) - outputColumnNames:["_col0"] - Statistics:Num rows: 6696 Data size: 7492898 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_31] - outputColumnNames:["_col0"] - Statistics:Num rows: 6696 Data size: 7492898 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_82] - predicate:((rank_window_0 <= 5) and _col0 is not null) (type: boolean) - Statistics:Num rows: 6696 Data size: 7492898 Basic stats: COMPLETE Column stats: NONE - PTF Operator [PTF_30] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col1(DESC)","partition by:":"_col0"}] - Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_29] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 13 [SIMPLE_EDGE] - Reduce Output Operator [RS_28] - key expressions:_col0 (type: string), _col1 (type: decimal(17,2)) - Map-reduce partition columns:_col0 (type: string) - sort order:+- - Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: decimal(17,2)) - Group By Operator [GBY_27] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 12 [SIMPLE_EDGE] - Reduce Output Operator [RS_26] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: decimal(17,2)) - Group By Operator [GBY_25] - aggregations:["sum(_col2)"] - keys:_col4 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_24] - outputColumnNames:["_col4","_col2"] - Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_88] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col2","_col4"] - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - |<-Map 16 [SIMPLE_EDGE] - | Reduce Output Operator [RS_22] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_17] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_85] - | predicate:(d_month_seq BETWEEN 1193 AND 1204 and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_15] - | alias:d1 - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 11 [SIMPLE_EDGE] - Reduce Output Operator [RS_21] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1874 Data size: 3581903 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: decimal(7,2)), _col4 (type: string) - Merge Join Operator [MERGEJOIN_87] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2","_col4"] - | Statistics:Num rows: 1874 Data size: 3581903 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_18] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col2 (type: decimal(7,2)) - | Select Operator [SEL_11] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_83] - | predicate:(ss_store_sk is not null and ss_sold_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_9] - | alias:ss - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 15 [SIMPLE_EDGE] - Reduce Output Operator [RS_19] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string) - Select Operator [SEL_14] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_84] - predicate:s_store_sk is not null (type: boolean) - Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_12] - alias:s - Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 6 + File Output Operator [FS_61] + Limit [LIM_60] (rows=100 width=1119) + Number of rows:100 + Select Operator [SEL_59] (rows=66289 width=1119) + Output:["_col0","_col1","_col2","_col3","_col4"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_58] + Select Operator [SEL_56] (rows=66289 width=1119) + Output:["_col0","_col1","_col2","_col3","_col4"] + PTF Operator [PTF_55] (rows=66289 width=1119) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col4","partition by:":"_col5, CASE WHEN ((_col5 = 2)) THEN (_col0) END"}] + Select Operator [SEL_54] (rows=66289 width=1119) + Output:["_col0","_col1","_col4","_col5"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_53] + PartitionCols:_col5, CASE WHEN ((_col5 = 2)) THEN (_col0) END + Select Operator [SEL_52] (rows=66289 width=1119) + Output:["_col0","_col1","_col4","_col5"] + Group By Operator [GBY_51] (rows=66289 width=1119) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_50] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_49] (rows=132579 width=1119) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(_col2)"],keys:_col6, _col7, '0' + Select Operator [SEL_48] (rows=44193 width=1119) + Output:["_col6","_col7","_col2"] + Merge Join Operator [MERGEJOIN_90] (rows=44193 width=1119) + Output:["_col2","_col6","_col7"],keys:{"0":"_col1","1":"_col0"} + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_45] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_86] (rows=40176 width=1119) + Output:["_col1","_col2"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_42] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_79] (rows=1 width=0) + predicate:(ss_sold_date_sk is not null and ss_store_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,ss,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_store_sk","ss_net_profit"] + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_43] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_80] (rows=36524 width=1119) + predicate:(d_month_seq BETWEEN 1193 AND 1204 and d_date_sk is not null) + TableScan [TS_3] (rows=73049 width=1119) + default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_month_seq"] + <-Reducer 9 [SIMPLE_EDGE] + SHUFFLE [RS_46] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_89] (rows=7365 width=1119) + Output:["_col0","_col1","_col2"],keys:{"0":"_col2","1":"_col0"} + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_38] + PartitionCols:_col2 + Select Operator [SEL_8] (rows=1704 width=1910) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_81] (rows=1704 width=1910) + predicate:(s_store_sk is not null and s_state is not null) + TableScan [TS_6] (rows=1704 width=1910) + default@store,s,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_county","s_state"] + <-Reducer 14 [SIMPLE_EDGE] + SHUFFLE [RS_39] + PartitionCols:_col0 + Group By Operator [GBY_37] (rows=6696 width=1119) + Output:["_col0"],keys:_col0 + Select Operator [SEL_31] (rows=6696 width=1119) + Output:["_col0"] + Filter Operator [FIL_82] (rows=6696 width=1119) + predicate:((rank_window_0 <= 5) and _col0 is not null) + PTF Operator [PTF_30] (rows=20088 width=1119) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col1(DESC)","partition by:":"_col0"}] + Select Operator [SEL_29] (rows=20088 width=1119) + Output:["_col0","_col1"] + <-Reducer 13 [SIMPLE_EDGE] + SHUFFLE [RS_28] + PartitionCols:_col0 + Group By Operator [GBY_27] (rows=20088 width=1119) + Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0 + <-Reducer 12 [SIMPLE_EDGE] + SHUFFLE [RS_26] + PartitionCols:_col0 + Group By Operator [GBY_25] (rows=40176 width=1119) + Output:["_col0","_col1"],aggregations:["sum(_col2)"],keys:_col4 + Select Operator [SEL_24] (rows=40176 width=1119) + Output:["_col4","_col2"] + Merge Join Operator [MERGEJOIN_88] (rows=40176 width=1119) + Output:["_col2","_col4"],keys:{"0":"_col0","1":"_col0"} + <-Map 16 [SIMPLE_EDGE] + SHUFFLE [RS_22] + PartitionCols:_col0 + Select Operator [SEL_17] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_85] (rows=36524 width=1119) + predicate:(d_month_seq BETWEEN 1193 AND 1204 and d_date_sk is not null) + TableScan [TS_15] (rows=73049 width=1119) + default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_month_seq"] + <-Reducer 11 [SIMPLE_EDGE] + SHUFFLE [RS_21] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_87] (rows=1874 width=1911) + Output:["_col0","_col2","_col4"],keys:{"0":"_col1","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col1 + Select Operator [SEL_11] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_83] (rows=1 width=0) + predicate:(ss_store_sk is not null and ss_sold_date_sk is not null) + TableScan [TS_9] (rows=1 width=0) + default@store_sales,ss,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_store_sk","ss_net_profit"] + <-Map 15 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_14] (rows=1704 width=1910) + Output:["_col0","_col1"] + Filter Operator [FIL_84] (rows=1704 width=1910) + predicate:s_store_sk is not null + TableScan [TS_12] (rows=1704 width=1910) + default@store,s,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_state"] diff --git a/ql/src/test/results/clientpositive/perf/query71.q.out b/ql/src/test/results/clientpositive/perf/query71.q.out index fa50e56..55d5004 100644 --- a/ql/src/test/results/clientpositive/perf/query71.q.out +++ b/ql/src/test/results/clientpositive/perf/query71.q.out @@ -14,229 +14,123 @@ Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Reducer 7 <- Map 6 (SIMPLE_EDGE), Map 9 (SIMPLE_EDGE), Union 8 (CONTAINS) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 5 - File Output Operator [FS_53] - compressed:false - Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_52] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_51] - key expressions:_col4 (type: decimal(17,2)), _col0 (type: int) - sort order:-+ - Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string), _col2 (type: int), _col3 (type: int) - Group By Operator [GBY_48] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: int), KEY._col1 (type: string), KEY._col2 (type: int), KEY._col3 (type: int) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_47] - key expressions:_col0 (type: int), _col1 (type: string), _col2 (type: int), _col3 (type: int) - Map-reduce partition columns:_col0 (type: int), _col1 (type: string), _col2 (type: int), _col3 (type: int) - sort order:++++ - Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: decimal(17,2)) - Group By Operator [GBY_46] - aggregations:["sum(_col4)"] - keys:_col1 (type: int), _col2 (type: string), _col8 (type: int), _col9 (type: int) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_45] - outputColumnNames:["_col1","_col2","_col8","_col9","_col4"] - Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_87] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col6 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col4","_col8","_col9"] - | Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - |<-Map 16 [SIMPLE_EDGE] - | Reduce Output Operator [RS_43] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 86400 Data size: 40694400 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: int) - | Select Operator [SEL_38] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 86400 Data size: 40694400 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_82] - | predicate:(((t_meal_time = 'breakfast') or (t_meal_time = 'dinner')) and t_time_sk is not null) (type: boolean) - | Statistics:Num rows: 86400 Data size: 40694400 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_36] - | alias:time_dim - | Statistics:Num rows: 86400 Data size: 40694400 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_42] - key expressions:_col6 (type: int) - Map-reduce partition columns:_col6 (type: int) - sort order:+ - Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col2 (type: string), _col4 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_86] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col1 (type: int)"} - | outputColumnNames:["_col1","_col2","_col4","_col6"] - | Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_39] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: string) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_75] - | predicate:((i_manager_id = 1) and i_item_sk is not null) (type: boolean) - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Union 8 [SIMPLE_EDGE] - |<-Reducer 11 [CONTAINS] - | Reduce Output Operator [RS_40] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 60264 Data size: 67436088 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: decimal(7,2)), _col2 (type: int) - | Select Operator [SEL_22] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_84] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col2","_col3"] - | | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | |<-Map 10 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_19] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: decimal(7,2)) - | | Select Operator [SEL_15] - | | outputColumnNames:["_col0","_col1","_col2","_col3"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_78] - | | predicate:((cs_sold_date_sk is not null and cs_item_sk is not null) and cs_sold_time_sk is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_13] - | | alias:catalog_sales - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 12 [SIMPLE_EDGE] - | Reduce Output Operator [RS_20] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_18] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_79] - | predicate:(((d_moy = 12) and d_date_sk is not null) and (d_year = 2001)) (type: boolean) - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_16] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 14 [CONTAINS] - | Reduce Output Operator [RS_40] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 60264 Data size: 67436088 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: decimal(7,2)), _col2 (type: int) - | Select Operator [SEL_34] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_85] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col2","_col3"] - | | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | |<-Map 13 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_31] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: decimal(7,2)) - | | Select Operator [SEL_27] - | | outputColumnNames:["_col0","_col1","_col2","_col3"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_80] - | | predicate:((ss_sold_date_sk is not null and ss_item_sk is not null) and ss_sold_time_sk is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_25] - | | alias:store_sales - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 15 [SIMPLE_EDGE] - | Reduce Output Operator [RS_32] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_30] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_81] - | predicate:(((d_moy = 12) and d_date_sk is not null) and (d_year = 2001)) (type: boolean) - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_28] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 7 [CONTAINS] - Reduce Output Operator [RS_40] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 60264 Data size: 67436088 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: decimal(7,2)), _col2 (type: int) - Select Operator [SEL_12] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_83] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3"] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - |<-Map 6 [SIMPLE_EDGE] - | Reduce Output Operator [RS_9] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: decimal(7,2)) - | Select Operator [SEL_5] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_76] - | predicate:((ws_sold_date_sk is not null and ws_item_sk is not null) and ws_sold_time_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_3] - | alias:web_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_8] - outputColumnNames:["_col0"] - Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_77] - predicate:(((d_moy = 12) and d_date_sk is not null) and (d_year = 2001)) (type: boolean) - Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_6] - alias:date_dim - Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 5 + File Output Operator [FS_53] + Select Operator [SEL_52] (rows=139755 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_51] + Group By Operator [GBY_48] (rows=139755 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3 + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_47] + PartitionCols:_col0, _col1, _col2, _col3 + Group By Operator [GBY_46] (rows=279510 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4"],aggregations:["sum(_col4)"],keys:_col1, _col2, _col8, _col9 + Select Operator [SEL_45] (rows=279510 width=1436) + Output:["_col1","_col2","_col8","_col9","_col4"] + Merge Join Operator [MERGEJOIN_87] (rows=279510 width=1436) + Output:["_col1","_col2","_col4","_col8","_col9"],keys:{"0":"_col6","1":"_col0"} + <-Map 16 [SIMPLE_EDGE] + SHUFFLE [RS_43] + PartitionCols:_col0 + Select Operator [SEL_38] (rows=86400 width=471) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_82] (rows=86400 width=471) + predicate:(((t_meal_time = 'breakfast') or (t_meal_time = 'dinner')) and t_time_sk is not null) + TableScan [TS_36] (rows=86400 width=471) + default@time_dim,time_dim,Tbl:COMPLETE,Col:NONE,Output:["t_time_sk","t_hour","t_minute","t_meal_time"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_42] + PartitionCols:_col6 + Merge Join Operator [MERGEJOIN_86] (rows=254100 width=1436) + Output:["_col1","_col2","_col4","_col6"],keys:{"0":"_col0","1":"_col1"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_39] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=231000 width=1436) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_75] (rows=231000 width=1436) + predicate:((i_manager_id = 1) and i_item_sk is not null) + TableScan [TS_0] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_brand_id","i_brand","i_manager_id"] + <-Union 8 [SIMPLE_EDGE] + <-Reducer 11 [CONTAINS] + Reduce Output Operator [RS_40] + PartitionCols:_col1 + Select Operator [SEL_22] (rows=20088 width=1119) + Output:["_col0","_col1","_col2"] + Merge Join Operator [MERGEJOIN_84] (rows=20088 width=1119) + Output:["_col1","_col2","_col3"],keys:{"0":"_col0","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_15] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_78] (rows=1 width=0) + predicate:((cs_sold_date_sk is not null and cs_item_sk is not null) and cs_sold_time_sk is not null) + TableScan [TS_13] (rows=1 width=0) + default@catalog_sales,catalog_sales,Tbl:PARTIAL,Col:NONE,Output:["cs_sold_date_sk","cs_sold_time_sk","cs_item_sk","cs_ext_sales_price"] + <-Map 12 [SIMPLE_EDGE] + SHUFFLE [RS_20] + PartitionCols:_col0 + Select Operator [SEL_18] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_79] (rows=18262 width=1119) + predicate:(((d_moy = 12) and d_date_sk is not null) and (d_year = 2001)) + TableScan [TS_16] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"] + <-Reducer 14 [CONTAINS] + Reduce Output Operator [RS_40] + PartitionCols:_col1 + Select Operator [SEL_34] (rows=20088 width=1119) + Output:["_col0","_col1","_col2"] + Merge Join Operator [MERGEJOIN_85] (rows=20088 width=1119) + Output:["_col1","_col2","_col3"],keys:{"0":"_col0","1":"_col0"} + <-Map 13 [SIMPLE_EDGE] + SHUFFLE [RS_31] + PartitionCols:_col0 + Select Operator [SEL_27] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_80] (rows=1 width=0) + predicate:((ss_sold_date_sk is not null and ss_item_sk is not null) and ss_sold_time_sk is not null) + TableScan [TS_25] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_sold_time_sk","ss_item_sk","ss_ext_sales_price"] + <-Map 15 [SIMPLE_EDGE] + SHUFFLE [RS_32] + PartitionCols:_col0 + Select Operator [SEL_30] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_81] (rows=18262 width=1119) + predicate:(((d_moy = 12) and d_date_sk is not null) and (d_year = 2001)) + TableScan [TS_28] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"] + <-Reducer 7 [CONTAINS] + Reduce Output Operator [RS_40] + PartitionCols:_col1 + Select Operator [SEL_12] (rows=20088 width=1119) + Output:["_col0","_col1","_col2"] + Merge Join Operator [MERGEJOIN_83] (rows=20088 width=1119) + Output:["_col1","_col2","_col3"],keys:{"0":"_col0","1":"_col0"} + <-Map 6 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_76] (rows=1 width=0) + predicate:((ws_sold_date_sk is not null and ws_item_sk is not null) and ws_sold_time_sk is not null) + TableScan [TS_3] (rows=1 width=0) + default@web_sales,web_sales,Tbl:PARTIAL,Col:NONE,Output:["ws_sold_date_sk","ws_sold_time_sk","ws_item_sk","ws_ext_sales_price"] + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_10] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_77] (rows=18262 width=1119) + predicate:(((d_moy = 12) and d_date_sk is not null) and (d_year = 2001)) + TableScan [TS_6] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"] diff --git a/ql/src/test/results/clientpositive/perf/query72.q.out b/ql/src/test/results/clientpositive/perf/query72.q.out index bb56f0d..3063727 100644 --- a/ql/src/test/results/clientpositive/perf/query72.q.out +++ b/ql/src/test/results/clientpositive/perf/query72.q.out @@ -19,334 +19,174 @@ Reducer 8 <- Map 20 (SIMPLE_EDGE), Reducer 7 (SIMPLE_EDGE) Reducer 9 <- Map 21 (SIMPLE_EDGE), Reducer 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 13 - File Output Operator [FS_74] - compressed:false - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_73] - Number of rows:100 - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_72] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 165056 Data size: 237066834 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 12 [SIMPLE_EDGE] - Reduce Output Operator [RS_71] - key expressions:_col5 (type: bigint), _col0 (type: string), _col1 (type: string), _col2 (type: int) - sort order:-+++ - Statistics:Num rows: 165056 Data size: 237066834 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: bigint), _col4 (type: bigint) - Group By Operator [GBY_69] - | aggregations:["count(VALUE._col0)","count(VALUE._col1)","count(VALUE._col2)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: int) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 165056 Data size: 237066834 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 11 [SIMPLE_EDGE] - Reduce Output Operator [RS_68] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: int) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: int) - sort order:+++ - Statistics:Num rows: 330112 Data size: 474133669 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: bigint), _col4 (type: bigint), _col5 (type: bigint) - Group By Operator [GBY_67] - aggregations:["count(_col3)","count(_col4)","count()"] - keys:_col0 (type: string), _col1 (type: string), _col2 (type: int) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 330112 Data size: 474133669 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_65] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - Statistics:Num rows: 330112 Data size: 474133669 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_141] - | condition map:[{"":"Left Outer Join0 to 1"}] - | keys:{"0":"_col4 (type: int), _col6 (type: int)","1":"_col0 (type: int), _col1 (type: int)"} - | outputColumnNames:["_col13","_col15","_col22","_col28"] - | Statistics:Num rows: 330112 Data size: 474133669 Basic stats: COMPLETE Column stats: NONE - |<-Map 23 [SIMPLE_EDGE] - | Reduce Output Operator [RS_63] - | key expressions:_col0 (type: int), _col1 (type: int) - | Map-reduce partition columns:_col0 (type: int), _col1 (type: int) - | sort order:++ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Select Operator [SEL_58] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_57] - | alias:catalog_returns - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Reducer 10 [SIMPLE_EDGE] - Reduce Output Operator [RS_62] - key expressions:_col4 (type: int), _col6 (type: int) - Map-reduce partition columns:_col4 (type: int), _col6 (type: int) - sort order:++ - Statistics:Num rows: 300102 Data size: 431030599 Basic stats: COMPLETE Column stats: NONE - value expressions:_col13 (type: string), _col15 (type: string), _col22 (type: int), _col28 (type: int) - Merge Join Operator [MERGEJOIN_140] - | condition map:[{"":"Left Outer Join0 to 1"}] - | keys:{"0":"_col5 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col4","_col6","_col13","_col15","_col22","_col28"] - | Statistics:Num rows: 300102 Data size: 431030599 Basic stats: COMPLETE Column stats: NONE - |<-Map 22 [SIMPLE_EDGE] - | Reduce Output Operator [RS_60] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 2300 Data size: 2713420 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_56] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 2300 Data size: 2713420 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_55] - | alias:promotion - | Statistics:Num rows: 2300 Data size: 2713420 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 9 [SIMPLE_EDGE] - Reduce Output Operator [RS_59] - key expressions:_col5 (type: int) - Map-reduce partition columns:_col5 (type: int) - sort order:+ - Statistics:Num rows: 272820 Data size: 391845991 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: int), _col6 (type: int), _col13 (type: string), _col15 (type: string), _col22 (type: int) - Select Operator [SEL_54] - outputColumnNames:["_col13","_col15","_col22","_col4","_col5","_col6"] - Statistics:Num rows: 272820 Data size: 391845991 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_53] - predicate:(UDFToDouble(_col27) > (UDFToDouble(_col21) + 5.0)) (type: boolean) - Statistics:Num rows: 272820 Data size: 391845991 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_139] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col4","_col5","_col6","_col13","_col15","_col21","_col22","_col27"] - | Statistics:Num rows: 818460 Data size: 1175537975 Basic stats: COMPLETE Column stats: NONE - |<-Map 21 [SIMPLE_EDGE] - | Reduce Output Operator [RS_51] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_31] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_129] - | predicate:d_date_sk is not null (type: boolean) - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_29] - | alias:d1 - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_50] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 744055 Data size: 1068670864 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: int), _col5 (type: int), _col6 (type: int), _col13 (type: string), _col15 (type: string), _col21 (type: string), _col22 (type: int) - Merge Join Operator [MERGEJOIN_138] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col8 (type: int), _col22 (type: int)","1":"_col0 (type: int), _col1 (type: int)"} - | outputColumnNames:["_col1","_col4","_col5","_col6","_col13","_col15","_col21","_col22"] - | Statistics:Num rows: 744055 Data size: 1068670864 Basic stats: COMPLETE Column stats: NONE - |<-Map 20 [SIMPLE_EDGE] - | Reduce Output Operator [RS_48] - | key expressions:_col0 (type: int), _col1 (type: int) - | Map-reduce partition columns:_col0 (type: int), _col1 (type: int) - | sort order:++ - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_28] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_128] - | predicate:(d_week_seq is not null and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_26] - | alias:d1 - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_47] - key expressions:_col8 (type: int), _col22 (type: int) - Map-reduce partition columns:_col8 (type: int), _col22 (type: int) - sort order:++ - Statistics:Num rows: 676414 Data size: 971518947 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col4 (type: int), _col5 (type: int), _col6 (type: int), _col13 (type: string), _col15 (type: string), _col21 (type: string) - Merge Join Operator [MERGEJOIN_137] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col4","_col5","_col6","_col8","_col13","_col15","_col21","_col22"] - | Statistics:Num rows: 676414 Data size: 971518947 Basic stats: COMPLETE Column stats: NONE - |<-Map 19 [SIMPLE_EDGE] - | Reduce Output Operator [RS_45] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: int) - | Select Operator [SEL_25] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_127] - | predicate:((d_date_sk is not null and (d_year = 2001)) and d_week_seq is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_23] - | alias:d1 - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_44] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 614922 Data size: 883199024 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col4 (type: int), _col5 (type: int), _col6 (type: int), _col8 (type: int), _col13 (type: string), _col15 (type: string) - Merge Join Operator [MERGEJOIN_136] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col1","_col4","_col5","_col6","_col8","_col13","_col15"] - | Statistics:Num rows: 614922 Data size: 883199024 Basic stats: COMPLETE Column stats: NONE - |<-Map 18 [SIMPLE_EDGE] - | Reduce Output Operator [RS_42] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_22] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_126] - | predicate:((hd_buy_potential = '1001-5000') and hd_demo_sk is not null) (type: boolean) - | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_20] - | alias:household_demographics - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_41] - key expressions:_col3 (type: int) - Map-reduce partition columns:_col3 (type: int) - sort order:+ - Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col1 (type: int), _col4 (type: int), _col5 (type: int), _col6 (type: int), _col8 (type: int), _col13 (type: string), _col15 (type: string) - Merge Join Operator [MERGEJOIN_135] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col1","_col3","_col4","_col5","_col6","_col8","_col13","_col15"] - | Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - |<-Map 17 [SIMPLE_EDGE] - | Reduce Output Operator [RS_39] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 9900 Data size: 3585529 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_19] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 9900 Data size: 3585529 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_125] - | predicate:((cd_marital_status = 'M') and cd_demo_sk is not null) (type: boolean) - | Statistics:Num rows: 9900 Data size: 3585529 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_17] - | alias:customer_demographics - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_38] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col1 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: int), _col6 (type: int), _col8 (type: int), _col13 (type: string), _col15 (type: string) - Merge Join Operator [MERGEJOIN_134] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col4 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col8","_col13","_col15"] - | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - |<-Map 16 [SIMPLE_EDGE] - | Reduce Output Operator [RS_36] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_16] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_124] - | predicate:i_item_sk is not null (type: boolean) - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_14] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_35] - key expressions:_col4 (type: int) - Map-reduce partition columns:_col4 (type: int) - sort order:+ - Statistics:Num rows: 29 Data size: 30582 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col5 (type: int), _col6 (type: int), _col8 (type: int), _col13 (type: string) - Merge Join Operator [MERGEJOIN_133] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col10 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col8","_col13"] - | Statistics:Num rows: 29 Data size: 30582 Basic stats: COMPLETE Column stats: NONE - |<-Map 15 [SIMPLE_EDGE] - | Reduce Output Operator [RS_33] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_13] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_123] - | predicate:w_warehouse_sk is not null (type: boolean) - | Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_11] - | alias:warehouse - | Statistics:Num rows: 27 Data size: 27802 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_32] - key expressions:_col10 (type: int) - Map-reduce partition columns:_col10 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: int), _col6 (type: int), _col8 (type: int) - Select Operator [SEL_10] - outputColumnNames:["_col0","_col1","_col10","_col2","_col3","_col4","_col5","_col6","_col8"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_9] - predicate:(_col11 < _col7) (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Merge Join Operator [MERGEJOIN_132] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col4 (type: int)","1":"_col1 (type: int)"} - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col10","_col11"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_6] - | key expressions:_col4 (type: int) - | Map-reduce partition columns:_col4 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col5 (type: int), _col6 (type: int), _col7 (type: int) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_121] - | predicate:((((cs_item_sk is not null and cs_bill_cdemo_sk is not null) and cs_bill_hdemo_sk is not null) and cs_sold_date_sk is not null) and cs_ship_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:catalog_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 14 [SIMPLE_EDGE] - Reduce Output Operator [RS_7] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col0 (type: int), _col2 (type: int), _col3 (type: int) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_122] - predicate:((inv_item_sk is not null and inv_warehouse_sk is not null) and inv_date_sk is not null) (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_3] - alias:inventory - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 13 + File Output Operator [FS_74] + Limit [LIM_73] (rows=100 width=1436) + Number of rows:100 + Select Operator [SEL_72] (rows=165056 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + <-Reducer 12 [SIMPLE_EDGE] + SHUFFLE [RS_71] + Group By Operator [GBY_69] (rows=165056 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["count(VALUE._col0)","count(VALUE._col1)","count(VALUE._col2)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Reducer 11 [SIMPLE_EDGE] + SHUFFLE [RS_68] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_67] (rows=330112 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["count(_col3)","count(_col4)","count()"],keys:_col0, _col1, _col2 + Select Operator [SEL_65] (rows=330112 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4"] + Merge Join Operator [MERGEJOIN_141] (rows=330112 width=1436) + Output:["_col13","_col15","_col22","_col28"],keys:{"0":"_col4, _col6","1":"_col0, _col1"} + <-Map 23 [SIMPLE_EDGE] + SHUFFLE [RS_63] + PartitionCols:_col0, _col1 + Select Operator [SEL_58] (rows=1 width=0) + Output:["_col0","_col1"] + TableScan [TS_57] (rows=1 width=0) + default@catalog_returns,catalog_returns,Tbl:PARTIAL,Col:NONE,Output:["cr_item_sk","cr_order_number"] + <-Reducer 10 [SIMPLE_EDGE] + SHUFFLE [RS_62] + PartitionCols:_col4, _col6 + Merge Join Operator [MERGEJOIN_140] (rows=300102 width=1436) + Output:["_col4","_col6","_col13","_col15","_col22","_col28"],keys:{"0":"_col5","1":"_col0"} + <-Map 22 [SIMPLE_EDGE] + SHUFFLE [RS_60] + PartitionCols:_col0 + Select Operator [SEL_56] (rows=2300 width=1179) + Output:["_col0"] + TableScan [TS_55] (rows=2300 width=1179) + default@promotion,promotion,Tbl:COMPLETE,Col:NONE,Output:["p_promo_sk"] + <-Reducer 9 [SIMPLE_EDGE] + SHUFFLE [RS_59] + PartitionCols:_col5 + Select Operator [SEL_54] (rows=272820 width=1436) + Output:["_col13","_col15","_col22","_col4","_col5","_col6"] + Filter Operator [FIL_53] (rows=272820 width=1436) + predicate:(UDFToDouble(_col27) > (UDFToDouble(_col21) + 5.0)) + Merge Join Operator [MERGEJOIN_139] (rows=818460 width=1436) + Output:["_col4","_col5","_col6","_col13","_col15","_col21","_col22","_col27"],keys:{"0":"_col1","1":"_col0"} + <-Map 21 [SIMPLE_EDGE] + SHUFFLE [RS_51] + PartitionCols:_col0 + Select Operator [SEL_31] (rows=73049 width=1119) + Output:["_col0","_col1"] + Filter Operator [FIL_129] (rows=73049 width=1119) + predicate:d_date_sk is not null + TableScan [TS_29] (rows=73049 width=1119) + default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date"] + <-Reducer 8 [SIMPLE_EDGE] + SHUFFLE [RS_50] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_138] (rows=744055 width=1436) + Output:["_col1","_col4","_col5","_col6","_col13","_col15","_col21","_col22"],keys:{"0":"_col8, _col22","1":"_col0, _col1"} + <-Map 20 [SIMPLE_EDGE] + SHUFFLE [RS_48] + PartitionCols:_col0, _col1 + Select Operator [SEL_28] (rows=73049 width=1119) + Output:["_col0","_col1"] + Filter Operator [FIL_128] (rows=73049 width=1119) + predicate:(d_week_seq is not null and d_date_sk is not null) + TableScan [TS_26] (rows=73049 width=1119) + default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_week_seq"] + <-Reducer 7 [SIMPLE_EDGE] + SHUFFLE [RS_47] + PartitionCols:_col8, _col22 + Merge Join Operator [MERGEJOIN_137] (rows=676414 width=1436) + Output:["_col1","_col4","_col5","_col6","_col8","_col13","_col15","_col21","_col22"],keys:{"0":"_col0","1":"_col0"} + <-Map 19 [SIMPLE_EDGE] + SHUFFLE [RS_45] + PartitionCols:_col0 + Select Operator [SEL_25] (rows=36524 width=1119) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_127] (rows=36524 width=1119) + predicate:((d_date_sk is not null and (d_year = 2001)) and d_week_seq is not null) + TableScan [TS_23] (rows=73049 width=1119) + default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date","d_week_seq","d_year"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_44] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_136] (rows=614922 width=1436) + Output:["_col0","_col1","_col4","_col5","_col6","_col8","_col13","_col15"],keys:{"0":"_col3","1":"_col0"} + <-Map 18 [SIMPLE_EDGE] + SHUFFLE [RS_42] + PartitionCols:_col0 + Select Operator [SEL_22] (rows=3600 width=107) + Output:["_col0"] + Filter Operator [FIL_126] (rows=3600 width=107) + predicate:((hd_buy_potential = '1001-5000') and hd_demo_sk is not null) + TableScan [TS_20] (rows=7200 width=107) + default@household_demographics,household_demographics,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_buy_potential"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_41] + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_135] (rows=559020 width=1436) + Output:["_col0","_col1","_col3","_col4","_col5","_col6","_col8","_col13","_col15"],keys:{"0":"_col2","1":"_col0"} + <-Map 17 [SIMPLE_EDGE] + SHUFFLE [RS_39] + PartitionCols:_col0 + Select Operator [SEL_19] (rows=9900 width=362) + Output:["_col0"] + Filter Operator [FIL_125] (rows=9900 width=362) + predicate:((cd_marital_status = 'M') and cd_demo_sk is not null) + TableScan [TS_17] (rows=19800 width=362) + default@customer_demographics,customer_demographics,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_marital_status"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_38] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_134] (rows=508200 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col8","_col13","_col15"],keys:{"0":"_col4","1":"_col0"} + <-Map 16 [SIMPLE_EDGE] + SHUFFLE [RS_36] + PartitionCols:_col0 + Select Operator [SEL_16] (rows=462000 width=1436) + Output:["_col0","_col1"] + Filter Operator [FIL_124] (rows=462000 width=1436) + predicate:i_item_sk is not null + TableScan [TS_14] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_desc"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_35] + PartitionCols:_col4 + Merge Join Operator [MERGEJOIN_133] (rows=29 width=1054) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col8","_col13"],keys:{"0":"_col10","1":"_col0"} + <-Map 15 [SIMPLE_EDGE] + SHUFFLE [RS_33] + PartitionCols:_col0 + Select Operator [SEL_13] (rows=27 width=1029) + Output:["_col0","_col1"] + Filter Operator [FIL_123] (rows=27 width=1029) + predicate:w_warehouse_sk is not null + TableScan [TS_11] (rows=27 width=1029) + default@warehouse,warehouse,Tbl:COMPLETE,Col:NONE,Output:["w_warehouse_sk","w_warehouse_name"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_32] + PartitionCols:_col10 + Select Operator [SEL_10] (rows=1 width=0) + Output:["_col0","_col1","_col10","_col2","_col3","_col4","_col5","_col6","_col8"] + Filter Operator [FIL_9] (rows=1 width=0) + predicate:(_col11 < _col7) + Merge Join Operator [MERGEJOIN_132] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col10","_col11"],keys:{"0":"_col4","1":"_col1"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_6] + PartitionCols:_col4 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] + Filter Operator [FIL_121] (rows=1 width=0) + predicate:((((cs_item_sk is not null and cs_bill_cdemo_sk is not null) and cs_bill_hdemo_sk is not null) and cs_sold_date_sk is not null) and cs_ship_date_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@catalog_sales,catalog_sales,Tbl:PARTIAL,Col:NONE,Output:["cs_sold_date_sk","cs_ship_date_sk","cs_bill_cdemo_sk","cs_bill_hdemo_sk","cs_item_sk","cs_promo_sk","cs_order_number","cs_quantity"] + <-Map 14 [SIMPLE_EDGE] + SHUFFLE [RS_7] + PartitionCols:_col1 + Select Operator [SEL_5] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_122] (rows=1 width=0) + predicate:((inv_item_sk is not null and inv_warehouse_sk is not null) and inv_date_sk is not null) + TableScan [TS_3] (rows=1 width=0) + default@inventory,inventory,Tbl:PARTIAL,Col:NONE,Output:["inv_date_sk","inv_item_sk","inv_warehouse_sk","inv_quantity_on_hand"] diff --git a/ql/src/test/results/clientpositive/perf/query73.q.out b/ql/src/test/results/clientpositive/perf/query73.q.out index 9c88854..dec5a86 100644 --- a/ql/src/test/results/clientpositive/perf/query73.q.out +++ b/ql/src/test/results/clientpositive/perf/query73.q.out @@ -13,165 +13,88 @@ Reducer 6 <- Map 11 (SIMPLE_EDGE), Reducer 5 (SIMPLE_EDGE) Reducer 7 <- Reducer 6 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 7 - File Output Operator [FS_37] - compressed:false - Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_36] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_35] - key expressions:_col5 (type: bigint) - sort order:- - Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: int) - Select Operator [SEL_34] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_60] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2","_col4","_col5","_col6","_col7"] - | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_32] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string) - | Select Operator [SEL_30] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_56] - | predicate:c_customer_sk is not null (type: boolean) - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_28] - | alias:customer - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_31] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 6076 Data size: 6799525 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col2 (type: bigint) - Filter Operator [FIL_26] - predicate:_col2 BETWEEN 1 AND 5 (type: boolean) - Statistics:Num rows: 6076 Data size: 6799525 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_25] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 12152 Data size: 13599051 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_24] - | aggregations:["count(VALUE._col0)"] - | keys:KEY._col0 (type: int), KEY._col1 (type: int) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 12152 Data size: 13599051 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_23] - key expressions:_col0 (type: int), _col1 (type: int) - Map-reduce partition columns:_col0 (type: int), _col1 (type: int) - sort order:++ - Statistics:Num rows: 24305 Data size: 27199223 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: bigint) - Group By Operator [GBY_22] - aggregations:["count()"] - keys:_col1 (type: int), _col4 (type: int) - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 24305 Data size: 27199223 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_59] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col4"] - | Statistics:Num rows: 24305 Data size: 27199223 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 800 Data size: 85600 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_11] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 800 Data size: 85600 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_55] - | predicate:(((((hd_buy_potential = '1001-5000') or (hd_buy_potential = '5001-10000')) and (hd_vehicle_count > 0)) and (CASE WHEN ((hd_vehicle_count > 0)) THEN ((UDFToDouble(hd_dep_count) / UDFToDouble(hd_vehicle_count))) ELSE (null) END > 1.0)) and hd_demo_sk is not null) (type: boolean) - | Statistics:Num rows: 800 Data size: 85600 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:household_demographics - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 22096 Data size: 24726566 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col4 (type: int) - Merge Join Operator [MERGEJOIN_58] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col4"] - | Statistics:Num rows: 22096 Data size: 24726566 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_16] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_8] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_54] - | predicate:((s_county) IN ('Kittitas County', 'Adams County', 'Richland County', 'Furnas County') and s_store_sk is not null) (type: boolean) - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:store - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_15] - key expressions:_col3 (type: int) - Map-reduce partition columns:_col3 (type: int) - sort order:+ - Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col2 (type: int), _col4 (type: int) - Merge Join Operator [MERGEJOIN_57] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_12] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_52] - | predicate:(((ss_sold_date_sk is not null and ss_store_sk is not null) and ss_hdemo_sk is not null) and ss_customer_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_13] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_53] - predicate:(((d_year) IN (1998, 1999, 2000) and d_dom BETWEEN 1 AND 2) and d_date_sk is not null) (type: boolean) - Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:date_dim - Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 7 + File Output Operator [FS_37] + Select Operator [SEL_36] (rows=88000001 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_35] + Select Operator [SEL_34] (rows=88000001 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Merge Join Operator [MERGEJOIN_60] (rows=88000001 width=860) + Output:["_col0","_col2","_col4","_col5","_col6","_col7"],keys:{"0":"_col1","1":"_col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_32] + PartitionCols:_col0 + Select Operator [SEL_30] (rows=80000000 width=860) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_56] (rows=80000000 width=860) + predicate:c_customer_sk is not null + TableScan [TS_28] (rows=80000000 width=860) + default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_salutation","c_first_name","c_last_name","c_preferred_cust_flag"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_31] + PartitionCols:_col1 + Filter Operator [FIL_26] (rows=6076 width=1119) + predicate:_col2 BETWEEN 1 AND 5 + Select Operator [SEL_25] (rows=12152 width=1119) + Output:["_col0","_col1","_col2"] + Group By Operator [GBY_24] (rows=12152 width=1119) + Output:["_col0","_col1","_col2"],aggregations:["count(VALUE._col0)"],keys:KEY._col0, KEY._col1 + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_23] + PartitionCols:_col0, _col1 + Group By Operator [GBY_22] (rows=24305 width=1119) + Output:["_col0","_col1","_col2"],aggregations:["count()"],keys:_col1, _col4 + Merge Join Operator [MERGEJOIN_59] (rows=24305 width=1119) + Output:["_col1","_col4"],keys:{"0":"_col2","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=800 width=107) + Output:["_col0"] + Filter Operator [FIL_55] (rows=800 width=107) + predicate:(((((hd_buy_potential = '1001-5000') or (hd_buy_potential = '5001-10000')) and (hd_vehicle_count > 0)) and (CASE WHEN ((hd_vehicle_count > 0)) THEN ((UDFToDouble(hd_dep_count) / UDFToDouble(hd_vehicle_count))) ELSE (null) END > 1.0)) and hd_demo_sk is not null) + TableScan [TS_9] (rows=7200 width=107) + default@household_demographics,household_demographics,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_buy_potential","hd_dep_count","hd_vehicle_count"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_58] (rows=22096 width=1119) + Output:["_col1","_col2","_col4"],keys:{"0":"_col3","1":"_col0"} + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=852 width=1910) + Output:["_col0"] + Filter Operator [FIL_54] (rows=852 width=1910) + predicate:((s_county) IN ('Kittitas County', 'Adams County', 'Richland County', 'Furnas County') and s_store_sk is not null) + TableScan [TS_6] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_county"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_57] (rows=20088 width=1119) + Output:["_col1","_col2","_col3","_col4"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_52] (rows=1 width=0) + predicate:(((ss_sold_date_sk is not null and ss_store_sk is not null) and ss_hdemo_sk is not null) and ss_customer_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_customer_sk","ss_hdemo_sk","ss_store_sk","ss_ticket_number"] + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_53] (rows=18262 width=1119) + predicate:(((d_year) IN (1998, 1999, 2000) and d_dom BETWEEN 1 AND 2) and d_date_sk is not null) + TableScan [TS_3] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_dom"] diff --git a/ql/src/test/results/clientpositive/perf/query75.q.out b/ql/src/test/results/clientpositive/perf/query75.q.out index f3f9827..daf7ad7 100644 --- a/ql/src/test/results/clientpositive/perf/query75.q.out +++ b/ql/src/test/results/clientpositive/perf/query75.q.out @@ -29,700 +29,359 @@ Reducer 7 <- Reducer 31 (SIMPLE_EDGE), Reducer 6 (SIMPLE_EDGE) Reducer 8 <- Reducer 7 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 8 - File Output Operator [FS_150] - compressed:false - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_149] - Number of rows:100 - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_148] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] - | Statistics:Num rows: 169103 Data size: 242878993 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_147] - key expressions:_col8 (type: bigint) - sort order:+ - Statistics:Num rows: 169103 Data size: 242878993 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: int), _col6 (type: bigint), _col7 (type: bigint), _col9 (type: double) - Select Operator [SEL_146] - outputColumnNames:["_col0","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] - Statistics:Num rows: 169103 Data size: 242878993 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_145] - predicate:((CAST( _col5 AS decimal(17,2)) / CAST( _col12 AS decimal(17,2))) < 0.9) (type: boolean) - Statistics:Num rows: 169103 Data size: 242878993 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_253] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int)","1":"_col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col12","_col13"] - | Statistics:Num rows: 507310 Data size: 728638416 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 31 [SIMPLE_EDGE] - | Reduce Output Operator [RS_143] - | key expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) - | Map-reduce partition columns:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) - | sort order:++++ - | Statistics:Num rows: 461191 Data size: 662398546 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: int), _col5 (type: bigint), _col6 (type: double) - | Group By Operator [GBY_140] - | | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] - | | keys:KEY._col0 (type: int), KEY._col1 (type: int), KEY._col2 (type: int), KEY._col3 (type: int), KEY._col4 (type: int) - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | | Statistics:Num rows: 461191 Data size: 662398546 Basic stats: COMPLETE Column stats: NONE - | |<-Union 30 [SIMPLE_EDGE] - | |<-Reducer 29 [CONTAINS] - | | Reduce Output Operator [RS_139] - | | key expressions:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) - | | Map-reduce partition columns:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) - | | sort order:+++++ - | | Statistics:Num rows: 922383 Data size: 1324798530 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col5 (type: bigint), _col6 (type: double) - | | Group By Operator [GBY_138] - | | aggregations:["sum(_col5)","sum(_col6)"] - | | keys:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | | Statistics:Num rows: 922383 Data size: 1324798530 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_91] - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | | Statistics:Num rows: 307461 Data size: 441599510 Basic stats: COMPLETE Column stats: NONE - | | Merge Join Operator [MERGEJOIN_246] - | | | condition map:[{"":"Left Outer Join0 to 1"}] - | | | keys:{"0":"_col2 (type: int), _col1 (type: int)","1":"_col1 (type: int), _col0 (type: int)"} - | | | outputColumnNames:["_col3","_col4","_col6","_col7","_col8","_col10","_col12","_col15","_col16"] - | | | Statistics:Num rows: 307461 Data size: 441599510 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 34 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_89] - | | | key expressions:_col1 (type: int), _col0 (type: int) - | | | Map-reduce partition columns:_col1 (type: int), _col0 (type: int) - | | | sort order:++ - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | value expressions:_col2 (type: int), _col3 (type: decimal(7,2)) - | | | Select Operator [SEL_81] - | | | outputColumnNames:["_col0","_col1","_col2","_col3"] - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | TableScan [TS_80] - | | | alias:catalog_returns - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | |<-Reducer 28 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_88] - | | key expressions:_col2 (type: int), _col1 (type: int) - | | Map-reduce partition columns:_col2 (type: int), _col1 (type: int) - | | sort order:++ - | | Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col3 (type: int), _col4 (type: decimal(7,2)), _col6 (type: int), _col7 (type: int), _col8 (type: int), _col10 (type: int), _col12 (type: int) - | | Merge Join Operator [MERGEJOIN_245] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | | outputColumnNames:["_col1","_col2","_col3","_col4","_col6","_col7","_col8","_col10","_col12"] - | | | Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 33 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_86] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:2001 (type: int) - | | | Select Operator [SEL_79] - | | | outputColumnNames:["_col0"] - | | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_225] - | | | predicate:((d_year = 2001) and d_date_sk is not null) (type: boolean) - | | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_77] - | | | alias:date_dim - | | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 27 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_85] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: decimal(7,2)), _col6 (type: int), _col7 (type: int), _col8 (type: int), _col10 (type: int) - | | Merge Join Operator [MERGEJOIN_244] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col6","_col7","_col8","_col10"] - | | | Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 26 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_82] - | | | key expressions:_col1 (type: int) - | | | Map-reduce partition columns:_col1 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | value expressions:_col0 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: decimal(7,2)) - | | | Select Operator [SEL_73] - | | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | Filter Operator [FIL_223] - | | | predicate:(cs_item_sk is not null and cs_sold_date_sk is not null) (type: boolean) - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | TableScan [TS_71] - | | | alias:catalog_sales - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | |<-Map 32 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_83] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col5 (type: int) - | | Select Operator [SEL_76] - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col5"] - | | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_224] - | | predicate:((((((i_category = 'Sports') and i_item_sk is not null) and i_category_id is not null) and i_manufact_id is not null) and i_class_id is not null) and i_brand_id is not null) (type: boolean) - | | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_74] - | | alias:item - | | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 38 [CONTAINS] - | | Reduce Output Operator [RS_139] - | | key expressions:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) - | | Map-reduce partition columns:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) - | | sort order:+++++ - | | Statistics:Num rows: 922383 Data size: 1324798530 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col5 (type: bigint), _col6 (type: double) - | | Group By Operator [GBY_138] - | | aggregations:["sum(_col5)","sum(_col6)"] - | | keys:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | | Statistics:Num rows: 922383 Data size: 1324798530 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_112] - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | | Statistics:Num rows: 307461 Data size: 441599510 Basic stats: COMPLETE Column stats: NONE - | | Merge Join Operator [MERGEJOIN_249] - | | | condition map:[{"":"Left Outer Join0 to 1"}] - | | | keys:{"0":"_col2 (type: int), _col1 (type: int)","1":"_col1 (type: int), _col0 (type: int)"} - | | | outputColumnNames:["_col3","_col4","_col6","_col7","_col8","_col10","_col12","_col15","_col16"] - | | | Statistics:Num rows: 307461 Data size: 441599510 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 41 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_110] - | | | key expressions:_col1 (type: int), _col0 (type: int) - | | | Map-reduce partition columns:_col1 (type: int), _col0 (type: int) - | | | sort order:++ - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | value expressions:_col2 (type: int), _col3 (type: decimal(7,2)) - | | | Select Operator [SEL_102] - | | | outputColumnNames:["_col0","_col1","_col2","_col3"] - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | TableScan [TS_101] - | | | alias:store_returns - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | |<-Reducer 37 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_109] - | | key expressions:_col2 (type: int), _col1 (type: int) - | | Map-reduce partition columns:_col2 (type: int), _col1 (type: int) - | | sort order:++ - | | Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col3 (type: int), _col4 (type: decimal(7,2)), _col6 (type: int), _col7 (type: int), _col8 (type: int), _col10 (type: int), _col12 (type: int) - | | Merge Join Operator [MERGEJOIN_248] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | | outputColumnNames:["_col1","_col2","_col3","_col4","_col6","_col7","_col8","_col10","_col12"] - | | | Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 40 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_107] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:2001 (type: int) - | | | Select Operator [SEL_100] - | | | outputColumnNames:["_col0"] - | | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_229] - | | | predicate:((d_year = 2001) and d_date_sk is not null) (type: boolean) - | | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_98] - | | | alias:date_dim - | | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 36 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_106] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: decimal(7,2)), _col6 (type: int), _col7 (type: int), _col8 (type: int), _col10 (type: int) - | | Merge Join Operator [MERGEJOIN_247] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col6","_col7","_col8","_col10"] - | | | Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 35 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_103] - | | | key expressions:_col1 (type: int) - | | | Map-reduce partition columns:_col1 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | value expressions:_col0 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: decimal(7,2)) - | | | Select Operator [SEL_94] - | | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | Filter Operator [FIL_227] - | | | predicate:(ss_item_sk is not null and ss_sold_date_sk is not null) (type: boolean) - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | TableScan [TS_92] - | | | alias:store_sales - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | |<-Map 39 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_104] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col5 (type: int) - | | Select Operator [SEL_97] - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col5"] - | | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_228] - | | predicate:((((((i_category = 'Sports') and i_item_sk is not null) and i_category_id is not null) and i_manufact_id is not null) and i_class_id is not null) and i_brand_id is not null) (type: boolean) - | | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_95] - | | alias:item - | | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 45 [CONTAINS] - | Reduce Output Operator [RS_139] - | key expressions:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) - | Map-reduce partition columns:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) - | sort order:+++++ - | Statistics:Num rows: 922383 Data size: 1324798530 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col5 (type: bigint), _col6 (type: double) - | Group By Operator [GBY_138] - | aggregations:["sum(_col5)","sum(_col6)"] - | keys:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 922383 Data size: 1324798530 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_135] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 307461 Data size: 441599510 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_252] - | | condition map:[{"":"Left Outer Join0 to 1"}] - | | keys:{"0":"_col2 (type: int), _col1 (type: int)","1":"_col1 (type: int), _col0 (type: int)"} - | | outputColumnNames:["_col3","_col4","_col6","_col7","_col8","_col10","_col12","_col15","_col16"] - | | Statistics:Num rows: 307461 Data size: 441599510 Basic stats: COMPLETE Column stats: NONE - | |<-Map 48 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_133] - | | key expressions:_col1 (type: int), _col0 (type: int) - | | Map-reduce partition columns:_col1 (type: int), _col0 (type: int) - | | sort order:++ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col2 (type: int), _col3 (type: decimal(7,2)) - | | Select Operator [SEL_125] - | | outputColumnNames:["_col0","_col1","_col2","_col3"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_124] - | | alias:web_returns - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Reducer 44 [SIMPLE_EDGE] - | Reduce Output Operator [RS_132] - | key expressions:_col2 (type: int), _col1 (type: int) - | Map-reduce partition columns:_col2 (type: int), _col1 (type: int) - | sort order:++ - | Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: int), _col4 (type: decimal(7,2)), _col6 (type: int), _col7 (type: int), _col8 (type: int), _col10 (type: int), _col12 (type: int) - | Merge Join Operator [MERGEJOIN_251] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col2","_col3","_col4","_col6","_col7","_col8","_col10","_col12"] - | | Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - | |<-Map 47 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_130] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | value expressions:2001 (type: int) - | | Select Operator [SEL_123] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_233] - | | predicate:((d_year = 2001) and d_date_sk is not null) (type: boolean) - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_121] - | | alias:date_dim - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 43 [SIMPLE_EDGE] - | Reduce Output Operator [RS_129] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: decimal(7,2)), _col6 (type: int), _col7 (type: int), _col8 (type: int), _col10 (type: int) - | Merge Join Operator [MERGEJOIN_250] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col6","_col7","_col8","_col10"] - | | Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - | |<-Map 42 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_126] - | | key expressions:_col1 (type: int) - | | Map-reduce partition columns:_col1 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col0 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: decimal(7,2)) - | | Select Operator [SEL_117] - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_231] - | | predicate:(ws_item_sk is not null and ws_sold_date_sk is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_115] - | | alias:web_sales - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 46 [SIMPLE_EDGE] - | Reduce Output Operator [RS_127] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col5 (type: int) - | Select Operator [SEL_120] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col5"] - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_232] - | predicate:((((((i_category = 'Sports') and i_item_sk is not null) and i_category_id is not null) and i_manufact_id is not null) and i_class_id is not null) and i_brand_id is not null) (type: boolean) - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_118] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_142] - key expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) - Map-reduce partition columns:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) - sort order:++++ - Statistics:Num rows: 461191 Data size: 662398546 Basic stats: COMPLETE Column stats: NONE - value expressions:_col5 (type: bigint), _col6 (type: double) - Select Operator [SEL_70] - outputColumnNames:["_col1","_col2","_col3","_col4","_col5","_col6"] - Statistics:Num rows: 461191 Data size: 662398546 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_69] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] - | keys:KEY._col0 (type: int), KEY._col1 (type: int), KEY._col2 (type: int), KEY._col3 (type: int), KEY._col4 (type: int) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 461191 Data size: 662398546 Basic stats: COMPLETE Column stats: NONE - |<-Union 5 [SIMPLE_EDGE] - |<-Reducer 15 [CONTAINS] - | Reduce Output Operator [RS_68] - | key expressions:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) - | Map-reduce partition columns:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) - | sort order:+++++ - | Statistics:Num rows: 922383 Data size: 1324798530 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col5 (type: bigint), _col6 (type: double) - | Group By Operator [GBY_67] - | aggregations:["sum(_col5)","sum(_col6)"] - | keys:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 922383 Data size: 1324798530 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_65] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 922383 Data size: 1324798530 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_41] - | outputColumnNames:["_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 307461 Data size: 441599510 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_240] - | | condition map:[{"":"Left Outer Join0 to 1"}] - | | keys:{"0":"_col2 (type: int), _col1 (type: int)","1":"_col1 (type: int), _col0 (type: int)"} - | | outputColumnNames:["_col3","_col4","_col6","_col7","_col8","_col10","_col15","_col16"] - | | Statistics:Num rows: 307461 Data size: 441599510 Basic stats: COMPLETE Column stats: NONE - | |<-Map 18 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_39] - | | key expressions:_col1 (type: int), _col0 (type: int) - | | Map-reduce partition columns:_col1 (type: int), _col0 (type: int) - | | sort order:++ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col2 (type: int), _col3 (type: decimal(7,2)) - | | Select Operator [SEL_31] - | | outputColumnNames:["_col0","_col1","_col2","_col3"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_30] - | | alias:store_returns - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Reducer 14 [SIMPLE_EDGE] - | Reduce Output Operator [RS_38] - | key expressions:_col2 (type: int), _col1 (type: int) - | Map-reduce partition columns:_col2 (type: int), _col1 (type: int) - | sort order:++ - | Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: int), _col4 (type: decimal(7,2)), _col6 (type: int), _col7 (type: int), _col8 (type: int), _col10 (type: int) - | Merge Join Operator [MERGEJOIN_239] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col2","_col3","_col4","_col6","_col7","_col8","_col10"] - | | Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - | |<-Map 17 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_36] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_29] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_217] - | | predicate:((d_year = 2002) and d_date_sk is not null) (type: boolean) - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_27] - | | alias:date_dim - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 13 [SIMPLE_EDGE] - | Reduce Output Operator [RS_35] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: decimal(7,2)), _col6 (type: int), _col7 (type: int), _col8 (type: int), _col10 (type: int) - | Merge Join Operator [MERGEJOIN_238] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col6","_col7","_col8","_col10"] - | | Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - | |<-Map 12 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_32] - | | key expressions:_col1 (type: int) - | | Map-reduce partition columns:_col1 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col0 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: decimal(7,2)) - | | Select Operator [SEL_23] - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_215] - | | predicate:(ss_item_sk is not null and ss_sold_date_sk is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_21] - | | alias:store_sales - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 16 [SIMPLE_EDGE] - | Reduce Output Operator [RS_33] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col5 (type: int) - | Select Operator [SEL_26] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col5"] - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_216] - | predicate:((((((i_category = 'Sports') and i_item_sk is not null) and i_category_id is not null) and i_manufact_id is not null) and i_class_id is not null) and i_brand_id is not null) (type: boolean) - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_24] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 22 [CONTAINS] - | Reduce Output Operator [RS_68] - | key expressions:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) - | Map-reduce partition columns:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) - | sort order:+++++ - | Statistics:Num rows: 922383 Data size: 1324798530 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col5 (type: bigint), _col6 (type: double) - | Group By Operator [GBY_67] - | aggregations:["sum(_col5)","sum(_col6)"] - | keys:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 922383 Data size: 1324798530 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_65] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 922383 Data size: 1324798530 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_64] - | outputColumnNames:["_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 307461 Data size: 441599510 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_243] - | | condition map:[{"":"Left Outer Join0 to 1"}] - | | keys:{"0":"_col2 (type: int), _col1 (type: int)","1":"_col1 (type: int), _col0 (type: int)"} - | | outputColumnNames:["_col3","_col4","_col6","_col7","_col8","_col10","_col15","_col16"] - | | Statistics:Num rows: 307461 Data size: 441599510 Basic stats: COMPLETE Column stats: NONE - | |<-Map 25 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_62] - | | key expressions:_col1 (type: int), _col0 (type: int) - | | Map-reduce partition columns:_col1 (type: int), _col0 (type: int) - | | sort order:++ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col2 (type: int), _col3 (type: decimal(7,2)) - | | Select Operator [SEL_54] - | | outputColumnNames:["_col0","_col1","_col2","_col3"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_53] - | | alias:web_returns - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Reducer 21 [SIMPLE_EDGE] - | Reduce Output Operator [RS_61] - | key expressions:_col2 (type: int), _col1 (type: int) - | Map-reduce partition columns:_col2 (type: int), _col1 (type: int) - | sort order:++ - | Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: int), _col4 (type: decimal(7,2)), _col6 (type: int), _col7 (type: int), _col8 (type: int), _col10 (type: int) - | Merge Join Operator [MERGEJOIN_242] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col2","_col3","_col4","_col6","_col7","_col8","_col10"] - | | Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - | |<-Map 24 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_59] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_52] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_221] - | | predicate:((d_year = 2002) and d_date_sk is not null) (type: boolean) - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_50] - | | alias:date_dim - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 20 [SIMPLE_EDGE] - | Reduce Output Operator [RS_58] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: decimal(7,2)), _col6 (type: int), _col7 (type: int), _col8 (type: int), _col10 (type: int) - | Merge Join Operator [MERGEJOIN_241] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col6","_col7","_col8","_col10"] - | | Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - | |<-Map 19 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_55] - | | key expressions:_col1 (type: int) - | | Map-reduce partition columns:_col1 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col0 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: decimal(7,2)) - | | Select Operator [SEL_46] - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_219] - | | predicate:(ws_item_sk is not null and ws_sold_date_sk is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_44] - | | alias:web_sales - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 23 [SIMPLE_EDGE] - | Reduce Output Operator [RS_56] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col5 (type: int) - | Select Operator [SEL_49] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col5"] - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_220] - | predicate:((((((i_category = 'Sports') and i_item_sk is not null) and i_category_id is not null) and i_manufact_id is not null) and i_class_id is not null) and i_brand_id is not null) (type: boolean) - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_47] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [CONTAINS] - Reduce Output Operator [RS_68] - key expressions:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) - Map-reduce partition columns:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) - sort order:+++++ - Statistics:Num rows: 922383 Data size: 1324798530 Basic stats: COMPLETE Column stats: NONE - value expressions:_col5 (type: bigint), _col6 (type: double) - Group By Operator [GBY_67] - aggregations:["sum(_col5)","sum(_col6)"] - keys:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - Statistics:Num rows: 922383 Data size: 1324798530 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_65] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - Statistics:Num rows: 922383 Data size: 1324798530 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_20] - outputColumnNames:["_col1","_col2","_col3","_col4","_col5","_col6"] - Statistics:Num rows: 307461 Data size: 441599510 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_237] - | condition map:[{"":"Left Outer Join0 to 1"}] - | keys:{"0":"_col2 (type: int), _col1 (type: int)","1":"_col1 (type: int), _col0 (type: int)"} - | outputColumnNames:["_col3","_col4","_col6","_col7","_col8","_col10","_col15","_col16"] - | Statistics:Num rows: 307461 Data size: 441599510 Basic stats: COMPLETE Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_18] - | key expressions:_col1 (type: int), _col0 (type: int) - | Map-reduce partition columns:_col1 (type: int), _col0 (type: int) - | sort order:++ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col2 (type: int), _col3 (type: decimal(7,2)) - | Select Operator [SEL_10] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_9] - | alias:catalog_returns - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_17] - key expressions:_col2 (type: int), _col1 (type: int) - Map-reduce partition columns:_col2 (type: int), _col1 (type: int) - sort order:++ - Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: int), _col4 (type: decimal(7,2)), _col6 (type: int), _col7 (type: int), _col8 (type: int), _col10 (type: int) - Merge Join Operator [MERGEJOIN_236] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3","_col4","_col6","_col7","_col8","_col10"] - | Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_15] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_8] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_213] - | predicate:((d_year = 2002) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_14] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: decimal(7,2)), _col6 (type: int), _col7 (type: int), _col8 (type: int), _col10 (type: int) - Merge Join Operator [MERGEJOIN_235] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col6","_col7","_col8","_col10"] - | Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_11] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_211] - | predicate:(cs_item_sk is not null and cs_sold_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:catalog_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - Reduce Output Operator [RS_12] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col5 (type: int) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2","_col3","_col5"] - Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_212] - predicate:((((((i_category = 'Sports') and i_item_sk is not null) and i_category_id is not null) and i_manufact_id is not null) and i_class_id is not null) and i_brand_id is not null) (type: boolean) - Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:item - Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 8 + File Output Operator [FS_150] + Limit [LIM_149] (rows=100 width=1436) + Number of rows:100 + Select Operator [SEL_148] (rows=169103 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] + <-Reducer 7 [SIMPLE_EDGE] + SHUFFLE [RS_147] + Select Operator [SEL_146] (rows=169103 width=1436) + Output:["_col0","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] + Filter Operator [FIL_145] (rows=169103 width=1436) + predicate:((CAST( _col5 AS decimal(17,2)) / CAST( _col12 AS decimal(17,2))) < 0.9) + Merge Join Operator [MERGEJOIN_253] (rows=507310 width=1436) + Output:["_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col12","_col13"],keys:{"0":"_col1, _col2, _col3, _col4","1":"_col1, _col2, _col3, _col4"} + <-Reducer 31 [SIMPLE_EDGE] + SHUFFLE [RS_143] + PartitionCols:_col1, _col2, _col3, _col4 + Group By Operator [GBY_140] (rows=461191 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4 + <-Union 30 [SIMPLE_EDGE] + <-Reducer 29 [CONTAINS] + Reduce Output Operator [RS_139] + PartitionCols:_col0, _col1, _col2, _col3, _col4 + Group By Operator [GBY_138] (rows=922383 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"],aggregations:["sum(_col5)","sum(_col6)"],keys:_col0, _col1, _col2, _col3, _col4 + Select Operator [SEL_91] (rows=307461 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + Merge Join Operator [MERGEJOIN_246] (rows=307461 width=1436) + Output:["_col3","_col4","_col6","_col7","_col8","_col10","_col12","_col15","_col16"],keys:{"0":"_col2, _col1","1":"_col1, _col0"} + <-Map 34 [SIMPLE_EDGE] + SHUFFLE [RS_89] + PartitionCols:_col1, _col0 + Select Operator [SEL_81] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + TableScan [TS_80] (rows=1 width=0) + default@catalog_returns,catalog_returns,Tbl:PARTIAL,Col:NONE,Output:["cr_item_sk","cr_order_number","cr_return_quantity","cr_return_amount"] + <-Reducer 28 [SIMPLE_EDGE] + SHUFFLE [RS_88] + PartitionCols:_col2, _col1 + Merge Join Operator [MERGEJOIN_245] (rows=279510 width=1436) + Output:["_col1","_col2","_col3","_col4","_col6","_col7","_col8","_col10","_col12"],keys:{"0":"_col0","1":"_col0"} + <-Map 33 [SIMPLE_EDGE] + SHUFFLE [RS_86] + PartitionCols:_col0 + Select Operator [SEL_79] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_225] (rows=36524 width=1119) + predicate:((d_year = 2001) and d_date_sk is not null) + TableScan [TS_77] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] + <-Reducer 27 [SIMPLE_EDGE] + SHUFFLE [RS_85] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_244] (rows=254100 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col6","_col7","_col8","_col10"],keys:{"0":"_col1","1":"_col0"} + <-Map 26 [SIMPLE_EDGE] + SHUFFLE [RS_82] + PartitionCols:_col1 + Select Operator [SEL_73] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_223] (rows=1 width=0) + predicate:(cs_item_sk is not null and cs_sold_date_sk is not null) + TableScan [TS_71] (rows=1 width=0) + default@catalog_sales,catalog_sales,Tbl:PARTIAL,Col:NONE,Output:["cs_sold_date_sk","cs_item_sk","cs_order_number","cs_quantity","cs_ext_sales_price"] + <-Map 32 [SIMPLE_EDGE] + SHUFFLE [RS_83] + PartitionCols:_col0 + Select Operator [SEL_76] (rows=231000 width=1436) + Output:["_col0","_col1","_col2","_col3","_col5"] + Filter Operator [FIL_224] (rows=231000 width=1436) + predicate:((((((i_category = 'Sports') and i_item_sk is not null) and i_category_id is not null) and i_manufact_id is not null) and i_class_id is not null) and i_brand_id is not null) + TableScan [TS_74] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_brand_id","i_class_id","i_category_id","i_category","i_manufact_id"] + <-Reducer 38 [CONTAINS] + Reduce Output Operator [RS_139] + PartitionCols:_col0, _col1, _col2, _col3, _col4 + Group By Operator [GBY_138] (rows=922383 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"],aggregations:["sum(_col5)","sum(_col6)"],keys:_col0, _col1, _col2, _col3, _col4 + Select Operator [SEL_112] (rows=307461 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + Merge Join Operator [MERGEJOIN_249] (rows=307461 width=1436) + Output:["_col3","_col4","_col6","_col7","_col8","_col10","_col12","_col15","_col16"],keys:{"0":"_col2, _col1","1":"_col1, _col0"} + <-Map 41 [SIMPLE_EDGE] + SHUFFLE [RS_110] + PartitionCols:_col1, _col0 + Select Operator [SEL_102] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + TableScan [TS_101] (rows=1 width=0) + default@store_returns,store_returns,Tbl:PARTIAL,Col:NONE,Output:["sr_item_sk","sr_ticket_number","sr_return_quantity","sr_return_amt"] + <-Reducer 37 [SIMPLE_EDGE] + SHUFFLE [RS_109] + PartitionCols:_col2, _col1 + Merge Join Operator [MERGEJOIN_248] (rows=279510 width=1436) + Output:["_col1","_col2","_col3","_col4","_col6","_col7","_col8","_col10","_col12"],keys:{"0":"_col0","1":"_col0"} + <-Map 40 [SIMPLE_EDGE] + SHUFFLE [RS_107] + PartitionCols:_col0 + Select Operator [SEL_100] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_229] (rows=36524 width=1119) + predicate:((d_year = 2001) and d_date_sk is not null) + TableScan [TS_98] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] + <-Reducer 36 [SIMPLE_EDGE] + SHUFFLE [RS_106] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_247] (rows=254100 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col6","_col7","_col8","_col10"],keys:{"0":"_col1","1":"_col0"} + <-Map 35 [SIMPLE_EDGE] + SHUFFLE [RS_103] + PartitionCols:_col1 + Select Operator [SEL_94] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_227] (rows=1 width=0) + predicate:(ss_item_sk is not null and ss_sold_date_sk is not null) + TableScan [TS_92] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_ticket_number","ss_quantity","ss_ext_sales_price"] + <-Map 39 [SIMPLE_EDGE] + SHUFFLE [RS_104] + PartitionCols:_col0 + Select Operator [SEL_97] (rows=231000 width=1436) + Output:["_col0","_col1","_col2","_col3","_col5"] + Filter Operator [FIL_228] (rows=231000 width=1436) + predicate:((((((i_category = 'Sports') and i_item_sk is not null) and i_category_id is not null) and i_manufact_id is not null) and i_class_id is not null) and i_brand_id is not null) + TableScan [TS_95] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_brand_id","i_class_id","i_category_id","i_category","i_manufact_id"] + <-Reducer 45 [CONTAINS] + Reduce Output Operator [RS_139] + PartitionCols:_col0, _col1, _col2, _col3, _col4 + Group By Operator [GBY_138] (rows=922383 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"],aggregations:["sum(_col5)","sum(_col6)"],keys:_col0, _col1, _col2, _col3, _col4 + Select Operator [SEL_135] (rows=307461 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + Merge Join Operator [MERGEJOIN_252] (rows=307461 width=1436) + Output:["_col3","_col4","_col6","_col7","_col8","_col10","_col12","_col15","_col16"],keys:{"0":"_col2, _col1","1":"_col1, _col0"} + <-Map 48 [SIMPLE_EDGE] + SHUFFLE [RS_133] + PartitionCols:_col1, _col0 + Select Operator [SEL_125] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + TableScan [TS_124] (rows=1 width=0) + default@web_returns,web_returns,Tbl:PARTIAL,Col:NONE,Output:["wr_item_sk","wr_order_number","wr_return_quantity","wr_return_amt"] + <-Reducer 44 [SIMPLE_EDGE] + SHUFFLE [RS_132] + PartitionCols:_col2, _col1 + Merge Join Operator [MERGEJOIN_251] (rows=279510 width=1436) + Output:["_col1","_col2","_col3","_col4","_col6","_col7","_col8","_col10","_col12"],keys:{"0":"_col0","1":"_col0"} + <-Map 47 [SIMPLE_EDGE] + SHUFFLE [RS_130] + PartitionCols:_col0 + Select Operator [SEL_123] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_233] (rows=36524 width=1119) + predicate:((d_year = 2001) and d_date_sk is not null) + TableScan [TS_121] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] + <-Reducer 43 [SIMPLE_EDGE] + SHUFFLE [RS_129] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_250] (rows=254100 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col6","_col7","_col8","_col10"],keys:{"0":"_col1","1":"_col0"} + <-Map 42 [SIMPLE_EDGE] + SHUFFLE [RS_126] + PartitionCols:_col1 + Select Operator [SEL_117] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_231] (rows=1 width=0) + predicate:(ws_item_sk is not null and ws_sold_date_sk is not null) + TableScan [TS_115] (rows=1 width=0) + default@web_sales,web_sales,Tbl:PARTIAL,Col:NONE,Output:["ws_sold_date_sk","ws_item_sk","ws_order_number","ws_quantity","ws_ext_sales_price"] + <-Map 46 [SIMPLE_EDGE] + SHUFFLE [RS_127] + PartitionCols:_col0 + Select Operator [SEL_120] (rows=231000 width=1436) + Output:["_col0","_col1","_col2","_col3","_col5"] + Filter Operator [FIL_232] (rows=231000 width=1436) + predicate:((((((i_category = 'Sports') and i_item_sk is not null) and i_category_id is not null) and i_manufact_id is not null) and i_class_id is not null) and i_brand_id is not null) + TableScan [TS_118] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_brand_id","i_class_id","i_category_id","i_category","i_manufact_id"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_142] + PartitionCols:_col1, _col2, _col3, _col4 + Select Operator [SEL_70] (rows=461191 width=1436) + Output:["_col1","_col2","_col3","_col4","_col5","_col6"] + Group By Operator [GBY_69] (rows=461191 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4 + <-Union 5 [SIMPLE_EDGE] + <-Reducer 15 [CONTAINS] + Reduce Output Operator [RS_68] + PartitionCols:_col0, _col1, _col2, _col3, _col4 + Group By Operator [GBY_67] (rows=922383 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"],aggregations:["sum(_col5)","sum(_col6)"],keys:_col0, _col1, _col2, _col3, _col4 + Select Operator [SEL_65] (rows=922383 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + Select Operator [SEL_41] (rows=307461 width=1436) + Output:["_col1","_col2","_col3","_col4","_col5","_col6"] + Merge Join Operator [MERGEJOIN_240] (rows=307461 width=1436) + Output:["_col3","_col4","_col6","_col7","_col8","_col10","_col15","_col16"],keys:{"0":"_col2, _col1","1":"_col1, _col0"} + <-Map 18 [SIMPLE_EDGE] + SHUFFLE [RS_39] + PartitionCols:_col1, _col0 + Select Operator [SEL_31] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + TableScan [TS_30] (rows=1 width=0) + default@store_returns,store_returns,Tbl:PARTIAL,Col:NONE,Output:["sr_item_sk","sr_ticket_number","sr_return_quantity","sr_return_amt"] + <-Reducer 14 [SIMPLE_EDGE] + SHUFFLE [RS_38] + PartitionCols:_col2, _col1 + Merge Join Operator [MERGEJOIN_239] (rows=279510 width=1436) + Output:["_col1","_col2","_col3","_col4","_col6","_col7","_col8","_col10"],keys:{"0":"_col0","1":"_col0"} + <-Map 17 [SIMPLE_EDGE] + SHUFFLE [RS_36] + PartitionCols:_col0 + Select Operator [SEL_29] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_217] (rows=36524 width=1119) + predicate:((d_year = 2002) and d_date_sk is not null) + TableScan [TS_27] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] + <-Reducer 13 [SIMPLE_EDGE] + SHUFFLE [RS_35] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_238] (rows=254100 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col6","_col7","_col8","_col10"],keys:{"0":"_col1","1":"_col0"} + <-Map 12 [SIMPLE_EDGE] + SHUFFLE [RS_32] + PartitionCols:_col1 + Select Operator [SEL_23] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_215] (rows=1 width=0) + predicate:(ss_item_sk is not null and ss_sold_date_sk is not null) + TableScan [TS_21] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_ticket_number","ss_quantity","ss_ext_sales_price"] + <-Map 16 [SIMPLE_EDGE] + SHUFFLE [RS_33] + PartitionCols:_col0 + Select Operator [SEL_26] (rows=231000 width=1436) + Output:["_col0","_col1","_col2","_col3","_col5"] + Filter Operator [FIL_216] (rows=231000 width=1436) + predicate:((((((i_category = 'Sports') and i_item_sk is not null) and i_category_id is not null) and i_manufact_id is not null) and i_class_id is not null) and i_brand_id is not null) + TableScan [TS_24] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_brand_id","i_class_id","i_category_id","i_category","i_manufact_id"] + <-Reducer 22 [CONTAINS] + Reduce Output Operator [RS_68] + PartitionCols:_col0, _col1, _col2, _col3, _col4 + Group By Operator [GBY_67] (rows=922383 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"],aggregations:["sum(_col5)","sum(_col6)"],keys:_col0, _col1, _col2, _col3, _col4 + Select Operator [SEL_65] (rows=922383 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + Select Operator [SEL_64] (rows=307461 width=1436) + Output:["_col1","_col2","_col3","_col4","_col5","_col6"] + Merge Join Operator [MERGEJOIN_243] (rows=307461 width=1436) + Output:["_col3","_col4","_col6","_col7","_col8","_col10","_col15","_col16"],keys:{"0":"_col2, _col1","1":"_col1, _col0"} + <-Map 25 [SIMPLE_EDGE] + SHUFFLE [RS_62] + PartitionCols:_col1, _col0 + Select Operator [SEL_54] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + TableScan [TS_53] (rows=1 width=0) + default@web_returns,web_returns,Tbl:PARTIAL,Col:NONE,Output:["wr_item_sk","wr_order_number","wr_return_quantity","wr_return_amt"] + <-Reducer 21 [SIMPLE_EDGE] + SHUFFLE [RS_61] + PartitionCols:_col2, _col1 + Merge Join Operator [MERGEJOIN_242] (rows=279510 width=1436) + Output:["_col1","_col2","_col3","_col4","_col6","_col7","_col8","_col10"],keys:{"0":"_col0","1":"_col0"} + <-Map 24 [SIMPLE_EDGE] + SHUFFLE [RS_59] + PartitionCols:_col0 + Select Operator [SEL_52] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_221] (rows=36524 width=1119) + predicate:((d_year = 2002) and d_date_sk is not null) + TableScan [TS_50] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] + <-Reducer 20 [SIMPLE_EDGE] + SHUFFLE [RS_58] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_241] (rows=254100 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col6","_col7","_col8","_col10"],keys:{"0":"_col1","1":"_col0"} + <-Map 19 [SIMPLE_EDGE] + SHUFFLE [RS_55] + PartitionCols:_col1 + Select Operator [SEL_46] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_219] (rows=1 width=0) + predicate:(ws_item_sk is not null and ws_sold_date_sk is not null) + TableScan [TS_44] (rows=1 width=0) + default@web_sales,web_sales,Tbl:PARTIAL,Col:NONE,Output:["ws_sold_date_sk","ws_item_sk","ws_order_number","ws_quantity","ws_ext_sales_price"] + <-Map 23 [SIMPLE_EDGE] + SHUFFLE [RS_56] + PartitionCols:_col0 + Select Operator [SEL_49] (rows=231000 width=1436) + Output:["_col0","_col1","_col2","_col3","_col5"] + Filter Operator [FIL_220] (rows=231000 width=1436) + predicate:((((((i_category = 'Sports') and i_item_sk is not null) and i_category_id is not null) and i_manufact_id is not null) and i_class_id is not null) and i_brand_id is not null) + TableScan [TS_47] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_brand_id","i_class_id","i_category_id","i_category","i_manufact_id"] + <-Reducer 4 [CONTAINS] + Reduce Output Operator [RS_68] + PartitionCols:_col0, _col1, _col2, _col3, _col4 + Group By Operator [GBY_67] (rows=922383 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"],aggregations:["sum(_col5)","sum(_col6)"],keys:_col0, _col1, _col2, _col3, _col4 + Select Operator [SEL_65] (rows=922383 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + Select Operator [SEL_20] (rows=307461 width=1436) + Output:["_col1","_col2","_col3","_col4","_col5","_col6"] + Merge Join Operator [MERGEJOIN_237] (rows=307461 width=1436) + Output:["_col3","_col4","_col6","_col7","_col8","_col10","_col15","_col16"],keys:{"0":"_col2, _col1","1":"_col1, _col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col1, _col0 + Select Operator [SEL_10] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + TableScan [TS_9] (rows=1 width=0) + default@catalog_returns,catalog_returns,Tbl:PARTIAL,Col:NONE,Output:["cr_item_sk","cr_order_number","cr_return_quantity","cr_return_amount"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_17] + PartitionCols:_col2, _col1 + Merge Join Operator [MERGEJOIN_236] (rows=279510 width=1436) + Output:["_col1","_col2","_col3","_col4","_col6","_col7","_col8","_col10"],keys:{"0":"_col0","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_213] (rows=36524 width=1119) + predicate:((d_year = 2002) and d_date_sk is not null) + TableScan [TS_6] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_14] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_235] (rows=254100 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col6","_col7","_col8","_col10"],keys:{"0":"_col1","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_11] + PartitionCols:_col1 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_211] (rows=1 width=0) + predicate:(cs_item_sk is not null and cs_sold_date_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@catalog_sales,catalog_sales,Tbl:PARTIAL,Col:NONE,Output:["cs_sold_date_sk","cs_item_sk","cs_order_number","cs_quantity","cs_ext_sales_price"] + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=231000 width=1436) + Output:["_col0","_col1","_col2","_col3","_col5"] + Filter Operator [FIL_212] (rows=231000 width=1436) + predicate:((((((i_category = 'Sports') and i_item_sk is not null) and i_category_id is not null) and i_manufact_id is not null) and i_class_id is not null) and i_brand_id is not null) + TableScan [TS_3] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_brand_id","i_class_id","i_category_id","i_category","i_manufact_id"] diff --git a/ql/src/test/results/clientpositive/perf/query76.q.out b/ql/src/test/results/clientpositive/perf/query76.q.out index e540ee7..c246000 100644 --- a/ql/src/test/results/clientpositive/perf/query76.q.out +++ b/ql/src/test/results/clientpositive/perf/query76.q.out @@ -15,270 +15,141 @@ Reducer 5 <- Union 4 (SIMPLE_EDGE) Reducer 6 <- Reducer 5 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 6 - File Output Operator [FS_59] - compressed:false - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_58] - Number of rows:100 - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_57] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 838530 Data size: 1204362280 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_56] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: int), _col3 (type: int), _col4 (type: string) - sort order:+++++ - Statistics:Num rows: 838530 Data size: 1204362280 Basic stats: COMPLETE Column stats: NONE - value expressions:_col5 (type: bigint), _col6 (type: decimal(17,2)) - Group By Operator [GBY_54] - | aggregations:["count(VALUE._col0)","sum(VALUE._col1)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: int), KEY._col3 (type: int), KEY._col4 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 838530 Data size: 1204362280 Basic stats: COMPLETE Column stats: NONE - |<-Union 4 [SIMPLE_EDGE] - |<-Reducer 11 [CONTAINS] - | Reduce Output Operator [RS_53] - | key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: int), _col3 (type: int), _col4 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: int), _col3 (type: int), _col4 (type: string) - | sort order:+++++ - | Statistics:Num rows: 1677060 Data size: 2408724561 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col5 (type: bigint), _col6 (type: decimal(17,2)) - | Group By Operator [GBY_52] - | aggregations:["count()","sum(_col5)"] - | keys:_col0 (type: string), _col1 (type: string), _col2 (type: int), _col3 (type: int), _col4 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 1677060 Data size: 2408724561 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_31] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_87] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col3","_col5","_col7","_col8"] - | | Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - | |<-Map 13 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_29] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: int), _col2 (type: int) - | | Select Operator [SEL_24] - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_80] - | | predicate:d_date_sk is not null (type: boolean) - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_22] - | | alias:date_dim - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_28] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: decimal(7,2)), _col5 (type: string) - | Merge Join Operator [MERGEJOIN_86] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col0","_col3","_col5"] - | | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - | |<-Map 12 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_26] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: string) - | | Select Operator [SEL_21] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_79] - | | predicate:i_item_sk is not null (type: boolean) - | | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_19] - | | alias:item - | | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_25] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col3 (type: decimal(7,2)) - | Select Operator [SEL_18] - | outputColumnNames:["_col0","_col1","_col3"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_78] - | predicate:((ws_item_sk is not null and ws_web_page_sk is null) and ws_sold_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_16] - | alias:web_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Reducer 16 [CONTAINS] - | Reduce Output Operator [RS_53] - | key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: int), _col3 (type: int), _col4 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: int), _col3 (type: int), _col4 (type: string) - | sort order:+++++ - | Statistics:Num rows: 1677060 Data size: 2408724561 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col5 (type: bigint), _col6 (type: decimal(17,2)) - | Group By Operator [GBY_52] - | aggregations:["count()","sum(_col5)"] - | keys:_col0 (type: string), _col1 (type: string), _col2 (type: int), _col3 (type: int), _col4 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 1677060 Data size: 2408724561 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_49] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_89] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col3","_col5","_col7","_col8"] - | | Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - | |<-Map 18 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_47] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: int), _col2 (type: int) - | | Select Operator [SEL_42] - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_83] - | | predicate:d_date_sk is not null (type: boolean) - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_40] - | | alias:date_dim - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 15 [SIMPLE_EDGE] - | Reduce Output Operator [RS_46] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: decimal(7,2)), _col5 (type: string) - | Merge Join Operator [MERGEJOIN_88] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col0","_col3","_col5"] - | | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - | |<-Map 14 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_43] - | | key expressions:_col2 (type: int) - | | Map-reduce partition columns:_col2 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col0 (type: int), _col3 (type: decimal(7,2)) - | | Select Operator [SEL_36] - | | outputColumnNames:["_col0","_col2","_col3"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_81] - | | predicate:((cs_item_sk is not null and cs_warehouse_sk is null) and cs_sold_date_sk is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_34] - | | alias:catalog_sales - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 17 [SIMPLE_EDGE] - | Reduce Output Operator [RS_44] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_39] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_82] - | predicate:i_item_sk is not null (type: boolean) - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_37] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [CONTAINS] - Reduce Output Operator [RS_53] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: int), _col3 (type: int), _col4 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: int), _col3 (type: int), _col4 (type: string) - sort order:+++++ - Statistics:Num rows: 1677060 Data size: 2408724561 Basic stats: COMPLETE Column stats: NONE - value expressions:_col5 (type: bigint), _col6 (type: decimal(17,2)) - Group By Operator [GBY_52] - aggregations:["count()","sum(_col5)"] - keys:_col0 (type: string), _col1 (type: string), _col2 (type: int), _col3 (type: int), _col4 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - Statistics:Num rows: 1677060 Data size: 2408724561 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_15] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_85] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col3","_col5","_col7","_col8"] - | Statistics:Num rows: 559020 Data size: 802908187 Basic stats: COMPLETE Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - | Reduce Output Operator [RS_13] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: int) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_77] - | predicate:d_date_sk is not null (type: boolean) - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_12] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: decimal(7,2)), _col5 (type: string) - Merge Join Operator [MERGEJOIN_84] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col3","_col5"] - | Statistics:Num rows: 508200 Data size: 729916518 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_9] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col3 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col3"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_75] - | predicate:((ss_addr_sk is null and ss_item_sk is not null) and ss_sold_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_76] - predicate:i_item_sk is not null (type: boolean) - Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:item - Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 6 + File Output Operator [FS_59] + Limit [LIM_58] (rows=100 width=1436) + Number of rows:100 + Select Operator [SEL_57] (rows=838530 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_56] + Group By Operator [GBY_54] (rows=838530 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"],aggregations:["count(VALUE._col0)","sum(VALUE._col1)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4 + <-Union 4 [SIMPLE_EDGE] + <-Reducer 11 [CONTAINS] + Reduce Output Operator [RS_53] + PartitionCols:_col0, _col1, _col2, _col3, _col4 + Group By Operator [GBY_52] (rows=1677060 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"],aggregations:["count()","sum(_col5)"],keys:_col0, _col1, _col2, _col3, _col4 + Select Operator [SEL_31] (rows=559020 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Merge Join Operator [MERGEJOIN_87] (rows=559020 width=1436) + Output:["_col3","_col5","_col7","_col8"],keys:{"0":"_col0","1":"_col0"} + <-Map 13 [SIMPLE_EDGE] + SHUFFLE [RS_29] + PartitionCols:_col0 + Select Operator [SEL_24] (rows=73049 width=1119) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_80] (rows=73049 width=1119) + predicate:d_date_sk is not null + TableScan [TS_22] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_qoy"] + <-Reducer 10 [SIMPLE_EDGE] + SHUFFLE [RS_28] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_86] (rows=508200 width=1436) + Output:["_col0","_col3","_col5"],keys:{"0":"_col1","1":"_col0"} + <-Map 12 [SIMPLE_EDGE] + SHUFFLE [RS_26] + PartitionCols:_col0 + Select Operator [SEL_21] (rows=462000 width=1436) + Output:["_col0","_col1"] + Filter Operator [FIL_79] (rows=462000 width=1436) + predicate:i_item_sk is not null + TableScan [TS_19] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_category"] + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col1 + Select Operator [SEL_18] (rows=1 width=0) + Output:["_col0","_col1","_col3"] + Filter Operator [FIL_78] (rows=1 width=0) + predicate:((ws_item_sk is not null and ws_web_page_sk is null) and ws_sold_date_sk is not null) + TableScan [TS_16] (rows=1 width=0) + default@web_sales,web_sales,Tbl:PARTIAL,Col:NONE,Output:["ws_sold_date_sk","ws_item_sk","ws_web_page_sk","ws_ext_sales_price"] + <-Reducer 16 [CONTAINS] + Reduce Output Operator [RS_53] + PartitionCols:_col0, _col1, _col2, _col3, _col4 + Group By Operator [GBY_52] (rows=1677060 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"],aggregations:["count()","sum(_col5)"],keys:_col0, _col1, _col2, _col3, _col4 + Select Operator [SEL_49] (rows=559020 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Merge Join Operator [MERGEJOIN_89] (rows=559020 width=1436) + Output:["_col3","_col5","_col7","_col8"],keys:{"0":"_col0","1":"_col0"} + <-Map 18 [SIMPLE_EDGE] + SHUFFLE [RS_47] + PartitionCols:_col0 + Select Operator [SEL_42] (rows=73049 width=1119) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_83] (rows=73049 width=1119) + predicate:d_date_sk is not null + TableScan [TS_40] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_qoy"] + <-Reducer 15 [SIMPLE_EDGE] + SHUFFLE [RS_46] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_88] (rows=508200 width=1436) + Output:["_col0","_col3","_col5"],keys:{"0":"_col2","1":"_col0"} + <-Map 14 [SIMPLE_EDGE] + SHUFFLE [RS_43] + PartitionCols:_col2 + Select Operator [SEL_36] (rows=1 width=0) + Output:["_col0","_col2","_col3"] + Filter Operator [FIL_81] (rows=1 width=0) + predicate:((cs_item_sk is not null and cs_warehouse_sk is null) and cs_sold_date_sk is not null) + TableScan [TS_34] (rows=1 width=0) + default@catalog_sales,catalog_sales,Tbl:PARTIAL,Col:NONE,Output:["cs_sold_date_sk","cs_warehouse_sk","cs_item_sk","cs_ext_sales_price"] + <-Map 17 [SIMPLE_EDGE] + SHUFFLE [RS_44] + PartitionCols:_col0 + Select Operator [SEL_39] (rows=462000 width=1436) + Output:["_col0","_col1"] + Filter Operator [FIL_82] (rows=462000 width=1436) + predicate:i_item_sk is not null + TableScan [TS_37] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_category"] + <-Reducer 3 [CONTAINS] + Reduce Output Operator [RS_53] + PartitionCols:_col0, _col1, _col2, _col3, _col4 + Group By Operator [GBY_52] (rows=1677060 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"],aggregations:["count()","sum(_col5)"],keys:_col0, _col1, _col2, _col3, _col4 + Select Operator [SEL_15] (rows=559020 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Merge Join Operator [MERGEJOIN_85] (rows=559020 width=1436) + Output:["_col3","_col5","_col7","_col8"],keys:{"0":"_col0","1":"_col0"} + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=73049 width=1119) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_77] (rows=73049 width=1119) + predicate:d_date_sk is not null + TableScan [TS_6] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_qoy"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_84] (rows=508200 width=1436) + Output:["_col0","_col3","_col5"],keys:{"0":"_col1","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col1 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col3"] + Filter Operator [FIL_75] (rows=1 width=0) + predicate:((ss_addr_sk is null and ss_item_sk is not null) and ss_sold_date_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_addr_sk","ss_ext_sales_price"] + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_10] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=462000 width=1436) + Output:["_col0","_col1"] + Filter Operator [FIL_76] (rows=462000 width=1436) + predicate:i_item_sk is not null + TableScan [TS_3] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_category"] diff --git a/ql/src/test/results/clientpositive/perf/query79.q.out b/ql/src/test/results/clientpositive/perf/query79.q.out index a0d5a51..96d7cb0 100644 --- a/ql/src/test/results/clientpositive/perf/query79.q.out +++ b/ql/src/test/results/clientpositive/perf/query79.q.out @@ -13,169 +13,90 @@ Reducer 6 <- Map 11 (SIMPLE_EDGE), Reducer 5 (SIMPLE_EDGE) Reducer 7 <- Reducer 6 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 7 - File Output Operator [FS_37] - compressed:false - Statistics:Num rows: 100 Data size: 86000 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_36] - Number of rows:100 - Statistics:Num rows: 100 Data size: 86000 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_35] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_34] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col5 (type: decimal(17,2)) - sort order:++++ - Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: int), _col4 (type: decimal(17,2)) - Select Operator [SEL_33] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_60] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2","_col3","_col4","_col6","_col7"] - | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_31] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string) - | Select Operator [SEL_29] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_56] - | predicate:c_customer_sk is not null (type: boolean) - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_27] - | alias:customer - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_30] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 12152 Data size: 13599051 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col2 (type: string), _col3 (type: decimal(17,2)), _col4 (type: decimal(17,2)) - Select Operator [SEL_25] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - Statistics:Num rows: 12152 Data size: 13599051 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_24] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] - | keys:KEY._col0 (type: int), KEY._col1 (type: int), KEY._col2 (type: int), KEY._col3 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 12152 Data size: 13599051 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_23] - key expressions:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: string) - Map-reduce partition columns:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: string) - sort order:++++ - Statistics:Num rows: 24305 Data size: 27199223 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: decimal(17,2)), _col5 (type: decimal(17,2)) - Group By Operator [GBY_22] - aggregations:["sum(_col6)","sum(_col7)"] - keys:_col1 (type: int), _col3 (type: int), _col5 (type: int), _col13 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 24305 Data size: 27199223 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_21] - outputColumnNames:["_col1","_col3","_col5","_col13","_col6","_col7"] - Statistics:Num rows: 24305 Data size: 27199223 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_59] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col3","_col5","_col6","_col7","_col13"] - | Statistics:Num rows: 24305 Data size: 27199223 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 6000 Data size: 642000 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_11] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 6000 Data size: 642000 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_55] - | predicate:(((hd_dep_count = 8) or (hd_vehicle_count > 0)) and hd_demo_sk is not null) (type: boolean) - | Statistics:Num rows: 6000 Data size: 642000 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:household_demographics - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 22096 Data size: 24726566 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col3 (type: int), _col5 (type: int), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)), _col13 (type: string) - Merge Join Operator [MERGEJOIN_58] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col4 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3","_col5","_col6","_col7","_col13"] - | Statistics:Num rows: 22096 Data size: 24726566 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_16] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col2 (type: string) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col2"] - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_54] - | predicate:(s_number_employees BETWEEN 200 AND 295 and s_store_sk is not null) (type: boolean) - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:store - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_15] - key expressions:_col4 (type: int) - Map-reduce partition columns:_col4 (type: int) - sort order:+ - Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col5 (type: int), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_57] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_12] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: int), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_52] - | predicate:(((ss_sold_date_sk is not null and ss_store_sk is not null) and ss_hdemo_sk is not null) and ss_customer_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_13] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_53] - predicate:(((d_dow = 1) and (d_year) IN (1998, 1999, 2000)) and d_date_sk is not null) (type: boolean) - Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:date_dim - Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 7 + File Output Operator [FS_37] + Limit [LIM_36] (rows=100 width=860) + Number of rows:100 + Select Operator [SEL_35] (rows=88000001 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_34] + Select Operator [SEL_33] (rows=88000001 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Merge Join Operator [MERGEJOIN_60] (rows=88000001 width=860) + Output:["_col0","_col2","_col3","_col4","_col6","_col7"],keys:{"0":"_col1","1":"_col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_31] + PartitionCols:_col0 + Select Operator [SEL_29] (rows=80000000 width=860) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_56] (rows=80000000 width=860) + predicate:c_customer_sk is not null + TableScan [TS_27] (rows=80000000 width=860) + default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_first_name","c_last_name"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_30] + PartitionCols:_col1 + Select Operator [SEL_25] (rows=12152 width=1119) + Output:["_col0","_col1","_col2","_col3","_col4"] + Group By Operator [GBY_24] (rows=12152 width=1119) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3 + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_23] + PartitionCols:_col0, _col1, _col2, _col3 + Group By Operator [GBY_22] (rows=24305 width=1119) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["sum(_col6)","sum(_col7)"],keys:_col1, _col3, _col5, _col13 + Select Operator [SEL_21] (rows=24305 width=1119) + Output:["_col1","_col3","_col5","_col13","_col6","_col7"] + Merge Join Operator [MERGEJOIN_59] (rows=24305 width=1119) + Output:["_col1","_col3","_col5","_col6","_col7","_col13"],keys:{"0":"_col2","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=6000 width=107) + Output:["_col0"] + Filter Operator [FIL_55] (rows=6000 width=107) + predicate:(((hd_dep_count = 8) or (hd_vehicle_count > 0)) and hd_demo_sk is not null) + TableScan [TS_9] (rows=7200 width=107) + default@household_demographics,household_demographics,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_dep_count","hd_vehicle_count"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_58] (rows=22096 width=1119) + Output:["_col1","_col2","_col3","_col5","_col6","_col7","_col13"],keys:{"0":"_col4","1":"_col0"} + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=852 width=1910) + Output:["_col0","_col2"] + Filter Operator [FIL_54] (rows=852 width=1910) + predicate:(s_number_employees BETWEEN 200 AND 295 and s_store_sk is not null) + TableScan [TS_6] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_number_employees","s_city"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col4 + Merge Join Operator [MERGEJOIN_57] (rows=20088 width=1119) + Output:["_col1","_col2","_col3","_col4","_col5","_col6","_col7"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] + Filter Operator [FIL_52] (rows=1 width=0) + predicate:(((ss_sold_date_sk is not null and ss_store_sk is not null) and ss_hdemo_sk is not null) and ss_customer_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_customer_sk","ss_hdemo_sk","ss_addr_sk","ss_store_sk","ss_ticket_number","ss_coupon_amt","ss_net_profit"] + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_53] (rows=18262 width=1119) + predicate:(((d_dow = 1) and (d_year) IN (1998, 1999, 2000)) and d_date_sk is not null) + TableScan [TS_3] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_dow"] diff --git a/ql/src/test/results/clientpositive/perf/query80.q.out b/ql/src/test/results/clientpositive/perf/query80.q.out index 37cb542..364b597 100644 --- a/ql/src/test/results/clientpositive/perf/query80.q.out +++ b/ql/src/test/results/clientpositive/perf/query80.q.out @@ -27,567 +27,290 @@ Reducer 7 <- Reducer 6 (SIMPLE_EDGE), Union 8 (CONTAINS) Reducer 9 <- Union 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 10 - File Output Operator [FS_125] - compressed:false - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_124] - Number of rows:100 - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_123] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 419265 Data size: 602181139 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 9 [SIMPLE_EDGE] - Reduce Output Operator [RS_122] - key expressions:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 419265 Data size: 602181139 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: decimal(27,2)), _col3 (type: decimal(32,2)), _col4 (type: decimal(33,2)) - Select Operator [SEL_121] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - Statistics:Num rows: 419265 Data size: 602181139 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_120] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: string) - | outputColumnNames:["_col0","_col1","_col3","_col4","_col5"] - | Statistics:Num rows: 419265 Data size: 602181139 Basic stats: COMPLETE Column stats: NONE - |<-Union 8 [SIMPLE_EDGE] - |<-Reducer 22 [CONTAINS] - | Reduce Output Operator [RS_119] - | key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: string) - | sort order:+++ - | Statistics:Num rows: 838530 Data size: 1204362279 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: decimal(27,2)), _col4 (type: decimal(32,2)), _col5 (type: decimal(33,2)) - | Group By Operator [GBY_118] - | aggregations:["sum(_col2)","sum(_col3)","sum(_col4)"] - | keys:_col0 (type: string), _col1 (type: string), '0' (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 838530 Data size: 1204362279 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_75] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 93170 Data size: 133818031 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_74] - | | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] - | | keys:KEY._col0 (type: string) - | | outputColumnNames:["_col0","_col1","_col2","_col3"] - | | Statistics:Num rows: 93170 Data size: 133818031 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 21 [SIMPLE_EDGE] - | Reduce Output Operator [RS_73] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 186340 Data size: 267636062 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: decimal(17,2)), _col2 (type: decimal(22,2)), _col3 (type: decimal(23,2)) - | Group By Operator [GBY_72] - | aggregations:["sum(_col1)","sum(_col2)","sum(_col3)"] - | keys:_col0 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 186340 Data size: 267636062 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_70] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 186340 Data size: 267636062 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_211] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col5","_col6","_col9","_col10","_col14"] - | | Statistics:Num rows: 186340 Data size: 267636062 Basic stats: COMPLETE Column stats: NONE - | |<-Map 27 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_68] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1150 Data size: 1356710 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_54] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 1150 Data size: 1356710 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_194] - | | predicate:((p_channel_tv = 'N') and p_promo_sk is not null) (type: boolean) - | | Statistics:Num rows: 1150 Data size: 1356710 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_52] - | | alias:promotion - | | Statistics:Num rows: 2300 Data size: 2713420 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 20 [SIMPLE_EDGE] - | Reduce Output Operator [RS_67] - | key expressions:_col3 (type: int) - | Map-reduce partition columns:_col3 (type: int) - | sort order:+ - | Statistics:Num rows: 169400 Data size: 243305506 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col14 (type: string) - | Merge Join Operator [MERGEJOIN_210] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col3","_col5","_col6","_col9","_col10","_col14"] - | | Statistics:Num rows: 169400 Data size: 243305506 Basic stats: COMPLETE Column stats: NONE - | |<-Map 26 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_65] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 154000 Data size: 221186819 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_51] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 154000 Data size: 221186819 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_193] - | | predicate:((i_current_price > 50) and i_item_sk is not null) (type: boolean) - | | Statistics:Num rows: 154000 Data size: 221186819 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_49] - | | alias:item - | | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 19 [SIMPLE_EDGE] - | Reduce Output Operator [RS_64] - | key expressions:_col2 (type: int) - | Map-reduce partition columns:_col2 (type: int) - | sort order:+ - | Statistics:Num rows: 50600 Data size: 23318689 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col14 (type: string) - | Merge Join Operator [MERGEJOIN_209] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col2","_col3","_col5","_col6","_col9","_col10","_col14"] - | | Statistics:Num rows: 50600 Data size: 23318689 Basic stats: COMPLETE Column stats: NONE - | |<-Map 25 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_62] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 46000 Data size: 21198808 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: string) - | | Select Operator [SEL_48] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 46000 Data size: 21198808 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_192] - | | predicate:cp_catalog_page_sk is not null (type: boolean) - | | Statistics:Num rows: 46000 Data size: 21198808 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_46] - | | alias:catalog_page - | | Statistics:Num rows: 46000 Data size: 21198808 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 18 [SIMPLE_EDGE] - | Reduce Output Operator [RS_61] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col2 (type: int), _col3 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)) - | Merge Join Operator [MERGEJOIN_208] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col2","_col3","_col5","_col6","_col9","_col10"] - | | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | |<-Map 24 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_59] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_45] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_191] - | | predicate:(d_date BETWEEN 1998-08-04 AND 1998-09-04 and d_date_sk is not null) (type: boolean) - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_43] - | | alias:date_dim - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 17 [SIMPLE_EDGE] - | Reduce Output Operator [RS_58] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)) - | Merge Join Operator [MERGEJOIN_202] - | | condition map:[{"":"Left Outer Join0 to 1"}] - | | keys:{"0":"_col2 (type: int), _col4 (type: int)","1":"_col0 (type: int), _col1 (type: int)"} - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col5","_col6","_col9","_col10"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 16 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_55] - | | key expressions:_col2 (type: int), _col4 (type: int) - | | Map-reduce partition columns:_col2 (type: int), _col4 (type: int) - | | sort order:++ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col0 (type: int), _col1 (type: int), _col3 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)) - | | Select Operator [SEL_40] - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_189] - | | predicate:(((cs_sold_date_sk is not null and cs_catalog_page_sk is not null) and cs_item_sk is not null) and cs_promo_sk is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_38] - | | alias:catalog_sales - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 23 [SIMPLE_EDGE] - | Reduce Output Operator [RS_56] - | key expressions:_col0 (type: int), _col1 (type: int) - | Map-reduce partition columns:_col0 (type: int), _col1 (type: int) - | sort order:++ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col2 (type: decimal(7,2)), _col3 (type: decimal(7,2)) - | Select Operator [SEL_42] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_41] - | alias:catalog_returns - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Reducer 34 [CONTAINS] - | Reduce Output Operator [RS_119] - | key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: string) - | sort order:+++ - | Statistics:Num rows: 838530 Data size: 1204362279 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: decimal(27,2)), _col4 (type: decimal(32,2)), _col5 (type: decimal(33,2)) - | Group By Operator [GBY_118] - | aggregations:["sum(_col2)","sum(_col3)","sum(_col4)"] - | keys:_col0 (type: string), _col1 (type: string), '0' (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 838530 Data size: 1204362279 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_115] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 93170 Data size: 133818031 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_114] - | | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] - | | keys:KEY._col0 (type: string) - | | outputColumnNames:["_col0","_col1","_col2","_col3"] - | | Statistics:Num rows: 93170 Data size: 133818031 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 33 [SIMPLE_EDGE] - | Reduce Output Operator [RS_113] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 186340 Data size: 267636062 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: decimal(17,2)), _col2 (type: decimal(22,2)), _col3 (type: decimal(23,2)) - | Group By Operator [GBY_112] - | aggregations:["sum(_col1)","sum(_col2)","sum(_col3)"] - | keys:_col0 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 186340 Data size: 267636062 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_110] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 186340 Data size: 267636062 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_215] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col5","_col6","_col9","_col10","_col14"] - | | Statistics:Num rows: 186340 Data size: 267636062 Basic stats: COMPLETE Column stats: NONE - | |<-Map 39 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_108] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1150 Data size: 1356710 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_94] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 1150 Data size: 1356710 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_200] - | | predicate:((p_channel_tv = 'N') and p_promo_sk is not null) (type: boolean) - | | Statistics:Num rows: 1150 Data size: 1356710 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_92] - | | alias:promotion - | | Statistics:Num rows: 2300 Data size: 2713420 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 32 [SIMPLE_EDGE] - | Reduce Output Operator [RS_107] - | key expressions:_col3 (type: int) - | Map-reduce partition columns:_col3 (type: int) - | sort order:+ - | Statistics:Num rows: 169400 Data size: 243305506 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col14 (type: string) - | Merge Join Operator [MERGEJOIN_214] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col3","_col5","_col6","_col9","_col10","_col14"] - | | Statistics:Num rows: 169400 Data size: 243305506 Basic stats: COMPLETE Column stats: NONE - | |<-Map 38 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_105] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 154000 Data size: 221186819 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_91] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 154000 Data size: 221186819 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_199] - | | predicate:((i_current_price > 50) and i_item_sk is not null) (type: boolean) - | | Statistics:Num rows: 154000 Data size: 221186819 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_89] - | | alias:item - | | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 31 [SIMPLE_EDGE] - | Reduce Output Operator [RS_104] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 44193 Data size: 49453132 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col14 (type: string) - | Merge Join Operator [MERGEJOIN_213] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col3","_col5","_col6","_col9","_col10","_col14"] - | | Statistics:Num rows: 44193 Data size: 49453132 Basic stats: COMPLETE Column stats: NONE - | |<-Map 37 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_102] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 84 Data size: 155408 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: string) - | | Select Operator [SEL_88] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 84 Data size: 155408 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_198] - | | predicate:web_site_sk is not null (type: boolean) - | | Statistics:Num rows: 84 Data size: 155408 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_86] - | | alias:web_site - | | Statistics:Num rows: 84 Data size: 155408 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 30 [SIMPLE_EDGE] - | Reduce Output Operator [RS_101] - | key expressions:_col2 (type: int) - | Map-reduce partition columns:_col2 (type: int) - | sort order:+ - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col3 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)) - | Merge Join Operator [MERGEJOIN_212] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col2","_col3","_col5","_col6","_col9","_col10"] - | | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | |<-Map 36 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_99] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_85] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_197] - | | predicate:(d_date BETWEEN 1998-08-04 AND 1998-09-04 and d_date_sk is not null) (type: boolean) - | | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_83] - | | alias:date_dim - | | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 29 [SIMPLE_EDGE] - | Reduce Output Operator [RS_98] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)) - | Merge Join Operator [MERGEJOIN_203] - | | condition map:[{"":"Left Outer Join0 to 1"}] - | | keys:{"0":"_col1 (type: int), _col4 (type: int)","1":"_col0 (type: int), _col1 (type: int)"} - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col5","_col6","_col9","_col10"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 28 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_95] - | | key expressions:_col1 (type: int), _col4 (type: int) - | | Map-reduce partition columns:_col1 (type: int), _col4 (type: int) - | | sort order:++ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col0 (type: int), _col2 (type: int), _col3 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)) - | | Select Operator [SEL_80] - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_195] - | | predicate:(((ws_sold_date_sk is not null and ws_web_site_sk is not null) and ws_item_sk is not null) and ws_promo_sk is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_78] - | | alias:web_sales - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 35 [SIMPLE_EDGE] - | Reduce Output Operator [RS_96] - | key expressions:_col0 (type: int), _col1 (type: int) - | Map-reduce partition columns:_col0 (type: int), _col1 (type: int) - | sort order:++ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col2 (type: decimal(7,2)), _col3 (type: decimal(7,2)) - | Select Operator [SEL_82] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_81] - | alias:web_returns - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Reducer 7 [CONTAINS] - Reduce Output Operator [RS_119] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: string) - sort order:+++ - Statistics:Num rows: 838530 Data size: 1204362279 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: decimal(27,2)), _col4 (type: decimal(32,2)), _col5 (type: decimal(33,2)) - Group By Operator [GBY_118] - aggregations:["sum(_col2)","sum(_col3)","sum(_col4)"] - keys:_col0 (type: string), _col1 (type: string), '0' (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 838530 Data size: 1204362279 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_37] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - Statistics:Num rows: 93170 Data size: 133818031 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_36] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] - | keys:KEY._col0 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 93170 Data size: 133818031 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_35] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 186340 Data size: 267636062 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: decimal(17,2)), _col2 (type: decimal(22,2)), _col3 (type: decimal(23,2)) - Group By Operator [GBY_34] - aggregations:["sum(_col1)","sum(_col2)","sum(_col3)"] - keys:_col0 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 186340 Data size: 267636062 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_32] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 186340 Data size: 267636062 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_207] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col5","_col6","_col9","_col10","_col14"] - | Statistics:Num rows: 186340 Data size: 267636062 Basic stats: COMPLETE Column stats: NONE - |<-Map 15 [SIMPLE_EDGE] - | Reduce Output Operator [RS_30] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1150 Data size: 1356710 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_16] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1150 Data size: 1356710 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_188] - | predicate:((p_channel_tv = 'N') and p_promo_sk is not null) (type: boolean) - | Statistics:Num rows: 1150 Data size: 1356710 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_14] - | alias:promotion - | Statistics:Num rows: 2300 Data size: 2713420 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_29] - key expressions:_col3 (type: int) - Map-reduce partition columns:_col3 (type: int) - sort order:+ - Statistics:Num rows: 169400 Data size: 243305506 Basic stats: COMPLETE Column stats: NONE - value expressions:_col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col14 (type: string) - Merge Join Operator [MERGEJOIN_206] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col3","_col5","_col6","_col9","_col10","_col14"] - | Statistics:Num rows: 169400 Data size: 243305506 Basic stats: COMPLETE Column stats: NONE - |<-Map 14 [SIMPLE_EDGE] - | Reduce Output Operator [RS_27] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 154000 Data size: 221186819 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_13] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 154000 Data size: 221186819 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_187] - | predicate:((i_current_price > 50) and i_item_sk is not null) (type: boolean) - | Statistics:Num rows: 154000 Data size: 221186819 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_11] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_26] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 44193 Data size: 49453132 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col14 (type: string) - Merge Join Operator [MERGEJOIN_205] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col3","_col5","_col6","_col9","_col10","_col14"] - | Statistics:Num rows: 44193 Data size: 49453132 Basic stats: COMPLETE Column stats: NONE - |<-Map 13 [SIMPLE_EDGE] - | Reduce Output Operator [RS_24] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_10] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_186] - | predicate:s_store_sk is not null (type: boolean) - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_8] - | alias:store - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_23] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: int), _col3 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_204] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3","_col5","_col6","_col9","_col10"] - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - |<-Map 12 [SIMPLE_EDGE] - | Reduce Output Operator [RS_21] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_7] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_185] - | predicate:(d_date BETWEEN 1998-08-04 AND 1998-09-04 and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_5] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_20] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_201] - | condition map:[{"":"Left Outer Join0 to 1"}] - | keys:{"0":"_col1 (type: int), _col4 (type: int)","1":"_col0 (type: int), _col1 (type: int)"} - | outputColumnNames:["_col0","_col1","_col2","_col3","_col5","_col6","_col9","_col10"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_17] - | key expressions:_col1 (type: int), _col4 (type: int) - | Map-reduce partition columns:_col1 (type: int), _col4 (type: int) - | sort order:++ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col2 (type: int), _col3 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_183] - | predicate:(((ss_sold_date_sk is not null and ss_store_sk is not null) and ss_item_sk is not null) and ss_promo_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col0 (type: int), _col1 (type: int) - Map-reduce partition columns:_col0 (type: int), _col1 (type: int) - sort order:++ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col2 (type: decimal(7,2)), _col3 (type: decimal(7,2)) - Select Operator [SEL_4] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_3] - alias:store_returns - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 10 + File Output Operator [FS_125] + Limit [LIM_124] (rows=100 width=1436) + Number of rows:100 + Select Operator [SEL_123] (rows=419265 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4"] + <-Reducer 9 [SIMPLE_EDGE] + SHUFFLE [RS_122] + Select Operator [SEL_121] (rows=419265 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4"] + Group By Operator [GBY_120] (rows=419265 width=1436) + Output:["_col0","_col1","_col3","_col4","_col5"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Union 8 [SIMPLE_EDGE] + <-Reducer 22 [CONTAINS] + Reduce Output Operator [RS_119] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_118] (rows=838530 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["sum(_col2)","sum(_col3)","sum(_col4)"],keys:_col0, _col1, '0' + Select Operator [SEL_75] (rows=93170 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4"] + Group By Operator [GBY_74] (rows=93170 width=1436) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"],keys:KEY._col0 + <-Reducer 21 [SIMPLE_EDGE] + SHUFFLE [RS_73] + PartitionCols:_col0 + Group By Operator [GBY_72] (rows=186340 width=1436) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(_col1)","sum(_col2)","sum(_col3)"],keys:_col0 + Select Operator [SEL_70] (rows=186340 width=1436) + Output:["_col0","_col1","_col2","_col3"] + Merge Join Operator [MERGEJOIN_211] (rows=186340 width=1436) + Output:["_col5","_col6","_col9","_col10","_col14"],keys:{"0":"_col3","1":"_col0"} + <-Map 27 [SIMPLE_EDGE] + SHUFFLE [RS_68] + PartitionCols:_col0 + Select Operator [SEL_54] (rows=1150 width=1179) + Output:["_col0"] + Filter Operator [FIL_194] (rows=1150 width=1179) + predicate:((p_channel_tv = 'N') and p_promo_sk is not null) + TableScan [TS_52] (rows=2300 width=1179) + default@promotion,promotion,Tbl:COMPLETE,Col:NONE,Output:["p_promo_sk","p_channel_tv"] + <-Reducer 20 [SIMPLE_EDGE] + SHUFFLE [RS_67] + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_210] (rows=169400 width=1436) + Output:["_col3","_col5","_col6","_col9","_col10","_col14"],keys:{"0":"_col2","1":"_col0"} + <-Map 26 [SIMPLE_EDGE] + SHUFFLE [RS_65] + PartitionCols:_col0 + Select Operator [SEL_51] (rows=154000 width=1436) + Output:["_col0"] + Filter Operator [FIL_193] (rows=154000 width=1436) + predicate:((i_current_price > 50) and i_item_sk is not null) + TableScan [TS_49] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_current_price"] + <-Reducer 19 [SIMPLE_EDGE] + SHUFFLE [RS_64] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_209] (rows=50600 width=460) + Output:["_col2","_col3","_col5","_col6","_col9","_col10","_col14"],keys:{"0":"_col1","1":"_col0"} + <-Map 25 [SIMPLE_EDGE] + SHUFFLE [RS_62] + PartitionCols:_col0 + Select Operator [SEL_48] (rows=46000 width=460) + Output:["_col0","_col1"] + Filter Operator [FIL_192] (rows=46000 width=460) + predicate:cp_catalog_page_sk is not null + TableScan [TS_46] (rows=46000 width=460) + default@catalog_page,catalog_page,Tbl:COMPLETE,Col:NONE,Output:["cp_catalog_page_sk","cp_catalog_page_id"] + <-Reducer 18 [SIMPLE_EDGE] + SHUFFLE [RS_61] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_208] (rows=40176 width=1119) + Output:["_col1","_col2","_col3","_col5","_col6","_col9","_col10"],keys:{"0":"_col0","1":"_col0"} + <-Map 24 [SIMPLE_EDGE] + SHUFFLE [RS_59] + PartitionCols:_col0 + Select Operator [SEL_45] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_191] (rows=36524 width=1119) + predicate:(d_date BETWEEN 1998-08-04 AND 1998-09-04 and d_date_sk is not null) + TableScan [TS_43] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date"] + <-Reducer 17 [SIMPLE_EDGE] + SHUFFLE [RS_58] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_202] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col5","_col6","_col9","_col10"],keys:{"0":"_col2, _col4","1":"_col0, _col1"} + <-Map 16 [SIMPLE_EDGE] + SHUFFLE [RS_55] + PartitionCols:_col2, _col4 + Select Operator [SEL_40] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + Filter Operator [FIL_189] (rows=1 width=0) + predicate:(((cs_sold_date_sk is not null and cs_catalog_page_sk is not null) and cs_item_sk is not null) and cs_promo_sk is not null) + TableScan [TS_38] (rows=1 width=0) + default@catalog_sales,catalog_sales,Tbl:PARTIAL,Col:NONE,Output:["cs_sold_date_sk","cs_catalog_page_sk","cs_item_sk","cs_promo_sk","cs_order_number","cs_ext_sales_price","cs_net_profit"] + <-Map 23 [SIMPLE_EDGE] + SHUFFLE [RS_56] + PartitionCols:_col0, _col1 + Select Operator [SEL_42] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + TableScan [TS_41] (rows=1 width=0) + default@catalog_returns,catalog_returns,Tbl:PARTIAL,Col:NONE,Output:["cr_item_sk","cr_order_number","cr_return_amount","cr_net_loss"] + <-Reducer 34 [CONTAINS] + Reduce Output Operator [RS_119] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_118] (rows=838530 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["sum(_col2)","sum(_col3)","sum(_col4)"],keys:_col0, _col1, '0' + Select Operator [SEL_115] (rows=93170 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4"] + Group By Operator [GBY_114] (rows=93170 width=1436) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"],keys:KEY._col0 + <-Reducer 33 [SIMPLE_EDGE] + SHUFFLE [RS_113] + PartitionCols:_col0 + Group By Operator [GBY_112] (rows=186340 width=1436) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(_col1)","sum(_col2)","sum(_col3)"],keys:_col0 + Select Operator [SEL_110] (rows=186340 width=1436) + Output:["_col0","_col1","_col2","_col3"] + Merge Join Operator [MERGEJOIN_215] (rows=186340 width=1436) + Output:["_col5","_col6","_col9","_col10","_col14"],keys:{"0":"_col3","1":"_col0"} + <-Map 39 [SIMPLE_EDGE] + SHUFFLE [RS_108] + PartitionCols:_col0 + Select Operator [SEL_94] (rows=1150 width=1179) + Output:["_col0"] + Filter Operator [FIL_200] (rows=1150 width=1179) + predicate:((p_channel_tv = 'N') and p_promo_sk is not null) + TableScan [TS_92] (rows=2300 width=1179) + default@promotion,promotion,Tbl:COMPLETE,Col:NONE,Output:["p_promo_sk","p_channel_tv"] + <-Reducer 32 [SIMPLE_EDGE] + SHUFFLE [RS_107] + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_214] (rows=169400 width=1436) + Output:["_col3","_col5","_col6","_col9","_col10","_col14"],keys:{"0":"_col1","1":"_col0"} + <-Map 38 [SIMPLE_EDGE] + SHUFFLE [RS_105] + PartitionCols:_col0 + Select Operator [SEL_91] (rows=154000 width=1436) + Output:["_col0"] + Filter Operator [FIL_199] (rows=154000 width=1436) + predicate:((i_current_price > 50) and i_item_sk is not null) + TableScan [TS_89] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_current_price"] + <-Reducer 31 [SIMPLE_EDGE] + SHUFFLE [RS_104] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_213] (rows=44193 width=1119) + Output:["_col1","_col3","_col5","_col6","_col9","_col10","_col14"],keys:{"0":"_col2","1":"_col0"} + <-Map 37 [SIMPLE_EDGE] + SHUFFLE [RS_102] + PartitionCols:_col0 + Select Operator [SEL_88] (rows=84 width=1850) + Output:["_col0","_col1"] + Filter Operator [FIL_198] (rows=84 width=1850) + predicate:web_site_sk is not null + TableScan [TS_86] (rows=84 width=1850) + default@web_site,web_site,Tbl:COMPLETE,Col:NONE,Output:["web_site_sk","web_site_id"] + <-Reducer 30 [SIMPLE_EDGE] + SHUFFLE [RS_101] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_212] (rows=40176 width=1119) + Output:["_col1","_col2","_col3","_col5","_col6","_col9","_col10"],keys:{"0":"_col0","1":"_col0"} + <-Map 36 [SIMPLE_EDGE] + SHUFFLE [RS_99] + PartitionCols:_col0 + Select Operator [SEL_85] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_197] (rows=36524 width=1119) + predicate:(d_date BETWEEN 1998-08-04 AND 1998-09-04 and d_date_sk is not null) + TableScan [TS_83] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date"] + <-Reducer 29 [SIMPLE_EDGE] + SHUFFLE [RS_98] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_203] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col5","_col6","_col9","_col10"],keys:{"0":"_col1, _col4","1":"_col0, _col1"} + <-Map 28 [SIMPLE_EDGE] + SHUFFLE [RS_95] + PartitionCols:_col1, _col4 + Select Operator [SEL_80] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + Filter Operator [FIL_195] (rows=1 width=0) + predicate:(((ws_sold_date_sk is not null and ws_web_site_sk is not null) and ws_item_sk is not null) and ws_promo_sk is not null) + TableScan [TS_78] (rows=1 width=0) + default@web_sales,web_sales,Tbl:PARTIAL,Col:NONE,Output:["ws_sold_date_sk","ws_item_sk","ws_web_site_sk","ws_promo_sk","ws_order_number","ws_ext_sales_price","ws_net_profit"] + <-Map 35 [SIMPLE_EDGE] + SHUFFLE [RS_96] + PartitionCols:_col0, _col1 + Select Operator [SEL_82] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + TableScan [TS_81] (rows=1 width=0) + default@web_returns,web_returns,Tbl:PARTIAL,Col:NONE,Output:["wr_item_sk","wr_order_number","wr_return_amt","wr_net_loss"] + <-Reducer 7 [CONTAINS] + Reduce Output Operator [RS_119] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_118] (rows=838530 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["sum(_col2)","sum(_col3)","sum(_col4)"],keys:_col0, _col1, '0' + Select Operator [SEL_37] (rows=93170 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4"] + Group By Operator [GBY_36] (rows=93170 width=1436) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"],keys:KEY._col0 + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_35] + PartitionCols:_col0 + Group By Operator [GBY_34] (rows=186340 width=1436) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(_col1)","sum(_col2)","sum(_col3)"],keys:_col0 + Select Operator [SEL_32] (rows=186340 width=1436) + Output:["_col0","_col1","_col2","_col3"] + Merge Join Operator [MERGEJOIN_207] (rows=186340 width=1436) + Output:["_col5","_col6","_col9","_col10","_col14"],keys:{"0":"_col3","1":"_col0"} + <-Map 15 [SIMPLE_EDGE] + SHUFFLE [RS_30] + PartitionCols:_col0 + Select Operator [SEL_16] (rows=1150 width=1179) + Output:["_col0"] + Filter Operator [FIL_188] (rows=1150 width=1179) + predicate:((p_channel_tv = 'N') and p_promo_sk is not null) + TableScan [TS_14] (rows=2300 width=1179) + default@promotion,promotion,Tbl:COMPLETE,Col:NONE,Output:["p_promo_sk","p_channel_tv"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_29] + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_206] (rows=169400 width=1436) + Output:["_col3","_col5","_col6","_col9","_col10","_col14"],keys:{"0":"_col1","1":"_col0"} + <-Map 14 [SIMPLE_EDGE] + SHUFFLE [RS_27] + PartitionCols:_col0 + Select Operator [SEL_13] (rows=154000 width=1436) + Output:["_col0"] + Filter Operator [FIL_187] (rows=154000 width=1436) + predicate:((i_current_price > 50) and i_item_sk is not null) + TableScan [TS_11] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_current_price"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_26] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_205] (rows=44193 width=1119) + Output:["_col1","_col3","_col5","_col6","_col9","_col10","_col14"],keys:{"0":"_col2","1":"_col0"} + <-Map 13 [SIMPLE_EDGE] + SHUFFLE [RS_24] + PartitionCols:_col0 + Select Operator [SEL_10] (rows=1704 width=1910) + Output:["_col0","_col1"] + Filter Operator [FIL_186] (rows=1704 width=1910) + predicate:s_store_sk is not null + TableScan [TS_8] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_store_id"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_23] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_204] (rows=40176 width=1119) + Output:["_col1","_col2","_col3","_col5","_col6","_col9","_col10"],keys:{"0":"_col0","1":"_col0"} + <-Map 12 [SIMPLE_EDGE] + SHUFFLE [RS_21] + PartitionCols:_col0 + Select Operator [SEL_7] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_185] (rows=36524 width=1119) + predicate:(d_date BETWEEN 1998-08-04 AND 1998-09-04 and d_date_sk is not null) + TableScan [TS_5] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_20] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_201] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col5","_col6","_col9","_col10"],keys:{"0":"_col1, _col4","1":"_col0, _col1"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_17] + PartitionCols:_col1, _col4 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + Filter Operator [FIL_183] (rows=1 width=0) + predicate:(((ss_sold_date_sk is not null and ss_store_sk is not null) and ss_item_sk is not null) and ss_promo_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_store_sk","ss_promo_sk","ss_ticket_number","ss_ext_sales_price","ss_net_profit"] + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col0, _col1 + Select Operator [SEL_4] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + TableScan [TS_3] (rows=1 width=0) + default@store_returns,store_returns,Tbl:PARTIAL,Col:NONE,Output:["sr_item_sk","sr_ticket_number","sr_return_amt","sr_net_loss"] diff --git a/ql/src/test/results/clientpositive/perf/query82.q.out b/ql/src/test/results/clientpositive/perf/query82.q.out index 654a772..91d17f2 100644 --- a/ql/src/test/results/clientpositive/perf/query82.q.out +++ b/ql/src/test/results/clientpositive/perf/query82.q.out @@ -11,117 +11,65 @@ Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 5 - File Output Operator [FS_27] - compressed:false - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_26] - Number of rows:100 - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_25] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_24] - key expressions:_col0 (type: string) - sort order:+ - Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string), _col2 (type: decimal(7,2)) - Group By Operator [GBY_22] - | keys:KEY._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: decimal(7,2)) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_21] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: decimal(7,2)) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: decimal(7,2)) - sort order:+++ - Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_20] - keys:_col1 (type: string), _col2 (type: string), _col3 (type: decimal(7,2)) - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_43] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col5 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3"] - | Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - | Reduce Output Operator [RS_17] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_8] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_40] - | predicate:(d_date BETWEEN '2002-05-30' AND '2002-07-30' and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_16] - key expressions:_col5 (type: int) - Map-reduce partition columns:_col5 (type: int) - sort order:+ - Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string), _col2 (type: string), _col3 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_42] - | condition map:[{"":"Inner Join 0 to 1"},{"":"Inner Join 0 to 2"}] - | keys:{"0":"_col0 (type: int)","1":"_col1 (type: int)","2":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3","_col5"] - | Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_12] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 115500 Data size: 165890114 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string), _col3 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 115500 Data size: 165890114 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_38] - | predicate:(((i_manufact_id) IN (437, 129, 727, 663) and i_current_price BETWEEN 30 AND 60) and i_item_sk is not null) (type: boolean) - | Statistics:Num rows: 115500 Data size: 165890114 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Map 6 [SIMPLE_EDGE] - | Reduce Output Operator [RS_13] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int) - | Select Operator [SEL_5] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_39] - | predicate:((inv_quantity_on_hand BETWEEN 100 AND 500 and inv_item_sk is not null) and inv_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_3] - | alias:inventory - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_14] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Select Operator [SEL_11] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_41] - predicate:ss_item_sk is not null (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_9] - alias:store_sales - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 5 + File Output Operator [FS_27] + Limit [LIM_26] (rows=100 width=1436) + Number of rows:100 + Select Operator [SEL_25] (rows=139755 width=1436) + Output:["_col0","_col1","_col2"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_24] + Group By Operator [GBY_22] (rows=139755 width=1436) + Output:["_col0","_col1","_col2"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_21] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_20] (rows=279510 width=1436) + Output:["_col0","_col1","_col2"],keys:_col1, _col2, _col3 + Merge Join Operator [MERGEJOIN_43] (rows=279510 width=1436) + Output:["_col1","_col2","_col3"],keys:{"0":"_col5","1":"_col0"} + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_17] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_40] (rows=36524 width=1119) + predicate:(d_date BETWEEN '2002-05-30' AND '2002-07-30' and d_date_sk is not null) + TableScan [TS_6] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col5 + Merge Join Operator [MERGEJOIN_42] (rows=254100 width=1436) + Output:["_col1","_col2","_col3","_col5"],keys:{"0":"_col0","1":"_col1","2":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=115500 width=1436) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_38] (rows=115500 width=1436) + predicate:(((i_manufact_id) IN (437, 129, 727, 663) and i_current_price BETWEEN 30 AND 60) and i_item_sk is not null) + TableScan [TS_0] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id","i_item_desc","i_current_price","i_manufact_id"] + <-Map 6 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col1 + Select Operator [SEL_5] (rows=1 width=0) + Output:["_col0","_col1"] + Filter Operator [FIL_39] (rows=1 width=0) + predicate:((inv_quantity_on_hand BETWEEN 100 AND 500 and inv_item_sk is not null) and inv_date_sk is not null) + TableScan [TS_3] (rows=1 width=0) + default@inventory,inventory,Tbl:PARTIAL,Col:NONE,Output:["inv_date_sk","inv_item_sk","inv_quantity_on_hand"] + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_14] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=1 width=0) + Output:["_col0"] + Filter Operator [FIL_41] (rows=1 width=0) + predicate:ss_item_sk is not null + TableScan [TS_9] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_item_sk"] diff --git a/ql/src/test/results/clientpositive/perf/query84.q.out b/ql/src/test/results/clientpositive/perf/query84.q.out index e522f23..597aeb8 100644 --- a/ql/src/test/results/clientpositive/perf/query84.q.out +++ b/ql/src/test/results/clientpositive/perf/query84.q.out @@ -12,160 +12,88 @@ Reducer 5 <- Map 10 (SIMPLE_EDGE), Reducer 4 (SIMPLE_EDGE) Reducer 6 <- Reducer 5 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 6 - File Output Operator [FS_35] - compressed:false - Statistics:Num rows: 100 Data size: 86000 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_34] - Number of rows:100 - Statistics:Num rows: 100 Data size: 86000 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_33] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 234256017 Data size: 201464909002 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_32] - key expressions:_col0 (type: string) - sort order:+ - Statistics:Num rows: 234256017 Data size: 201464909002 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string) - Select Operator [SEL_31] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 234256017 Data size: 201464909002 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_66] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col11 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col4","_col5"] - | Statistics:Num rows: 234256017 Data size: 201464909002 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_29] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 2 Data size: 24 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_14] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 2 Data size: 24 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_61] - | predicate:(((ib_upper_bound <= 82287) and (ib_lower_bound >= 32287)) and ib_income_band_sk is not null) (type: boolean) - | Statistics:Num rows: 2 Data size: 24 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_12] - | alias:income_band - | Statistics:Num rows: 20 Data size: 240 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_28] - key expressions:_col11 (type: int) - Map-reduce partition columns:_col11 (type: int) - sort order:+ - Statistics:Num rows: 212960011 Data size: 183149913305 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: string), _col4 (type: string), _col5 (type: string) - Merge Join Operator [MERGEJOIN_65] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col4","_col5","_col11"] - | Statistics:Num rows: 212960011 Data size: 183149913305 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_26] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int) - | Select Operator [SEL_11] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_60] - | predicate:(hd_demo_sk is not null and hd_income_band_sk is not null) (type: boolean) - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:household_demographics - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_25] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 193600006 Data size: 166499917578 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: string), _col4 (type: string), _col5 (type: string) - Merge Join Operator [MERGEJOIN_64] - | condition map:[{"":"Inner Join 0 to 1"},{"":"Inner Join 1 to 2"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)","2":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2","_col4","_col5"] - | Statistics:Num rows: 193600006 Data size: 166499917578 Basic stats: COMPLETE Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_23] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Select Operator [SEL_17] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_62] - | predicate:sr_cdemo_sk is not null (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_15] - | alias:store_returns - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - | Reduce Output Operator [RS_22] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_8] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_59] - | predicate:cd_demo_sk is not null (type: boolean) - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:customer_demographics - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_21] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: string), _col2 (type: int), _col4 (type: string), _col5 (type: string) - Merge Join Operator [MERGEJOIN_63] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col1","_col2","_col4","_col5"] - | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_18] - | key expressions:_col3 (type: int) - | Map-reduce partition columns:_col3 (type: int) - | sort order:+ - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: string), _col1 (type: int), _col2 (type: int), _col4 (type: string), _col5 (type: string) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_57] - | predicate:((c_current_addr_sk is not null and c_current_cdemo_sk is not null) and c_current_hdemo_sk is not null) (type: boolean) - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:customer - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_19] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_58] - predicate:((ca_city = 'Hopewell') and ca_address_sk is not null) (type: boolean) - Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:customer_address - Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 6 + File Output Operator [FS_35] + Limit [LIM_34] (rows=100 width=860) + Number of rows:100 + Select Operator [SEL_33] (rows=234256017 width=860) + Output:["_col0","_col1"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_32] + Select Operator [SEL_31] (rows=234256017 width=860) + Output:["_col0","_col1"] + Merge Join Operator [MERGEJOIN_66] (rows=234256017 width=860) + Output:["_col0","_col4","_col5"],keys:{"0":"_col11","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_29] + PartitionCols:_col0 + Select Operator [SEL_14] (rows=2 width=12) + Output:["_col0"] + Filter Operator [FIL_61] (rows=2 width=12) + predicate:(((ib_upper_bound <= 82287) and (ib_lower_bound >= 32287)) and ib_income_band_sk is not null) + TableScan [TS_12] (rows=20 width=12) + default@income_band,income_band,Tbl:COMPLETE,Col:NONE,Output:["ib_income_band_sk","ib_lower_bound","ib_upper_bound"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_28] + PartitionCols:_col11 + Merge Join Operator [MERGEJOIN_65] (rows=212960011 width=860) + Output:["_col0","_col4","_col5","_col11"],keys:{"0":"_col2","1":"_col0"} + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_26] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=7200 width=107) + Output:["_col0","_col1"] + Filter Operator [FIL_60] (rows=7200 width=107) + predicate:(hd_demo_sk is not null and hd_income_band_sk is not null) + TableScan [TS_9] (rows=7200 width=107) + default@household_demographics,household_demographics,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_income_band_sk"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_64] (rows=193600006 width=860) + Output:["_col0","_col2","_col4","_col5"],keys:{"0":"_col1","1":"_col0","2":"_col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_23] + PartitionCols:_col0 + Select Operator [SEL_17] (rows=1 width=0) + Output:["_col0"] + Filter Operator [FIL_62] (rows=1 width=0) + predicate:sr_cdemo_sk is not null + TableScan [TS_15] (rows=1 width=0) + default@store_returns,store_returns,Tbl:PARTIAL,Col:NONE,Output:["sr_cdemo_sk"] + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_22] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=19800 width=362) + Output:["_col0"] + Filter Operator [FIL_59] (rows=19800 width=362) + predicate:cd_demo_sk is not null + TableScan [TS_6] (rows=19800 width=362) + default@customer_demographics,customer_demographics,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_21] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_63] (rows=88000001 width=860) + Output:["_col0","_col1","_col2","_col4","_col5"],keys:{"0":"_col3","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col3 + Select Operator [SEL_2] (rows=80000000 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Filter Operator [FIL_57] (rows=80000000 width=860) + predicate:((c_current_addr_sk is not null and c_current_cdemo_sk is not null) and c_current_hdemo_sk is not null) + TableScan [TS_0] (rows=80000000 width=860) + default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_id","c_current_cdemo_sk","c_current_hdemo_sk","c_current_addr_sk","c_first_name","c_last_name"] + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=20000000 width=1014) + Output:["_col0"] + Filter Operator [FIL_58] (rows=20000000 width=1014) + predicate:((ca_city = 'Hopewell') and ca_address_sk is not null) + TableScan [TS_3] (rows=40000000 width=1014) + default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_city"] diff --git a/ql/src/test/results/clientpositive/perf/query85.q.out b/ql/src/test/results/clientpositive/perf/query85.q.out index 54061ce..a923aea 100644 --- a/ql/src/test/results/clientpositive/perf/query85.q.out +++ b/ql/src/test/results/clientpositive/perf/query85.q.out @@ -16,260 +16,138 @@ Reducer 8 <- Map 17 (SIMPLE_EDGE), Reducer 7 (SIMPLE_EDGE) Reducer 9 <- Reducer 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 10 - File Output Operator [FS_57] - compressed:false - Statistics:Num rows: 100 Data size: 101400 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_56] - Number of rows:100 - Statistics:Num rows: 100 Data size: 101400 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_55] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 9982500 Data size: 10131039080 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 9 [SIMPLE_EDGE] - Reduce Output Operator [RS_54] - key expressions:_col0 (type: string), _col1 (type: double), _col2 (type: decimal(11,6)), _col3 (type: decimal(11,6)) - sort order:++++ - Statistics:Num rows: 9982500 Data size: 10131039080 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_53] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 9982500 Data size: 10131039080 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_52] - | aggregations:["avg(VALUE._col0)","avg(VALUE._col1)","avg(VALUE._col2)"] - | keys:KEY._col0 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 9982500 Data size: 10131039080 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_51] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 19965000 Data size: 20262078161 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: struct), _col2 (type: struct), _col3 (type: struct) - Group By Operator [GBY_50] - aggregations:["avg(_col4)","avg(_col14)","avg(_col13)"] - keys:_col28 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 19965000 Data size: 20262078161 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_49] - outputColumnNames:["_col28","_col4","_col14","_col13"] - Statistics:Num rows: 19965000 Data size: 20262078161 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_107] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col11 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col4","_col13","_col14","_col28"] - | Statistics:Num rows: 19965000 Data size: 20262078161 Basic stats: COMPLETE Column stats: NONE - |<-Map 17 [SIMPLE_EDGE] - | Reduce Output Operator [RS_47] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 72 Data size: 14400 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_42] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 72 Data size: 14400 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_100] - | predicate:r_reason_sk is not null (type: boolean) - | Statistics:Num rows: 72 Data size: 14400 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_40] - | alias:reason - | Statistics:Num rows: 72 Data size: 14400 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_46] - key expressions:_col11 (type: int) - Map-reduce partition columns:_col11 (type: int) - sort order:+ - Statistics:Num rows: 18150000 Data size: 18420070657 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: int), _col13 (type: decimal(7,2)), _col14 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_106] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col4","_col11","_col13","_col14"] - | Statistics:Num rows: 18150000 Data size: 18420070657 Basic stats: COMPLETE Column stats: NONE - |<-Map 16 [SIMPLE_EDGE] - | Reduce Output Operator [RS_44] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_39] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_99] - | predicate:((d_year = 1998) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_37] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_43] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 16500000 Data size: 16745518417 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: int), _col11 (type: int), _col13 (type: decimal(7,2)), _col14 (type: decimal(7,2)) - Select Operator [SEL_36] - outputColumnNames:["_col0","_col11","_col13","_col14","_col4"] - Statistics:Num rows: 16500000 Data size: 16745518417 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_35] - predicate:(((_col23) IN ('KY', 'GA', 'NM') and _col6 BETWEEN 100 AND 200) or ((_col23) IN ('MT', 'OR', 'IN') and _col6 BETWEEN 150 AND 300) or ((_col23) IN ('WI', 'MO', 'WV') and _col6 BETWEEN 50 AND 250)) (type: boolean) - Statistics:Num rows: 16500000 Data size: 16745518417 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_105] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col9 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col4","_col6","_col11","_col13","_col14","_col23"] - | Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - |<-Map 15 [SIMPLE_EDGE] - | Reduce Output Operator [RS_33] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_28] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_98] - | predicate:((((ca_state) IN ('KY', 'GA', 'NM') or (ca_state) IN ('MT', 'OR', 'IN') or (ca_state) IN ('WI', 'MO', 'WV')) and (ca_country = 'United States')) and ca_address_sk is not null) (type: boolean) - | Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_26] - | alias:customer_address - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_32] - key expressions:_col9 (type: int) - Map-reduce partition columns:_col9 (type: int) - sort order:+ - Statistics:Num rows: 21780 Data size: 7888165 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col4 (type: int), _col6 (type: decimal(7,2)), _col11 (type: int), _col13 (type: decimal(7,2)), _col14 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_104] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col10 (type: int), _col17 (type: string), _col18 (type: string)","1":"_col0 (type: int), _col1 (type: string), _col2 (type: string)"} - | outputColumnNames:["_col0","_col4","_col6","_col9","_col11","_col13","_col14"] - | Statistics:Num rows: 21780 Data size: 7888165 Basic stats: COMPLETE Column stats: NONE - |<-Map 14 [SIMPLE_EDGE] - | Reduce Output Operator [RS_30] - | key expressions:_col0 (type: int), _col1 (type: string), _col2 (type: string) - | Map-reduce partition columns:_col0 (type: int), _col1 (type: string), _col2 (type: string) - | sort order:+++ - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_25] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_97] - | predicate:((((((cd_education_status = '4 yr Degree') or (cd_education_status = 'Primary') or (cd_education_status = 'Advanced Degree')) and cd_education_status is not null) and ((cd_marital_status = 'M') or (cd_marital_status = 'D') or (cd_marital_status = 'U'))) and cd_marital_status is not null) and cd_demo_sk is not null) (type: boolean) - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_23] - | alias:cd1 - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_29] - key expressions:_col10 (type: int), _col17 (type: string), _col18 (type: string) - Map-reduce partition columns:_col10 (type: int), _col17 (type: string), _col18 (type: string) - sort order:+++ - Statistics:Num rows: 8166 Data size: 2957518 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col4 (type: int), _col6 (type: decimal(7,2)), _col9 (type: int), _col11 (type: int), _col13 (type: decimal(7,2)), _col14 (type: decimal(7,2)) - Select Operator [SEL_22] - outputColumnNames:["_col0","_col10","_col11","_col13","_col14","_col17","_col18","_col4","_col6","_col9"] - Statistics:Num rows: 8166 Data size: 2957518 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_21] - predicate:(((_col17 = 'M') and (_col18 = '4 yr Degree') and _col5 BETWEEN 100.0 AND 150.0) or ((_col17 = 'D') and (_col18 = 'Primary') and _col5 BETWEEN 50.0 AND 100.0) or ((_col17 = 'U') and (_col18 = 'Advanced Degree') and _col5 BETWEEN 150.0 AND 200.0)) (type: boolean) - Statistics:Num rows: 8166 Data size: 2957518 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_103] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col8 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col4","_col5","_col6","_col9","_col10","_col11","_col13","_col14","_col17","_col18"] - | Statistics:Num rows: 21780 Data size: 7888165 Basic stats: COMPLETE Column stats: NONE - |<-Map 13 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string) - | Select Operator [SEL_11] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_96] - | predicate:((((((cd_marital_status = 'M') or (cd_marital_status = 'D') or (cd_marital_status = 'U')) and ((cd_education_status = '4 yr Degree') or (cd_education_status = 'Primary') or (cd_education_status = 'Advanced Degree'))) and cd_demo_sk is not null) and cd_education_status is not null) and cd_marital_status is not null) (type: boolean) - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:cd1 - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col8 (type: int) - Map-reduce partition columns:_col8 (type: int) - sort order:+ - Statistics:Num rows: 5062 Data size: 2965795 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col9 (type: int), _col10 (type: int), _col11 (type: int), _col13 (type: decimal(7,2)), _col14 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_102] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col4","_col5","_col6","_col8","_col9","_col10","_col11","_col13","_col14"] - | Statistics:Num rows: 5062 Data size: 2965795 Basic stats: COMPLETE Column stats: NONE - |<-Map 12 [SIMPLE_EDGE] - | Reduce Output Operator [RS_16] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 4602 Data size: 2696178 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_8] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 4602 Data size: 2696178 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_95] - | predicate:wp_web_page_sk is not null (type: boolean) - | Statistics:Num rows: 4602 Data size: 2696178 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:web_page - | Statistics:Num rows: 4602 Data size: 2696178 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_15] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col0 (type: int), _col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col8 (type: int), _col9 (type: int), _col10 (type: int), _col11 (type: int), _col13 (type: decimal(7,2)), _col14 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_101] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int), _col3 (type: int)","1":"_col0 (type: int), _col5 (type: int)"} - | outputColumnNames:["_col0","_col2","_col4","_col5","_col6","_col8","_col9","_col10","_col11","_col13","_col14"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_12] - | key expressions:_col1 (type: int), _col3 (type: int) - | Map-reduce partition columns:_col1 (type: int), _col3 (type: int) - | sort order:++ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col2 (type: int), _col4 (type: int), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_93] - | predicate:(((((ws_item_sk is not null and (ws_sales_price BETWEEN 100.0 AND 150.0 or ws_sales_price BETWEEN 50.0 AND 100.0 or ws_sales_price BETWEEN 150.0 AND 200.0)) and ws_order_number is not null) and (ws_net_profit BETWEEN 100 AND 200 or ws_net_profit BETWEEN 150 AND 300 or ws_net_profit BETWEEN 50 AND 250)) and ws_web_page_sk is not null) and ws_sold_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:web_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - Reduce Output Operator [RS_13] - key expressions:_col0 (type: int), _col5 (type: int) - Map-reduce partition columns:_col0 (type: int), _col5 (type: int) - sort order:++ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_94] - predicate:(((((wr_order_number is not null and wr_item_sk is not null) and wr_refunded_cdemo_sk is not null) and wr_returning_cdemo_sk is not null) and wr_refunded_addr_sk is not null) and wr_reason_sk is not null) (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_3] - alias:web_returns - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 10 + File Output Operator [FS_57] + Limit [LIM_56] (rows=100 width=1014) + Number of rows:100 + Select Operator [SEL_55] (rows=9982500 width=1014) + Output:["_col0","_col1","_col2","_col3"] + <-Reducer 9 [SIMPLE_EDGE] + SHUFFLE [RS_54] + Select Operator [SEL_53] (rows=9982500 width=1014) + Output:["_col0","_col1","_col2","_col3"] + Group By Operator [GBY_52] (rows=9982500 width=1014) + Output:["_col0","_col1","_col2","_col3"],aggregations:["avg(VALUE._col0)","avg(VALUE._col1)","avg(VALUE._col2)"],keys:KEY._col0 + <-Reducer 8 [SIMPLE_EDGE] + SHUFFLE [RS_51] + PartitionCols:_col0 + Group By Operator [GBY_50] (rows=19965000 width=1014) + Output:["_col0","_col1","_col2","_col3"],aggregations:["avg(_col4)","avg(_col14)","avg(_col13)"],keys:_col28 + Select Operator [SEL_49] (rows=19965000 width=1014) + Output:["_col28","_col4","_col14","_col13"] + Merge Join Operator [MERGEJOIN_107] (rows=19965000 width=1014) + Output:["_col4","_col13","_col14","_col28"],keys:{"0":"_col11","1":"_col0"} + <-Map 17 [SIMPLE_EDGE] + SHUFFLE [RS_47] + PartitionCols:_col0 + Select Operator [SEL_42] (rows=72 width=200) + Output:["_col0","_col1"] + Filter Operator [FIL_100] (rows=72 width=200) + predicate:r_reason_sk is not null + TableScan [TS_40] (rows=72 width=200) + default@reason,reason,Tbl:COMPLETE,Col:NONE,Output:["r_reason_sk","r_reason_desc"] + <-Reducer 7 [SIMPLE_EDGE] + SHUFFLE [RS_46] + PartitionCols:_col11 + Merge Join Operator [MERGEJOIN_106] (rows=18150000 width=1014) + Output:["_col4","_col11","_col13","_col14"],keys:{"0":"_col0","1":"_col0"} + <-Map 16 [SIMPLE_EDGE] + SHUFFLE [RS_44] + PartitionCols:_col0 + Select Operator [SEL_39] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_99] (rows=36524 width=1119) + predicate:((d_year = 1998) and d_date_sk is not null) + TableScan [TS_37] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_43] + PartitionCols:_col0 + Select Operator [SEL_36] (rows=16500000 width=1014) + Output:["_col0","_col11","_col13","_col14","_col4"] + Filter Operator [FIL_35] (rows=16500000 width=1014) + predicate:(((_col23) IN ('KY', 'GA', 'NM') and _col6 BETWEEN 100 AND 200) or ((_col23) IN ('MT', 'OR', 'IN') and _col6 BETWEEN 150 AND 300) or ((_col23) IN ('WI', 'MO', 'WV') and _col6 BETWEEN 50 AND 250)) + Merge Join Operator [MERGEJOIN_105] (rows=22000000 width=1014) + Output:["_col0","_col4","_col6","_col11","_col13","_col14","_col23"],keys:{"0":"_col9","1":"_col0"} + <-Map 15 [SIMPLE_EDGE] + SHUFFLE [RS_33] + PartitionCols:_col0 + Select Operator [SEL_28] (rows=20000000 width=1014) + Output:["_col0","_col1"] + Filter Operator [FIL_98] (rows=20000000 width=1014) + predicate:((((ca_state) IN ('KY', 'GA', 'NM') or (ca_state) IN ('MT', 'OR', 'IN') or (ca_state) IN ('WI', 'MO', 'WV')) and (ca_country = 'United States')) and ca_address_sk is not null) + TableScan [TS_26] (rows=40000000 width=1014) + default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_state","ca_country"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_32] + PartitionCols:_col9 + Merge Join Operator [MERGEJOIN_104] (rows=21780 width=362) + Output:["_col0","_col4","_col6","_col9","_col11","_col13","_col14"],keys:{"0":"_col10, _col17, _col18","1":"_col0, _col1, _col2"} + <-Map 14 [SIMPLE_EDGE] + SHUFFLE [RS_30] + PartitionCols:_col0, _col1, _col2 + Select Operator [SEL_25] (rows=19800 width=362) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_97] (rows=19800 width=362) + predicate:((((((cd_education_status = '4 yr Degree') or (cd_education_status = 'Primary') or (cd_education_status = 'Advanced Degree')) and cd_education_status is not null) and ((cd_marital_status = 'M') or (cd_marital_status = 'D') or (cd_marital_status = 'U'))) and cd_marital_status is not null) and cd_demo_sk is not null) + TableScan [TS_23] (rows=19800 width=362) + default@customer_demographics,cd1,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_marital_status","cd_education_status"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_29] + PartitionCols:_col10, _col17, _col18 + Select Operator [SEL_22] (rows=8166 width=362) + Output:["_col0","_col10","_col11","_col13","_col14","_col17","_col18","_col4","_col6","_col9"] + Filter Operator [FIL_21] (rows=8166 width=362) + predicate:(((_col17 = 'M') and (_col18 = '4 yr Degree') and _col5 BETWEEN 100.0 AND 150.0) or ((_col17 = 'D') and (_col18 = 'Primary') and _col5 BETWEEN 50.0 AND 100.0) or ((_col17 = 'U') and (_col18 = 'Advanced Degree') and _col5 BETWEEN 150.0 AND 200.0)) + Merge Join Operator [MERGEJOIN_103] (rows=21780 width=362) + Output:["_col0","_col4","_col5","_col6","_col9","_col10","_col11","_col13","_col14","_col17","_col18"],keys:{"0":"_col8","1":"_col0"} + <-Map 13 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=19800 width=362) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_96] (rows=19800 width=362) + predicate:((((((cd_marital_status = 'M') or (cd_marital_status = 'D') or (cd_marital_status = 'U')) and ((cd_education_status = '4 yr Degree') or (cd_education_status = 'Primary') or (cd_education_status = 'Advanced Degree'))) and cd_demo_sk is not null) and cd_education_status is not null) and cd_marital_status is not null) + TableScan [TS_9] (rows=19800 width=362) + default@customer_demographics,cd1,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_marital_status","cd_education_status"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col8 + Merge Join Operator [MERGEJOIN_102] (rows=5062 width=585) + Output:["_col0","_col4","_col5","_col6","_col8","_col9","_col10","_col11","_col13","_col14"],keys:{"0":"_col2","1":"_col0"} + <-Map 12 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=4602 width=585) + Output:["_col0"] + Filter Operator [FIL_95] (rows=4602 width=585) + predicate:wp_web_page_sk is not null + TableScan [TS_6] (rows=4602 width=585) + default@web_page,web_page,Tbl:COMPLETE,Col:NONE,Output:["wp_web_page_sk"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_101] (rows=1 width=0) + Output:["_col0","_col2","_col4","_col5","_col6","_col8","_col9","_col10","_col11","_col13","_col14"],keys:{"0":"_col1, _col3","1":"_col0, _col5"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col1, _col3 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + Filter Operator [FIL_93] (rows=1 width=0) + predicate:(((((ws_item_sk is not null and (ws_sales_price BETWEEN 100.0 AND 150.0 or ws_sales_price BETWEEN 50.0 AND 100.0 or ws_sales_price BETWEEN 150.0 AND 200.0)) and ws_order_number is not null) and (ws_net_profit BETWEEN 100 AND 200 or ws_net_profit BETWEEN 150 AND 300 or ws_net_profit BETWEEN 50 AND 250)) and ws_web_page_sk is not null) and ws_sold_date_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@web_sales,web_sales,Tbl:PARTIAL,Col:NONE,Output:["ws_sold_date_sk","ws_item_sk","ws_web_page_sk","ws_order_number","ws_quantity","ws_sales_price","ws_net_profit"] + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0, _col5 + Select Operator [SEL_5] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] + Filter Operator [FIL_94] (rows=1 width=0) + predicate:(((((wr_order_number is not null and wr_item_sk is not null) and wr_refunded_cdemo_sk is not null) and wr_returning_cdemo_sk is not null) and wr_refunded_addr_sk is not null) and wr_reason_sk is not null) + TableScan [TS_3] (rows=1 width=0) + default@web_returns,web_returns,Tbl:PARTIAL,Col:NONE,Output:["wr_item_sk","wr_refunded_cdemo_sk","wr_refunded_addr_sk","wr_returning_cdemo_sk","wr_reason_sk","wr_order_number","wr_fee","wr_refunded_cash"] diff --git a/ql/src/test/results/clientpositive/perf/query87.q.out b/ql/src/test/results/clientpositive/perf/query87.q.out index a336189..52e1b12 100644 --- a/ql/src/test/results/clientpositive/perf/query87.q.out +++ b/ql/src/test/results/clientpositive/perf/query87.q.out @@ -19,316 +19,167 @@ Reducer 6 <- Reducer 19 (SIMPLE_EDGE), Reducer 5 (SIMPLE_EDGE) Reducer 7 <- Reducer 6 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 7 - File Output Operator [FS_74] - compressed:false - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_72] - | aggregations:["count(VALUE._col0)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_71] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: bigint) - Group By Operator [GBY_70] - aggregations:["count()"] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_69] - Statistics:Num rows: 24200000 Data size: 20812489029 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_68] - predicate:_col6 is null (type: boolean) - Statistics:Num rows: 24200000 Data size: 20812489029 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_112] - | condition map:[{"":"Left Outer Join0 to 1"}] - | keys:{"0":"_col0 (type: string), _col1 (type: string), _col2 (type: string)","1":"_col0 (type: string), _col1 (type: string), _col2 (type: string)"} - | outputColumnNames:["_col6"] - | Statistics:Num rows: 48400001 Data size: 41624978920 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 19 [SIMPLE_EDGE] - | Reduce Output Operator [RS_66] - | key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: string) - | sort order:+++ - | Statistics:Num rows: 44000000 Data size: 37840889108 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_64] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 44000000 Data size: 37840889108 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_63] - | | keys:KEY._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: string) - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 44000000 Data size: 37840889108 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 18 [SIMPLE_EDGE] - | Reduce Output Operator [RS_62] - | key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: string) - | sort order:+++ - | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_61] - | keys:_col3 (type: string), _col6 (type: string), _col7 (type: string) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_110] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col3","_col6","_col7"] - | | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - | |<-Map 21 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_58] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: string), _col2 (type: string) - | | Select Operator [SEL_53] - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_104] - | | predicate:c_customer_sk is not null (type: boolean) - | | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_51] - | | alias:customer - | | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 17 [SIMPLE_EDGE] - | Reduce Output Operator [RS_57] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: string) - | Merge Join Operator [MERGEJOIN_109] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col3"] - | | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | |<-Map 16 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_54] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col1 (type: int) - | | Select Operator [SEL_47] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_102] - | | predicate:(ws_sold_date_sk is not null and ws_bill_customer_sk is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_45] - | | alias:web_sales - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 20 [SIMPLE_EDGE] - | Reduce Output Operator [RS_55] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_50] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_103] - | predicate:(d_month_seq BETWEEN 1193 AND 1204 and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_48] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_65] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: string) - sort order:+++ - Statistics:Num rows: 24200000 Data size: 20812489029 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_44] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 24200000 Data size: 20812489029 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_43] - predicate:_col3 is null (type: boolean) - Statistics:Num rows: 24200000 Data size: 20812489029 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_111] - | condition map:[{"":"Left Outer Join0 to 1"}] - | keys:{"0":"_col0 (type: string), _col1 (type: string), _col2 (type: string)","1":"_col0 (type: string), _col1 (type: string), _col2 (type: string)"} - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 48400001 Data size: 41624978920 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 13 [SIMPLE_EDGE] - | Reduce Output Operator [RS_41] - | key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: string) - | sort order:+++ - | Statistics:Num rows: 44000000 Data size: 37840889108 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_39] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 44000000 Data size: 37840889108 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_38] - | | keys:KEY._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: string) - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 44000000 Data size: 37840889108 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 12 [SIMPLE_EDGE] - | Reduce Output Operator [RS_37] - | key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: string) - | sort order:+++ - | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_36] - | keys:_col3 (type: string), _col6 (type: string), _col7 (type: string) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_108] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col3","_col6","_col7"] - | | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - | |<-Map 15 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_33] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: string), _col2 (type: string) - | | Select Operator [SEL_28] - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_101] - | | predicate:c_customer_sk is not null (type: boolean) - | | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_26] - | | alias:customer - | | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_32] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: string) - | Merge Join Operator [MERGEJOIN_107] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col3"] - | | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | |<-Map 10 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_29] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col1 (type: int) - | | Select Operator [SEL_22] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_99] - | | predicate:(cs_sold_date_sk is not null and cs_bill_customer_sk is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_20] - | | alias:catalog_sales - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 14 [SIMPLE_EDGE] - | Reduce Output Operator [RS_30] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_25] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_100] - | predicate:(d_month_seq BETWEEN 1193 AND 1204 and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_23] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_40] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: string) - sort order:+++ - Statistics:Num rows: 44000000 Data size: 37840889108 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_19] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 44000000 Data size: 37840889108 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_18] - | keys:KEY._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: string) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 44000000 Data size: 37840889108 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_17] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: string) - sort order:+++ - Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_16] - keys:_col3 (type: string), _col6 (type: string), _col7 (type: string) - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_106] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col3","_col6","_col7"] - | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_13] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_98] - | predicate:c_customer_sk is not null (type: boolean) - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:customer - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_12] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: string) - Merge Join Operator [MERGEJOIN_105] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col3"] - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_9] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col1 (type: int) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_96] - | predicate:(ss_sold_date_sk is not null and ss_customer_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_97] - predicate:(d_month_seq BETWEEN 1193 AND 1204 and d_date_sk is not null) (type: boolean) - Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:date_dim - Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 7 + File Output Operator [FS_74] + Group By Operator [GBY_72] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_71] + Group By Operator [GBY_70] (rows=1 width=8) + Output:["_col0"],aggregations:["count()"] + Select Operator [SEL_69] (rows=24200000 width=860) + Filter Operator [FIL_68] (rows=24200000 width=860) + predicate:_col6 is null + Merge Join Operator [MERGEJOIN_112] (rows=48400001 width=860) + Output:["_col6"],keys:{"0":"_col0, _col1, _col2","1":"_col0, _col1, _col2"} + <-Reducer 19 [SIMPLE_EDGE] + SHUFFLE [RS_66] + PartitionCols:_col0, _col1, _col2 + Select Operator [SEL_64] (rows=44000000 width=860) + Output:["_col0","_col1","_col2"] + Group By Operator [GBY_63] (rows=44000000 width=860) + Output:["_col0","_col1","_col2"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Reducer 18 [SIMPLE_EDGE] + SHUFFLE [RS_62] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_61] (rows=88000001 width=860) + Output:["_col0","_col1","_col2"],keys:_col3, _col6, _col7 + Merge Join Operator [MERGEJOIN_110] (rows=88000001 width=860) + Output:["_col3","_col6","_col7"],keys:{"0":"_col1","1":"_col0"} + <-Map 21 [SIMPLE_EDGE] + SHUFFLE [RS_58] + PartitionCols:_col0 + Select Operator [SEL_53] (rows=80000000 width=860) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_104] (rows=80000000 width=860) + predicate:c_customer_sk is not null + TableScan [TS_51] (rows=80000000 width=860) + default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_first_name","c_last_name"] + <-Reducer 17 [SIMPLE_EDGE] + SHUFFLE [RS_57] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_109] (rows=40176 width=1119) + Output:["_col1","_col3"],keys:{"0":"_col0","1":"_col0"} + <-Map 16 [SIMPLE_EDGE] + SHUFFLE [RS_54] + PartitionCols:_col0 + Select Operator [SEL_47] (rows=1 width=0) + Output:["_col0","_col1"] + Filter Operator [FIL_102] (rows=1 width=0) + predicate:(ws_sold_date_sk is not null and ws_bill_customer_sk is not null) + TableScan [TS_45] (rows=1 width=0) + default@web_sales,web_sales,Tbl:PARTIAL,Col:NONE,Output:["ws_sold_date_sk","ws_bill_customer_sk"] + <-Map 20 [SIMPLE_EDGE] + SHUFFLE [RS_55] + PartitionCols:_col0 + Select Operator [SEL_50] (rows=36524 width=1119) + Output:["_col0","_col1"] + Filter Operator [FIL_103] (rows=36524 width=1119) + predicate:(d_month_seq BETWEEN 1193 AND 1204 and d_date_sk is not null) + TableScan [TS_48] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date","d_month_seq"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_65] + PartitionCols:_col0, _col1, _col2 + Select Operator [SEL_44] (rows=24200000 width=860) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_43] (rows=24200000 width=860) + predicate:_col3 is null + Merge Join Operator [MERGEJOIN_111] (rows=48400001 width=860) + Output:["_col0","_col1","_col2","_col3"],keys:{"0":"_col0, _col1, _col2","1":"_col0, _col1, _col2"} + <-Reducer 13 [SIMPLE_EDGE] + SHUFFLE [RS_41] + PartitionCols:_col0, _col1, _col2 + Select Operator [SEL_39] (rows=44000000 width=860) + Output:["_col0","_col1","_col2"] + Group By Operator [GBY_38] (rows=44000000 width=860) + Output:["_col0","_col1","_col2"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Reducer 12 [SIMPLE_EDGE] + SHUFFLE [RS_37] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_36] (rows=88000001 width=860) + Output:["_col0","_col1","_col2"],keys:_col3, _col6, _col7 + Merge Join Operator [MERGEJOIN_108] (rows=88000001 width=860) + Output:["_col3","_col6","_col7"],keys:{"0":"_col1","1":"_col0"} + <-Map 15 [SIMPLE_EDGE] + SHUFFLE [RS_33] + PartitionCols:_col0 + Select Operator [SEL_28] (rows=80000000 width=860) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_101] (rows=80000000 width=860) + predicate:c_customer_sk is not null + TableScan [TS_26] (rows=80000000 width=860) + default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_first_name","c_last_name"] + <-Reducer 11 [SIMPLE_EDGE] + SHUFFLE [RS_32] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_107] (rows=40176 width=1119) + Output:["_col1","_col3"],keys:{"0":"_col0","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_29] + PartitionCols:_col0 + Select Operator [SEL_22] (rows=1 width=0) + Output:["_col0","_col1"] + Filter Operator [FIL_99] (rows=1 width=0) + predicate:(cs_sold_date_sk is not null and cs_bill_customer_sk is not null) + TableScan [TS_20] (rows=1 width=0) + default@catalog_sales,catalog_sales,Tbl:PARTIAL,Col:NONE,Output:["cs_sold_date_sk","cs_bill_customer_sk"] + <-Map 14 [SIMPLE_EDGE] + SHUFFLE [RS_30] + PartitionCols:_col0 + Select Operator [SEL_25] (rows=36524 width=1119) + Output:["_col0","_col1"] + Filter Operator [FIL_100] (rows=36524 width=1119) + predicate:(d_month_seq BETWEEN 1193 AND 1204 and d_date_sk is not null) + TableScan [TS_23] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date","d_month_seq"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_40] + PartitionCols:_col0, _col1, _col2 + Select Operator [SEL_19] (rows=44000000 width=860) + Output:["_col0","_col1","_col2"] + Group By Operator [GBY_18] (rows=44000000 width=860) + Output:["_col0","_col1","_col2"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_17] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_16] (rows=88000001 width=860) + Output:["_col0","_col1","_col2"],keys:_col3, _col6, _col7 + Merge Join Operator [MERGEJOIN_106] (rows=88000001 width=860) + Output:["_col3","_col6","_col7"],keys:{"0":"_col1","1":"_col0"} + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=80000000 width=860) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_98] (rows=80000000 width=860) + predicate:c_customer_sk is not null + TableScan [TS_6] (rows=80000000 width=860) + default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_first_name","c_last_name"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_105] (rows=40176 width=1119) + Output:["_col1","_col3"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1"] + Filter Operator [FIL_96] (rows=1 width=0) + predicate:(ss_sold_date_sk is not null and ss_customer_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_customer_sk"] + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_10] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=36524 width=1119) + Output:["_col0","_col1"] + Filter Operator [FIL_97] (rows=36524 width=1119) + predicate:(d_month_seq BETWEEN 1193 AND 1204 and d_date_sk is not null) + TableScan [TS_3] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date","d_month_seq"] diff --git a/ql/src/test/results/clientpositive/perf/query88.q.out b/ql/src/test/results/clientpositive/perf/query88.q.out index f139dd1..f13b3ea 100644 --- a/ql/src/test/results/clientpositive/perf/query88.q.out +++ b/ql/src/test/results/clientpositive/perf/query88.q.out @@ -233,925 +233,483 @@ Reducer 8 <- Reducer 36 (SIMPLE_EDGE), Reducer 7 (SIMPLE_EDGE) Reducer 9 <- Reducer 44 (SIMPLE_EDGE), Reducer 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 12 - File Output Operator [FS_237] - compressed:false - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Merge Join Operator [MERGEJOIN_372] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{} - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_233] - | sort order: - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: bigint), _col1 (type: bigint), _col2 (type: bigint), _col3 (type: bigint), _col4 (type: bigint), _col5 (type: bigint), _col6 (type: bigint) - | Merge Join Operator [MERGEJOIN_371] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{} - | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 10 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_230] - | | sort order: - | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: bigint), _col1 (type: bigint), _col2 (type: bigint), _col3 (type: bigint), _col4 (type: bigint), _col5 (type: bigint) - | | Merge Join Operator [MERGEJOIN_370] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{} - | | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 52 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_228] - | | | sort order: - | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col0 (type: bigint) - | | | Group By Operator [GBY_154] - | | | | aggregations:["count(VALUE._col0)"] - | | | | outputColumnNames:["_col0"] - | | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | | |<-Reducer 51 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_153] - | | | sort order: - | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col0 (type: bigint) - | | | Group By Operator [GBY_152] - | | | aggregations:["count()"] - | | | outputColumnNames:["_col0"] - | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | | Merge Join Operator [MERGEJOIN_359] - | | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | | | | Statistics:Num rows: 17424 Data size: 8206704 Basic stats: COMPLETE Column stats: NONE - | | | |<-Map 55 [SIMPLE_EDGE] - | | | | Reduce Output Operator [RS_149] - | | | | key expressions:_col0 (type: int) - | | | | Map-reduce partition columns:_col0 (type: int) - | | | | sort order:+ - | | | | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | | | | Select Operator [SEL_141] - | | | | outputColumnNames:["_col0"] - | | | | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | | | | Filter Operator [FIL_333] - | | | | predicate:((s_store_name = 'ese') and s_store_sk is not null) (type: boolean) - | | | | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | | | | TableScan [TS_139] - | | | | alias:store - | | | | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | | | |<-Reducer 50 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_148] - | | | key expressions:_col2 (type: int) - | | | Map-reduce partition columns:_col2 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 15840 Data size: 7460640 Basic stats: COMPLETE Column stats: NONE - | | | Merge Join Operator [MERGEJOIN_358] - | | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | | | outputColumnNames:["_col2"] - | | | | Statistics:Num rows: 15840 Data size: 7460640 Basic stats: COMPLETE Column stats: NONE - | | | |<-Map 54 [SIMPLE_EDGE] - | | | | Reduce Output Operator [RS_146] - | | | | key expressions:_col0 (type: int) - | | | | Map-reduce partition columns:_col0 (type: int) - | | | | sort order:+ - | | | | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | | | | Select Operator [SEL_138] - | | | | outputColumnNames:["_col0"] - | | | | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | | | | Filter Operator [FIL_332] - | | | | predicate:(((t_hour = 11) and (t_minute < 30)) and t_time_sk is not null) (type: boolean) - | | | | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | | | | TableScan [TS_136] - | | | | alias:time_dim - | | | | Statistics:Num rows: 86400 Data size: 40694400 Basic stats: COMPLETE Column stats: NONE - | | | |<-Reducer 49 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_145] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 3960 Data size: 423720 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col2 (type: int) - | | | Merge Join Operator [MERGEJOIN_357] - | | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | | | outputColumnNames:["_col0","_col2"] - | | | | Statistics:Num rows: 3960 Data size: 423720 Basic stats: COMPLETE Column stats: NONE - | | | |<-Map 48 [SIMPLE_EDGE] - | | | | Reduce Output Operator [RS_142] - | | | | key expressions:_col1 (type: int) - | | | | Map-reduce partition columns:_col1 (type: int) - | | | | sort order:+ - | | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | | value expressions:_col0 (type: int), _col2 (type: int) - | | | | Select Operator [SEL_132] - | | | | outputColumnNames:["_col0","_col1","_col2"] - | | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | | Filter Operator [FIL_330] - | | | | predicate:((ss_hdemo_sk is not null and ss_sold_time_sk is not null) and ss_store_sk is not null) (type: boolean) - | | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | | TableScan [TS_130] - | | | | alias:store_sales - | | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | |<-Map 53 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_143] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | | | Select Operator [SEL_135] - | | | outputColumnNames:["_col0"] - | | | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_331] - | | | predicate:((((hd_dep_count = 3) and (hd_vehicle_count <= 5)) or ((hd_dep_count = 0) and (hd_vehicle_count <= 2)) or ((hd_dep_count = 1) and (hd_vehicle_count <= 3))) and hd_demo_sk is not null) (type: boolean) - | | | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_133] - | | | alias:household_demographics - | | | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 9 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_227] - | | sort order: - | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: bigint), _col1 (type: bigint), _col2 (type: bigint), _col3 (type: bigint), _col4 (type: bigint) - | | Merge Join Operator [MERGEJOIN_369] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{} - | | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 44 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_225] - | | | sort order: - | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col0 (type: bigint) - | | | Group By Operator [GBY_128] - | | | | aggregations:["count(VALUE._col0)"] - | | | | outputColumnNames:["_col0"] - | | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | | |<-Reducer 43 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_127] - | | | sort order: - | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col0 (type: bigint) - | | | Group By Operator [GBY_126] - | | | aggregations:["count()"] - | | | outputColumnNames:["_col0"] - | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | | Merge Join Operator [MERGEJOIN_356] - | | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | | | | Statistics:Num rows: 17424 Data size: 8206704 Basic stats: COMPLETE Column stats: NONE - | | | |<-Map 47 [SIMPLE_EDGE] - | | | | Reduce Output Operator [RS_123] - | | | | key expressions:_col0 (type: int) - | | | | Map-reduce partition columns:_col0 (type: int) - | | | | sort order:+ - | | | | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | | | | Select Operator [SEL_115] - | | | | outputColumnNames:["_col0"] - | | | | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | | | | Filter Operator [FIL_329] - | | | | predicate:((s_store_name = 'ese') and s_store_sk is not null) (type: boolean) - | | | | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | | | | TableScan [TS_113] - | | | | alias:store - | | | | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | | | |<-Reducer 42 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_122] - | | | key expressions:_col2 (type: int) - | | | Map-reduce partition columns:_col2 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 15840 Data size: 7460640 Basic stats: COMPLETE Column stats: NONE - | | | Merge Join Operator [MERGEJOIN_355] - | | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | | | outputColumnNames:["_col2"] - | | | | Statistics:Num rows: 15840 Data size: 7460640 Basic stats: COMPLETE Column stats: NONE - | | | |<-Map 46 [SIMPLE_EDGE] - | | | | Reduce Output Operator [RS_120] - | | | | key expressions:_col0 (type: int) - | | | | Map-reduce partition columns:_col0 (type: int) - | | | | sort order:+ - | | | | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | | | | Select Operator [SEL_112] - | | | | outputColumnNames:["_col0"] - | | | | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | | | | Filter Operator [FIL_328] - | | | | predicate:(((t_hour = 10) and (t_minute >= 30)) and t_time_sk is not null) (type: boolean) - | | | | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | | | | TableScan [TS_110] - | | | | alias:time_dim - | | | | Statistics:Num rows: 86400 Data size: 40694400 Basic stats: COMPLETE Column stats: NONE - | | | |<-Reducer 41 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_119] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 3960 Data size: 423720 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col2 (type: int) - | | | Merge Join Operator [MERGEJOIN_354] - | | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | | | outputColumnNames:["_col0","_col2"] - | | | | Statistics:Num rows: 3960 Data size: 423720 Basic stats: COMPLETE Column stats: NONE - | | | |<-Map 40 [SIMPLE_EDGE] - | | | | Reduce Output Operator [RS_116] - | | | | key expressions:_col1 (type: int) - | | | | Map-reduce partition columns:_col1 (type: int) - | | | | sort order:+ - | | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | | value expressions:_col0 (type: int), _col2 (type: int) - | | | | Select Operator [SEL_106] - | | | | outputColumnNames:["_col0","_col1","_col2"] - | | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | | Filter Operator [FIL_326] - | | | | predicate:((ss_hdemo_sk is not null and ss_sold_time_sk is not null) and ss_store_sk is not null) (type: boolean) - | | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | | TableScan [TS_104] - | | | | alias:store_sales - | | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | |<-Map 45 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_117] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | | | Select Operator [SEL_109] - | | | outputColumnNames:["_col0"] - | | | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_327] - | | | predicate:((((hd_dep_count = 3) and (hd_vehicle_count <= 5)) or ((hd_dep_count = 0) and (hd_vehicle_count <= 2)) or ((hd_dep_count = 1) and (hd_vehicle_count <= 3))) and hd_demo_sk is not null) (type: boolean) - | | | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_107] - | | | alias:household_demographics - | | | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 8 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_224] - | | sort order: - | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: bigint), _col1 (type: bigint), _col2 (type: bigint), _col3 (type: bigint) - | | Merge Join Operator [MERGEJOIN_368] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{} - | | | outputColumnNames:["_col0","_col1","_col2","_col3"] - | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 36 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_222] - | | | sort order: - | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col0 (type: bigint) - | | | Group By Operator [GBY_102] - | | | | aggregations:["count(VALUE._col0)"] - | | | | outputColumnNames:["_col0"] - | | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | | |<-Reducer 35 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_101] - | | | sort order: - | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col0 (type: bigint) - | | | Group By Operator [GBY_100] - | | | aggregations:["count()"] - | | | outputColumnNames:["_col0"] - | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | | Merge Join Operator [MERGEJOIN_353] - | | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | | | | Statistics:Num rows: 17424 Data size: 8206704 Basic stats: COMPLETE Column stats: NONE - | | | |<-Map 39 [SIMPLE_EDGE] - | | | | Reduce Output Operator [RS_97] - | | | | key expressions:_col0 (type: int) - | | | | Map-reduce partition columns:_col0 (type: int) - | | | | sort order:+ - | | | | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | | | | Select Operator [SEL_89] - | | | | outputColumnNames:["_col0"] - | | | | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | | | | Filter Operator [FIL_325] - | | | | predicate:((s_store_name = 'ese') and s_store_sk is not null) (type: boolean) - | | | | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | | | | TableScan [TS_87] - | | | | alias:store - | | | | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | | | |<-Reducer 34 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_96] - | | | key expressions:_col2 (type: int) - | | | Map-reduce partition columns:_col2 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 15840 Data size: 7460640 Basic stats: COMPLETE Column stats: NONE - | | | Merge Join Operator [MERGEJOIN_352] - | | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | | | outputColumnNames:["_col2"] - | | | | Statistics:Num rows: 15840 Data size: 7460640 Basic stats: COMPLETE Column stats: NONE - | | | |<-Map 38 [SIMPLE_EDGE] - | | | | Reduce Output Operator [RS_94] - | | | | key expressions:_col0 (type: int) - | | | | Map-reduce partition columns:_col0 (type: int) - | | | | sort order:+ - | | | | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | | | | Select Operator [SEL_86] - | | | | outputColumnNames:["_col0"] - | | | | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | | | | Filter Operator [FIL_324] - | | | | predicate:(((t_hour = 10) and (t_minute < 30)) and t_time_sk is not null) (type: boolean) - | | | | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | | | | TableScan [TS_84] - | | | | alias:time_dim - | | | | Statistics:Num rows: 86400 Data size: 40694400 Basic stats: COMPLETE Column stats: NONE - | | | |<-Reducer 33 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_93] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 3960 Data size: 423720 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col2 (type: int) - | | | Merge Join Operator [MERGEJOIN_351] - | | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | | | outputColumnNames:["_col0","_col2"] - | | | | Statistics:Num rows: 3960 Data size: 423720 Basic stats: COMPLETE Column stats: NONE - | | | |<-Map 32 [SIMPLE_EDGE] - | | | | Reduce Output Operator [RS_90] - | | | | key expressions:_col1 (type: int) - | | | | Map-reduce partition columns:_col1 (type: int) - | | | | sort order:+ - | | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | | value expressions:_col0 (type: int), _col2 (type: int) - | | | | Select Operator [SEL_80] - | | | | outputColumnNames:["_col0","_col1","_col2"] - | | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | | Filter Operator [FIL_322] - | | | | predicate:((ss_hdemo_sk is not null and ss_sold_time_sk is not null) and ss_store_sk is not null) (type: boolean) - | | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | | TableScan [TS_78] - | | | | alias:store_sales - | | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | |<-Map 37 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_91] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | | | Select Operator [SEL_83] - | | | outputColumnNames:["_col0"] - | | | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_323] - | | | predicate:((((hd_dep_count = 3) and (hd_vehicle_count <= 5)) or ((hd_dep_count = 0) and (hd_vehicle_count <= 2)) or ((hd_dep_count = 1) and (hd_vehicle_count <= 3))) and hd_demo_sk is not null) (type: boolean) - | | | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_81] - | | | alias:household_demographics - | | | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 7 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_221] - | | sort order: - | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: bigint), _col1 (type: bigint), _col2 (type: bigint) - | | Merge Join Operator [MERGEJOIN_367] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{} - | | | outputColumnNames:["_col0","_col1","_col2"] - | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 28 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_219] - | | | sort order: - | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col0 (type: bigint) - | | | Group By Operator [GBY_76] - | | | | aggregations:["count(VALUE._col0)"] - | | | | outputColumnNames:["_col0"] - | | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | | |<-Reducer 27 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_75] - | | | sort order: - | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col0 (type: bigint) - | | | Group By Operator [GBY_74] - | | | aggregations:["count()"] - | | | outputColumnNames:["_col0"] - | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | | Merge Join Operator [MERGEJOIN_350] - | | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | | | | Statistics:Num rows: 17424 Data size: 8206704 Basic stats: COMPLETE Column stats: NONE - | | | |<-Map 31 [SIMPLE_EDGE] - | | | | Reduce Output Operator [RS_71] - | | | | key expressions:_col0 (type: int) - | | | | Map-reduce partition columns:_col0 (type: int) - | | | | sort order:+ - | | | | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | | | | Select Operator [SEL_63] - | | | | outputColumnNames:["_col0"] - | | | | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | | | | Filter Operator [FIL_321] - | | | | predicate:((s_store_name = 'ese') and s_store_sk is not null) (type: boolean) - | | | | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | | | | TableScan [TS_61] - | | | | alias:store - | | | | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | | | |<-Reducer 26 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_70] - | | | key expressions:_col2 (type: int) - | | | Map-reduce partition columns:_col2 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 15840 Data size: 7460640 Basic stats: COMPLETE Column stats: NONE - | | | Merge Join Operator [MERGEJOIN_349] - | | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | | | outputColumnNames:["_col2"] - | | | | Statistics:Num rows: 15840 Data size: 7460640 Basic stats: COMPLETE Column stats: NONE - | | | |<-Map 30 [SIMPLE_EDGE] - | | | | Reduce Output Operator [RS_68] - | | | | key expressions:_col0 (type: int) - | | | | Map-reduce partition columns:_col0 (type: int) - | | | | sort order:+ - | | | | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | | | | Select Operator [SEL_60] - | | | | outputColumnNames:["_col0"] - | | | | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | | | | Filter Operator [FIL_320] - | | | | predicate:(((t_minute >= 30) and (t_hour = 9)) and t_time_sk is not null) (type: boolean) - | | | | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | | | | TableScan [TS_58] - | | | | alias:time_dim - | | | | Statistics:Num rows: 86400 Data size: 40694400 Basic stats: COMPLETE Column stats: NONE - | | | |<-Reducer 25 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_67] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 3960 Data size: 423720 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col2 (type: int) - | | | Merge Join Operator [MERGEJOIN_348] - | | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | | | outputColumnNames:["_col0","_col2"] - | | | | Statistics:Num rows: 3960 Data size: 423720 Basic stats: COMPLETE Column stats: NONE - | | | |<-Map 24 [SIMPLE_EDGE] - | | | | Reduce Output Operator [RS_64] - | | | | key expressions:_col1 (type: int) - | | | | Map-reduce partition columns:_col1 (type: int) - | | | | sort order:+ - | | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | | value expressions:_col0 (type: int), _col2 (type: int) - | | | | Select Operator [SEL_54] - | | | | outputColumnNames:["_col0","_col1","_col2"] - | | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | | Filter Operator [FIL_318] - | | | | predicate:((ss_hdemo_sk is not null and ss_sold_time_sk is not null) and ss_store_sk is not null) (type: boolean) - | | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | | TableScan [TS_52] - | | | | alias:store_sales - | | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | |<-Map 29 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_65] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | | | Select Operator [SEL_57] - | | | outputColumnNames:["_col0"] - | | | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_319] - | | | predicate:((((hd_dep_count = 3) and (hd_vehicle_count <= 5)) or ((hd_dep_count = 0) and (hd_vehicle_count <= 2)) or ((hd_dep_count = 1) and (hd_vehicle_count <= 3))) and hd_demo_sk is not null) (type: boolean) - | | | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_55] - | | | alias:household_demographics - | | | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 6 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_218] - | | sort order: - | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: bigint), _col1 (type: bigint) - | | Merge Join Operator [MERGEJOIN_366] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{} - | | | outputColumnNames:["_col0","_col1"] - | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 20 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_216] - | | | sort order: - | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col0 (type: bigint) - | | | Group By Operator [GBY_50] - | | | | aggregations:["count(VALUE._col0)"] - | | | | outputColumnNames:["_col0"] - | | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | | |<-Reducer 19 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_49] - | | | sort order: - | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col0 (type: bigint) - | | | Group By Operator [GBY_48] - | | | aggregations:["count()"] - | | | outputColumnNames:["_col0"] - | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | | Merge Join Operator [MERGEJOIN_347] - | | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | | | | Statistics:Num rows: 17424 Data size: 8206704 Basic stats: COMPLETE Column stats: NONE - | | | |<-Map 23 [SIMPLE_EDGE] - | | | | Reduce Output Operator [RS_45] - | | | | key expressions:_col0 (type: int) - | | | | Map-reduce partition columns:_col0 (type: int) - | | | | sort order:+ - | | | | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | | | | Select Operator [SEL_37] - | | | | outputColumnNames:["_col0"] - | | | | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | | | | Filter Operator [FIL_317] - | | | | predicate:((s_store_name = 'ese') and s_store_sk is not null) (type: boolean) - | | | | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | | | | TableScan [TS_35] - | | | | alias:store - | | | | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | | | |<-Reducer 18 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_44] - | | | key expressions:_col2 (type: int) - | | | Map-reduce partition columns:_col2 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 15840 Data size: 7460640 Basic stats: COMPLETE Column stats: NONE - | | | Merge Join Operator [MERGEJOIN_346] - | | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | | | outputColumnNames:["_col2"] - | | | | Statistics:Num rows: 15840 Data size: 7460640 Basic stats: COMPLETE Column stats: NONE - | | | |<-Map 22 [SIMPLE_EDGE] - | | | | Reduce Output Operator [RS_42] - | | | | key expressions:_col0 (type: int) - | | | | Map-reduce partition columns:_col0 (type: int) - | | | | sort order:+ - | | | | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | | | | Select Operator [SEL_34] - | | | | outputColumnNames:["_col0"] - | | | | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | | | | Filter Operator [FIL_316] - | | | | predicate:(((t_hour = 9) and (t_minute < 30)) and t_time_sk is not null) (type: boolean) - | | | | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | | | | TableScan [TS_32] - | | | | alias:time_dim - | | | | Statistics:Num rows: 86400 Data size: 40694400 Basic stats: COMPLETE Column stats: NONE - | | | |<-Reducer 17 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_41] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 3960 Data size: 423720 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col2 (type: int) - | | | Merge Join Operator [MERGEJOIN_345] - | | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | | | outputColumnNames:["_col0","_col2"] - | | | | Statistics:Num rows: 3960 Data size: 423720 Basic stats: COMPLETE Column stats: NONE - | | | |<-Map 16 [SIMPLE_EDGE] - | | | | Reduce Output Operator [RS_38] - | | | | key expressions:_col1 (type: int) - | | | | Map-reduce partition columns:_col1 (type: int) - | | | | sort order:+ - | | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | | value expressions:_col0 (type: int), _col2 (type: int) - | | | | Select Operator [SEL_28] - | | | | outputColumnNames:["_col0","_col1","_col2"] - | | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | | Filter Operator [FIL_314] - | | | | predicate:((ss_hdemo_sk is not null and ss_sold_time_sk is not null) and ss_store_sk is not null) (type: boolean) - | | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | | TableScan [TS_26] - | | | | alias:store_sales - | | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | |<-Map 21 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_39] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | | | Select Operator [SEL_31] - | | | outputColumnNames:["_col0"] - | | | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_315] - | | | predicate:((((hd_dep_count = 3) and (hd_vehicle_count <= 5)) or ((hd_dep_count = 0) and (hd_vehicle_count <= 2)) or ((hd_dep_count = 1) and (hd_vehicle_count <= 3))) and hd_demo_sk is not null) (type: boolean) - | | | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_29] - | | | alias:household_demographics - | | | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 5 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_215] - | | sort order: - | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: bigint) - | | Group By Operator [GBY_24] - | | | aggregations:["count(VALUE._col0)"] - | | | outputColumnNames:["_col0"] - | | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 4 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_23] - | | sort order: - | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: bigint) - | | Group By Operator [GBY_22] - | | aggregations:["count()"] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | | Merge Join Operator [MERGEJOIN_344] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | | | Statistics:Num rows: 17424 Data size: 8206704 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 15 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_19] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | | | Select Operator [SEL_11] - | | | outputColumnNames:["_col0"] - | | | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_313] - | | | predicate:((s_store_name = 'ese') and s_store_sk is not null) (type: boolean) - | | | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_9] - | | | alias:store - | | | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 3 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_18] - | | key expressions:_col2 (type: int) - | | Map-reduce partition columns:_col2 (type: int) - | | sort order:+ - | | Statistics:Num rows: 15840 Data size: 7460640 Basic stats: COMPLETE Column stats: NONE - | | Merge Join Operator [MERGEJOIN_343] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | | outputColumnNames:["_col2"] - | | | Statistics:Num rows: 15840 Data size: 7460640 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 14 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_16] - | | | key expressions:_col0 (type: int) - | | | Map-reduce partition columns:_col0 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | | | Select Operator [SEL_8] - | | | outputColumnNames:["_col0"] - | | | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_312] - | | | predicate:(((t_minute >= 30) and (t_hour = 8)) and t_time_sk is not null) (type: boolean) - | | | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_6] - | | | alias:time_dim - | | | Statistics:Num rows: 86400 Data size: 40694400 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 2 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_15] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 3960 Data size: 423720 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col2 (type: int) - | | Merge Join Operator [MERGEJOIN_342] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | | outputColumnNames:["_col0","_col2"] - | | | Statistics:Num rows: 3960 Data size: 423720 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 1 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_12] - | | | key expressions:_col1 (type: int) - | | | Map-reduce partition columns:_col1 (type: int) - | | | sort order:+ - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | value expressions:_col0 (type: int), _col2 (type: int) - | | | Select Operator [SEL_2] - | | | outputColumnNames:["_col0","_col1","_col2"] - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | Filter Operator [FIL_310] - | | | predicate:((ss_hdemo_sk is not null and ss_sold_time_sk is not null) and ss_store_sk is not null) (type: boolean) - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | | TableScan [TS_0] - | | | alias:store_sales - | | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | |<-Map 13 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_13] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_5] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_311] - | | predicate:((((hd_dep_count = 3) and (hd_vehicle_count <= 5)) or ((hd_dep_count = 0) and (hd_vehicle_count <= 2)) or ((hd_dep_count = 1) and (hd_vehicle_count <= 3))) and hd_demo_sk is not null) (type: boolean) - | | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_3] - | | alias:household_demographics - | | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 60 [SIMPLE_EDGE] - | Reduce Output Operator [RS_231] - | sort order: - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: bigint) - | Group By Operator [GBY_180] - | | aggregations:["count(VALUE._col0)"] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 59 [SIMPLE_EDGE] - | Reduce Output Operator [RS_179] - | sort order: - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: bigint) - | Group By Operator [GBY_178] - | aggregations:["count()"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_362] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | | Statistics:Num rows: 17424 Data size: 8206704 Basic stats: COMPLETE Column stats: NONE - | |<-Map 63 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_175] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_167] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_337] - | | predicate:((s_store_name = 'ese') and s_store_sk is not null) (type: boolean) - | | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_165] - | | alias:store - | | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 58 [SIMPLE_EDGE] - | Reduce Output Operator [RS_174] - | key expressions:_col2 (type: int) - | Map-reduce partition columns:_col2 (type: int) - | sort order:+ - | Statistics:Num rows: 15840 Data size: 7460640 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_361] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col2"] - | | Statistics:Num rows: 15840 Data size: 7460640 Basic stats: COMPLETE Column stats: NONE - | |<-Map 62 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_172] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_164] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_336] - | | predicate:(((t_minute >= 30) and (t_hour = 11)) and t_time_sk is not null) (type: boolean) - | | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_162] - | | alias:time_dim - | | Statistics:Num rows: 86400 Data size: 40694400 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 57 [SIMPLE_EDGE] - | Reduce Output Operator [RS_171] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 3960 Data size: 423720 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col2 (type: int) - | Merge Join Operator [MERGEJOIN_360] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col0","_col2"] - | | Statistics:Num rows: 3960 Data size: 423720 Basic stats: COMPLETE Column stats: NONE - | |<-Map 56 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_168] - | | key expressions:_col1 (type: int) - | | Map-reduce partition columns:_col1 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col0 (type: int), _col2 (type: int) - | | Select Operator [SEL_158] - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_334] - | | predicate:((ss_hdemo_sk is not null and ss_sold_time_sk is not null) and ss_store_sk is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_156] - | | alias:store_sales - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 61 [SIMPLE_EDGE] - | Reduce Output Operator [RS_169] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_161] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_335] - | predicate:((((hd_dep_count = 3) and (hd_vehicle_count <= 5)) or ((hd_dep_count = 0) and (hd_vehicle_count <= 2)) or ((hd_dep_count = 1) and (hd_vehicle_count <= 3))) and hd_demo_sk is not null) (type: boolean) - | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_159] - | alias:household_demographics - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 68 [SIMPLE_EDGE] - Reduce Output Operator [RS_234] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: bigint) - Group By Operator [GBY_206] - | aggregations:["count(VALUE._col0)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 67 [SIMPLE_EDGE] - Reduce Output Operator [RS_205] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: bigint) - Group By Operator [GBY_204] - aggregations:["count()"] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_365] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | Statistics:Num rows: 17424 Data size: 8206704 Basic stats: COMPLETE Column stats: NONE - |<-Map 71 [SIMPLE_EDGE] - | Reduce Output Operator [RS_201] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_193] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_341] - | predicate:((s_store_name = 'ese') and s_store_sk is not null) (type: boolean) - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_191] - | alias:store - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 66 [SIMPLE_EDGE] - Reduce Output Operator [RS_200] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 15840 Data size: 7460640 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_364] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col2"] - | Statistics:Num rows: 15840 Data size: 7460640 Basic stats: COMPLETE Column stats: NONE - |<-Map 70 [SIMPLE_EDGE] - | Reduce Output Operator [RS_198] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_190] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_340] - | predicate:(((t_hour = 12) and (t_minute < 30)) and t_time_sk is not null) (type: boolean) - | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_188] - | alias:time_dim - | Statistics:Num rows: 86400 Data size: 40694400 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 65 [SIMPLE_EDGE] - Reduce Output Operator [RS_197] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 3960 Data size: 423720 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: int) - Merge Join Operator [MERGEJOIN_363] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2"] - | Statistics:Num rows: 3960 Data size: 423720 Basic stats: COMPLETE Column stats: NONE - |<-Map 64 [SIMPLE_EDGE] - | Reduce Output Operator [RS_194] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col2 (type: int) - | Select Operator [SEL_184] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_338] - | predicate:((ss_hdemo_sk is not null and ss_sold_time_sk is not null) and ss_store_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_182] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 69 [SIMPLE_EDGE] - Reduce Output Operator [RS_195] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_187] - outputColumnNames:["_col0"] - Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_339] - predicate:((((hd_dep_count = 3) and (hd_vehicle_count <= 5)) or ((hd_dep_count = 0) and (hd_vehicle_count <= 2)) or ((hd_dep_count = 1) and (hd_vehicle_count <= 3))) and hd_demo_sk is not null) (type: boolean) - Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_185] - alias:household_demographics - Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 12 + File Output Operator [FS_237] + Merge Join Operator [MERGEJOIN_372] (rows=1 width=8) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"],keys:{} + <-Reducer 11 [SIMPLE_EDGE] + SHUFFLE [RS_233] + Merge Join Operator [MERGEJOIN_371] (rows=1 width=8) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"],keys:{} + <-Reducer 10 [SIMPLE_EDGE] + SHUFFLE [RS_230] + Merge Join Operator [MERGEJOIN_370] (rows=1 width=8) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],keys:{} + <-Reducer 52 [SIMPLE_EDGE] + SHUFFLE [RS_228] + Group By Operator [GBY_154] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Reducer 51 [SIMPLE_EDGE] + SHUFFLE [RS_153] + Group By Operator [GBY_152] (rows=1 width=8) + Output:["_col0"],aggregations:["count()"] + Merge Join Operator [MERGEJOIN_359] (rows=17424 width=471) + keys:{"0":"_col2","1":"_col0"} + <-Map 55 [SIMPLE_EDGE] + SHUFFLE [RS_149] + PartitionCols:_col0 + Select Operator [SEL_141] (rows=852 width=1910) + Output:["_col0"] + Filter Operator [FIL_333] (rows=852 width=1910) + predicate:((s_store_name = 'ese') and s_store_sk is not null) + TableScan [TS_139] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_store_name"] + <-Reducer 50 [SIMPLE_EDGE] + SHUFFLE [RS_148] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_358] (rows=15840 width=471) + Output:["_col2"],keys:{"0":"_col0","1":"_col0"} + <-Map 54 [SIMPLE_EDGE] + SHUFFLE [RS_146] + PartitionCols:_col0 + Select Operator [SEL_138] (rows=14400 width=471) + Output:["_col0"] + Filter Operator [FIL_332] (rows=14400 width=471) + predicate:(((t_hour = 11) and (t_minute < 30)) and t_time_sk is not null) + TableScan [TS_136] (rows=86400 width=471) + default@time_dim,time_dim,Tbl:COMPLETE,Col:NONE,Output:["t_time_sk","t_hour","t_minute"] + <-Reducer 49 [SIMPLE_EDGE] + SHUFFLE [RS_145] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_357] (rows=3960 width=107) + Output:["_col0","_col2"],keys:{"0":"_col1","1":"_col0"} + <-Map 48 [SIMPLE_EDGE] + SHUFFLE [RS_142] + PartitionCols:_col1 + Select Operator [SEL_132] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_330] (rows=1 width=0) + predicate:((ss_hdemo_sk is not null and ss_sold_time_sk is not null) and ss_store_sk is not null) + TableScan [TS_130] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_time_sk","ss_hdemo_sk","ss_store_sk"] + <-Map 53 [SIMPLE_EDGE] + SHUFFLE [RS_143] + PartitionCols:_col0 + Select Operator [SEL_135] (rows=3600 width=107) + Output:["_col0"] + Filter Operator [FIL_331] (rows=3600 width=107) + predicate:((((hd_dep_count = 3) and (hd_vehicle_count <= 5)) or ((hd_dep_count = 0) and (hd_vehicle_count <= 2)) or ((hd_dep_count = 1) and (hd_vehicle_count <= 3))) and hd_demo_sk is not null) + TableScan [TS_133] (rows=7200 width=107) + default@household_demographics,household_demographics,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_dep_count","hd_vehicle_count"] + <-Reducer 9 [SIMPLE_EDGE] + SHUFFLE [RS_227] + Merge Join Operator [MERGEJOIN_369] (rows=1 width=8) + Output:["_col0","_col1","_col2","_col3","_col4"],keys:{} + <-Reducer 44 [SIMPLE_EDGE] + SHUFFLE [RS_225] + Group By Operator [GBY_128] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Reducer 43 [SIMPLE_EDGE] + SHUFFLE [RS_127] + Group By Operator [GBY_126] (rows=1 width=8) + Output:["_col0"],aggregations:["count()"] + Merge Join Operator [MERGEJOIN_356] (rows=17424 width=471) + keys:{"0":"_col2","1":"_col0"} + <-Map 47 [SIMPLE_EDGE] + SHUFFLE [RS_123] + PartitionCols:_col0 + Select Operator [SEL_115] (rows=852 width=1910) + Output:["_col0"] + Filter Operator [FIL_329] (rows=852 width=1910) + predicate:((s_store_name = 'ese') and s_store_sk is not null) + TableScan [TS_113] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_store_name"] + <-Reducer 42 [SIMPLE_EDGE] + SHUFFLE [RS_122] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_355] (rows=15840 width=471) + Output:["_col2"],keys:{"0":"_col0","1":"_col0"} + <-Map 46 [SIMPLE_EDGE] + SHUFFLE [RS_120] + PartitionCols:_col0 + Select Operator [SEL_112] (rows=14400 width=471) + Output:["_col0"] + Filter Operator [FIL_328] (rows=14400 width=471) + predicate:(((t_hour = 10) and (t_minute >= 30)) and t_time_sk is not null) + TableScan [TS_110] (rows=86400 width=471) + default@time_dim,time_dim,Tbl:COMPLETE,Col:NONE,Output:["t_time_sk","t_hour","t_minute"] + <-Reducer 41 [SIMPLE_EDGE] + SHUFFLE [RS_119] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_354] (rows=3960 width=107) + Output:["_col0","_col2"],keys:{"0":"_col1","1":"_col0"} + <-Map 40 [SIMPLE_EDGE] + SHUFFLE [RS_116] + PartitionCols:_col1 + Select Operator [SEL_106] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_326] (rows=1 width=0) + predicate:((ss_hdemo_sk is not null and ss_sold_time_sk is not null) and ss_store_sk is not null) + TableScan [TS_104] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_time_sk","ss_hdemo_sk","ss_store_sk"] + <-Map 45 [SIMPLE_EDGE] + SHUFFLE [RS_117] + PartitionCols:_col0 + Select Operator [SEL_109] (rows=3600 width=107) + Output:["_col0"] + Filter Operator [FIL_327] (rows=3600 width=107) + predicate:((((hd_dep_count = 3) and (hd_vehicle_count <= 5)) or ((hd_dep_count = 0) and (hd_vehicle_count <= 2)) or ((hd_dep_count = 1) and (hd_vehicle_count <= 3))) and hd_demo_sk is not null) + TableScan [TS_107] (rows=7200 width=107) + default@household_demographics,household_demographics,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_dep_count","hd_vehicle_count"] + <-Reducer 8 [SIMPLE_EDGE] + SHUFFLE [RS_224] + Merge Join Operator [MERGEJOIN_368] (rows=1 width=8) + Output:["_col0","_col1","_col2","_col3"],keys:{} + <-Reducer 36 [SIMPLE_EDGE] + SHUFFLE [RS_222] + Group By Operator [GBY_102] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Reducer 35 [SIMPLE_EDGE] + SHUFFLE [RS_101] + Group By Operator [GBY_100] (rows=1 width=8) + Output:["_col0"],aggregations:["count()"] + Merge Join Operator [MERGEJOIN_353] (rows=17424 width=471) + keys:{"0":"_col2","1":"_col0"} + <-Map 39 [SIMPLE_EDGE] + SHUFFLE [RS_97] + PartitionCols:_col0 + Select Operator [SEL_89] (rows=852 width=1910) + Output:["_col0"] + Filter Operator [FIL_325] (rows=852 width=1910) + predicate:((s_store_name = 'ese') and s_store_sk is not null) + TableScan [TS_87] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_store_name"] + <-Reducer 34 [SIMPLE_EDGE] + SHUFFLE [RS_96] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_352] (rows=15840 width=471) + Output:["_col2"],keys:{"0":"_col0","1":"_col0"} + <-Map 38 [SIMPLE_EDGE] + SHUFFLE [RS_94] + PartitionCols:_col0 + Select Operator [SEL_86] (rows=14400 width=471) + Output:["_col0"] + Filter Operator [FIL_324] (rows=14400 width=471) + predicate:(((t_hour = 10) and (t_minute < 30)) and t_time_sk is not null) + TableScan [TS_84] (rows=86400 width=471) + default@time_dim,time_dim,Tbl:COMPLETE,Col:NONE,Output:["t_time_sk","t_hour","t_minute"] + <-Reducer 33 [SIMPLE_EDGE] + SHUFFLE [RS_93] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_351] (rows=3960 width=107) + Output:["_col0","_col2"],keys:{"0":"_col1","1":"_col0"} + <-Map 32 [SIMPLE_EDGE] + SHUFFLE [RS_90] + PartitionCols:_col1 + Select Operator [SEL_80] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_322] (rows=1 width=0) + predicate:((ss_hdemo_sk is not null and ss_sold_time_sk is not null) and ss_store_sk is not null) + TableScan [TS_78] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_time_sk","ss_hdemo_sk","ss_store_sk"] + <-Map 37 [SIMPLE_EDGE] + SHUFFLE [RS_91] + PartitionCols:_col0 + Select Operator [SEL_83] (rows=3600 width=107) + Output:["_col0"] + Filter Operator [FIL_323] (rows=3600 width=107) + predicate:((((hd_dep_count = 3) and (hd_vehicle_count <= 5)) or ((hd_dep_count = 0) and (hd_vehicle_count <= 2)) or ((hd_dep_count = 1) and (hd_vehicle_count <= 3))) and hd_demo_sk is not null) + TableScan [TS_81] (rows=7200 width=107) + default@household_demographics,household_demographics,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_dep_count","hd_vehicle_count"] + <-Reducer 7 [SIMPLE_EDGE] + SHUFFLE [RS_221] + Merge Join Operator [MERGEJOIN_367] (rows=1 width=8) + Output:["_col0","_col1","_col2"],keys:{} + <-Reducer 28 [SIMPLE_EDGE] + SHUFFLE [RS_219] + Group By Operator [GBY_76] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Reducer 27 [SIMPLE_EDGE] + SHUFFLE [RS_75] + Group By Operator [GBY_74] (rows=1 width=8) + Output:["_col0"],aggregations:["count()"] + Merge Join Operator [MERGEJOIN_350] (rows=17424 width=471) + keys:{"0":"_col2","1":"_col0"} + <-Map 31 [SIMPLE_EDGE] + SHUFFLE [RS_71] + PartitionCols:_col0 + Select Operator [SEL_63] (rows=852 width=1910) + Output:["_col0"] + Filter Operator [FIL_321] (rows=852 width=1910) + predicate:((s_store_name = 'ese') and s_store_sk is not null) + TableScan [TS_61] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_store_name"] + <-Reducer 26 [SIMPLE_EDGE] + SHUFFLE [RS_70] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_349] (rows=15840 width=471) + Output:["_col2"],keys:{"0":"_col0","1":"_col0"} + <-Map 30 [SIMPLE_EDGE] + SHUFFLE [RS_68] + PartitionCols:_col0 + Select Operator [SEL_60] (rows=14400 width=471) + Output:["_col0"] + Filter Operator [FIL_320] (rows=14400 width=471) + predicate:(((t_minute >= 30) and (t_hour = 9)) and t_time_sk is not null) + TableScan [TS_58] (rows=86400 width=471) + default@time_dim,time_dim,Tbl:COMPLETE,Col:NONE,Output:["t_time_sk","t_hour","t_minute"] + <-Reducer 25 [SIMPLE_EDGE] + SHUFFLE [RS_67] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_348] (rows=3960 width=107) + Output:["_col0","_col2"],keys:{"0":"_col1","1":"_col0"} + <-Map 24 [SIMPLE_EDGE] + SHUFFLE [RS_64] + PartitionCols:_col1 + Select Operator [SEL_54] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_318] (rows=1 width=0) + predicate:((ss_hdemo_sk is not null and ss_sold_time_sk is not null) and ss_store_sk is not null) + TableScan [TS_52] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_time_sk","ss_hdemo_sk","ss_store_sk"] + <-Map 29 [SIMPLE_EDGE] + SHUFFLE [RS_65] + PartitionCols:_col0 + Select Operator [SEL_57] (rows=3600 width=107) + Output:["_col0"] + Filter Operator [FIL_319] (rows=3600 width=107) + predicate:((((hd_dep_count = 3) and (hd_vehicle_count <= 5)) or ((hd_dep_count = 0) and (hd_vehicle_count <= 2)) or ((hd_dep_count = 1) and (hd_vehicle_count <= 3))) and hd_demo_sk is not null) + TableScan [TS_55] (rows=7200 width=107) + default@household_demographics,household_demographics,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_dep_count","hd_vehicle_count"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_218] + Merge Join Operator [MERGEJOIN_366] (rows=1 width=8) + Output:["_col0","_col1"],keys:{} + <-Reducer 20 [SIMPLE_EDGE] + SHUFFLE [RS_216] + Group By Operator [GBY_50] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Reducer 19 [SIMPLE_EDGE] + SHUFFLE [RS_49] + Group By Operator [GBY_48] (rows=1 width=8) + Output:["_col0"],aggregations:["count()"] + Merge Join Operator [MERGEJOIN_347] (rows=17424 width=471) + keys:{"0":"_col2","1":"_col0"} + <-Map 23 [SIMPLE_EDGE] + SHUFFLE [RS_45] + PartitionCols:_col0 + Select Operator [SEL_37] (rows=852 width=1910) + Output:["_col0"] + Filter Operator [FIL_317] (rows=852 width=1910) + predicate:((s_store_name = 'ese') and s_store_sk is not null) + TableScan [TS_35] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_store_name"] + <-Reducer 18 [SIMPLE_EDGE] + SHUFFLE [RS_44] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_346] (rows=15840 width=471) + Output:["_col2"],keys:{"0":"_col0","1":"_col0"} + <-Map 22 [SIMPLE_EDGE] + SHUFFLE [RS_42] + PartitionCols:_col0 + Select Operator [SEL_34] (rows=14400 width=471) + Output:["_col0"] + Filter Operator [FIL_316] (rows=14400 width=471) + predicate:(((t_hour = 9) and (t_minute < 30)) and t_time_sk is not null) + TableScan [TS_32] (rows=86400 width=471) + default@time_dim,time_dim,Tbl:COMPLETE,Col:NONE,Output:["t_time_sk","t_hour","t_minute"] + <-Reducer 17 [SIMPLE_EDGE] + SHUFFLE [RS_41] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_345] (rows=3960 width=107) + Output:["_col0","_col2"],keys:{"0":"_col1","1":"_col0"} + <-Map 16 [SIMPLE_EDGE] + SHUFFLE [RS_38] + PartitionCols:_col1 + Select Operator [SEL_28] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_314] (rows=1 width=0) + predicate:((ss_hdemo_sk is not null and ss_sold_time_sk is not null) and ss_store_sk is not null) + TableScan [TS_26] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_time_sk","ss_hdemo_sk","ss_store_sk"] + <-Map 21 [SIMPLE_EDGE] + SHUFFLE [RS_39] + PartitionCols:_col0 + Select Operator [SEL_31] (rows=3600 width=107) + Output:["_col0"] + Filter Operator [FIL_315] (rows=3600 width=107) + predicate:((((hd_dep_count = 3) and (hd_vehicle_count <= 5)) or ((hd_dep_count = 0) and (hd_vehicle_count <= 2)) or ((hd_dep_count = 1) and (hd_vehicle_count <= 3))) and hd_demo_sk is not null) + TableScan [TS_29] (rows=7200 width=107) + default@household_demographics,household_demographics,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_dep_count","hd_vehicle_count"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_215] + Group By Operator [GBY_24] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_23] + Group By Operator [GBY_22] (rows=1 width=8) + Output:["_col0"],aggregations:["count()"] + Merge Join Operator [MERGEJOIN_344] (rows=17424 width=471) + keys:{"0":"_col2","1":"_col0"} + <-Map 15 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=852 width=1910) + Output:["_col0"] + Filter Operator [FIL_313] (rows=852 width=1910) + predicate:((s_store_name = 'ese') and s_store_sk is not null) + TableScan [TS_9] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_store_name"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_343] (rows=15840 width=471) + Output:["_col2"],keys:{"0":"_col0","1":"_col0"} + <-Map 14 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=14400 width=471) + Output:["_col0"] + Filter Operator [FIL_312] (rows=14400 width=471) + predicate:(((t_minute >= 30) and (t_hour = 8)) and t_time_sk is not null) + TableScan [TS_6] (rows=86400 width=471) + default@time_dim,time_dim,Tbl:COMPLETE,Col:NONE,Output:["t_time_sk","t_hour","t_minute"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_342] (rows=3960 width=107) + Output:["_col0","_col2"],keys:{"0":"_col1","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col1 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_310] (rows=1 width=0) + predicate:((ss_hdemo_sk is not null and ss_sold_time_sk is not null) and ss_store_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_time_sk","ss_hdemo_sk","ss_store_sk"] + <-Map 13 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=3600 width=107) + Output:["_col0"] + Filter Operator [FIL_311] (rows=3600 width=107) + predicate:((((hd_dep_count = 3) and (hd_vehicle_count <= 5)) or ((hd_dep_count = 0) and (hd_vehicle_count <= 2)) or ((hd_dep_count = 1) and (hd_vehicle_count <= 3))) and hd_demo_sk is not null) + TableScan [TS_3] (rows=7200 width=107) + default@household_demographics,household_demographics,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_dep_count","hd_vehicle_count"] + <-Reducer 60 [SIMPLE_EDGE] + SHUFFLE [RS_231] + Group By Operator [GBY_180] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Reducer 59 [SIMPLE_EDGE] + SHUFFLE [RS_179] + Group By Operator [GBY_178] (rows=1 width=8) + Output:["_col0"],aggregations:["count()"] + Merge Join Operator [MERGEJOIN_362] (rows=17424 width=471) + keys:{"0":"_col2","1":"_col0"} + <-Map 63 [SIMPLE_EDGE] + SHUFFLE [RS_175] + PartitionCols:_col0 + Select Operator [SEL_167] (rows=852 width=1910) + Output:["_col0"] + Filter Operator [FIL_337] (rows=852 width=1910) + predicate:((s_store_name = 'ese') and s_store_sk is not null) + TableScan [TS_165] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_store_name"] + <-Reducer 58 [SIMPLE_EDGE] + SHUFFLE [RS_174] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_361] (rows=15840 width=471) + Output:["_col2"],keys:{"0":"_col0","1":"_col0"} + <-Map 62 [SIMPLE_EDGE] + SHUFFLE [RS_172] + PartitionCols:_col0 + Select Operator [SEL_164] (rows=14400 width=471) + Output:["_col0"] + Filter Operator [FIL_336] (rows=14400 width=471) + predicate:(((t_minute >= 30) and (t_hour = 11)) and t_time_sk is not null) + TableScan [TS_162] (rows=86400 width=471) + default@time_dim,time_dim,Tbl:COMPLETE,Col:NONE,Output:["t_time_sk","t_hour","t_minute"] + <-Reducer 57 [SIMPLE_EDGE] + SHUFFLE [RS_171] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_360] (rows=3960 width=107) + Output:["_col0","_col2"],keys:{"0":"_col1","1":"_col0"} + <-Map 56 [SIMPLE_EDGE] + SHUFFLE [RS_168] + PartitionCols:_col1 + Select Operator [SEL_158] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_334] (rows=1 width=0) + predicate:((ss_hdemo_sk is not null and ss_sold_time_sk is not null) and ss_store_sk is not null) + TableScan [TS_156] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_time_sk","ss_hdemo_sk","ss_store_sk"] + <-Map 61 [SIMPLE_EDGE] + SHUFFLE [RS_169] + PartitionCols:_col0 + Select Operator [SEL_161] (rows=3600 width=107) + Output:["_col0"] + Filter Operator [FIL_335] (rows=3600 width=107) + predicate:((((hd_dep_count = 3) and (hd_vehicle_count <= 5)) or ((hd_dep_count = 0) and (hd_vehicle_count <= 2)) or ((hd_dep_count = 1) and (hd_vehicle_count <= 3))) and hd_demo_sk is not null) + TableScan [TS_159] (rows=7200 width=107) + default@household_demographics,household_demographics,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_dep_count","hd_vehicle_count"] + <-Reducer 68 [SIMPLE_EDGE] + SHUFFLE [RS_234] + Group By Operator [GBY_206] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Reducer 67 [SIMPLE_EDGE] + SHUFFLE [RS_205] + Group By Operator [GBY_204] (rows=1 width=8) + Output:["_col0"],aggregations:["count()"] + Merge Join Operator [MERGEJOIN_365] (rows=17424 width=471) + keys:{"0":"_col2","1":"_col0"} + <-Map 71 [SIMPLE_EDGE] + SHUFFLE [RS_201] + PartitionCols:_col0 + Select Operator [SEL_193] (rows=852 width=1910) + Output:["_col0"] + Filter Operator [FIL_341] (rows=852 width=1910) + predicate:((s_store_name = 'ese') and s_store_sk is not null) + TableScan [TS_191] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_store_name"] + <-Reducer 66 [SIMPLE_EDGE] + SHUFFLE [RS_200] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_364] (rows=15840 width=471) + Output:["_col2"],keys:{"0":"_col0","1":"_col0"} + <-Map 70 [SIMPLE_EDGE] + SHUFFLE [RS_198] + PartitionCols:_col0 + Select Operator [SEL_190] (rows=14400 width=471) + Output:["_col0"] + Filter Operator [FIL_340] (rows=14400 width=471) + predicate:(((t_hour = 12) and (t_minute < 30)) and t_time_sk is not null) + TableScan [TS_188] (rows=86400 width=471) + default@time_dim,time_dim,Tbl:COMPLETE,Col:NONE,Output:["t_time_sk","t_hour","t_minute"] + <-Reducer 65 [SIMPLE_EDGE] + SHUFFLE [RS_197] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_363] (rows=3960 width=107) + Output:["_col0","_col2"],keys:{"0":"_col1","1":"_col0"} + <-Map 64 [SIMPLE_EDGE] + SHUFFLE [RS_194] + PartitionCols:_col1 + Select Operator [SEL_184] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_338] (rows=1 width=0) + predicate:((ss_hdemo_sk is not null and ss_sold_time_sk is not null) and ss_store_sk is not null) + TableScan [TS_182] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_time_sk","ss_hdemo_sk","ss_store_sk"] + <-Map 69 [SIMPLE_EDGE] + SHUFFLE [RS_195] + PartitionCols:_col0 + Select Operator [SEL_187] (rows=3600 width=107) + Output:["_col0"] + Filter Operator [FIL_339] (rows=3600 width=107) + predicate:((((hd_dep_count = 3) and (hd_vehicle_count <= 5)) or ((hd_dep_count = 0) and (hd_vehicle_count <= 2)) or ((hd_dep_count = 1) and (hd_vehicle_count <= 3))) and hd_demo_sk is not null) + TableScan [TS_185] (rows=7200 width=107) + default@household_demographics,household_demographics,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_dep_count","hd_vehicle_count"] diff --git a/ql/src/test/results/clientpositive/perf/query89.q.out b/ql/src/test/results/clientpositive/perf/query89.q.out index ee9eabc..c9faccf 100644 --- a/ql/src/test/results/clientpositive/perf/query89.q.out +++ b/ql/src/test/results/clientpositive/perf/query89.q.out @@ -63,162 +63,87 @@ Reducer 6 <- Reducer 5 (SIMPLE_EDGE) Reducer 7 <- Reducer 6 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 7 - File Output Operator [FS_36] - compressed:false - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_35] - Number of rows:100 - Statistics:Num rows: 100 Data size: 143600 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_34] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - | Statistics:Num rows: 51243 Data size: 73599199 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_33] - key expressions:(_col6 - _col7) (type: decimal(22,6)), _col3 (type: string) - sort order:++ - Statistics:Num rows: 51243 Data size: 73599199 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col4 (type: string), _col5 (type: int), _col6 (type: decimal(17,2)), _col7 (type: decimal(21,6)) - Select Operator [SEL_30] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - Statistics:Num rows: 51243 Data size: 73599199 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_46] - predicate:(CASE WHEN ((avg_window_0 <> 0)) THEN ((abs((_col6 - avg_window_0)) / avg_window_0)) ELSE (null) END > 0.1) (type: boolean) - Statistics:Num rows: 51243 Data size: 73599199 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_29] - outputColumnNames:["avg_window_0","_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - Statistics:Num rows: 153730 Data size: 220799036 Basic stats: COMPLETE Column stats: NONE - PTF Operator [PTF_28] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col0, _col2, _col3, _col4","partition by:":"_col0, _col2, _col3, _col4"}] - Statistics:Num rows: 153730 Data size: 220799036 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_27] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 153730 Data size: 220799036 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_26] - key expressions:_col0 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string) - Map-reduce partition columns:_col0 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string) - sort order:++++ - Statistics:Num rows: 153730 Data size: 220799036 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string), _col5 (type: int), _col6 (type: decimal(17,2)) - Select Operator [SEL_25] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - Statistics:Num rows: 153730 Data size: 220799036 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_24] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: string), KEY._col3 (type: int), KEY._col4 (type: string), KEY._col5 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 153730 Data size: 220799036 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_23] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: int), _col4 (type: string), _col5 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: int), _col4 (type: string), _col5 (type: string) - sort order:++++++ - Statistics:Num rows: 307461 Data size: 441599510 Basic stats: COMPLETE Column stats: NONE - value expressions:_col6 (type: decimal(17,2)) - Group By Operator [GBY_22] - aggregations:["sum(_col7)"] - keys:_col1 (type: string), _col2 (type: string), _col3 (type: string), _col10 (type: int), _col12 (type: string), _col13 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - Statistics:Num rows: 307461 Data size: 441599510 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_21] - outputColumnNames:["_col1","_col2","_col3","_col10","_col12","_col13","_col7"] - Statistics:Num rows: 307461 Data size: 441599510 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_53] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col6 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3","_col7","_col10","_col12","_col13"] - | Statistics:Num rows: 307461 Data size: 441599510 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string) - | Select Operator [SEL_11] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_50] - | predicate:s_store_sk is not null (type: boolean) - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:store - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col6 (type: int) - Map-reduce partition columns:_col6 (type: int) - sort order:+ - Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string), _col2 (type: string), _col3 (type: string), _col7 (type: decimal(7,2)), _col10 (type: int) - Merge Join Operator [MERGEJOIN_52] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col4 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3","_col6","_col7","_col10"] - | Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_16] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col2 (type: int) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col2"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_49] - | predicate:((d_year) IN (2000) and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_15] - key expressions:_col4 (type: int) - Map-reduce partition columns:_col4 (type: int) - sort order:+ - Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string), _col2 (type: string), _col3 (type: string), _col6 (type: int), _col7 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_51] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col1 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3","_col4","_col6","_col7"] - | Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_12] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string), _col3 (type: string) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_47] - | predicate:((((((i_category) IN ('Home', 'Books', 'Electronics') and (i_class) IN ('wallpaper', 'parenting', 'musical')) or ((i_category) IN ('Shoes', 'Jewelry', 'Men') and (i_class) IN ('womens', 'birdal', 'pants'))) and ((i_category) IN ('Home', 'Books', 'Electronics') or (i_category) IN ('Shoes', 'Jewelry', 'Men'))) and ((i_class) IN ('wallpaper', 'parenting', 'musical') or (i_class) IN ('womens', 'birdal', 'pants'))) and i_item_sk is not null) (type: boolean) - | Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:item - | Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_13] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col0 (type: int), _col2 (type: int), _col3 (type: decimal(7,2)) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_48] - predicate:((ss_item_sk is not null and ss_sold_date_sk is not null) and ss_store_sk is not null) (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_3] - alias:store_sales - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 7 + File Output Operator [FS_36] + Limit [LIM_35] (rows=100 width=1436) + Number of rows:100 + Select Operator [SEL_34] (rows=51243 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_33] + Select Operator [SEL_30] (rows=51243 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] + Filter Operator [FIL_46] (rows=51243 width=1436) + predicate:(CASE WHEN ((avg_window_0 <> 0)) THEN ((abs((_col6 - avg_window_0)) / avg_window_0)) ELSE (null) END > 0.1) + Select Operator [SEL_29] (rows=153730 width=1436) + Output:["avg_window_0","_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + PTF Operator [PTF_28] (rows=153730 width=1436) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col0, _col2, _col3, _col4","partition by:":"_col0, _col2, _col3, _col4"}] + Select Operator [SEL_27] (rows=153730 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_26] + PartitionCols:_col0, _col2, _col3, _col4 + Select Operator [SEL_25] (rows=153730 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + Group By Operator [GBY_24] (rows=153730 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4, KEY._col5 + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_23] + PartitionCols:_col0, _col1, _col2, _col3, _col4, _col5 + Group By Operator [GBY_22] (rows=307461 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"],aggregations:["sum(_col7)"],keys:_col1, _col2, _col3, _col10, _col12, _col13 + Select Operator [SEL_21] (rows=307461 width=1436) + Output:["_col1","_col2","_col3","_col10","_col12","_col13","_col7"] + Merge Join Operator [MERGEJOIN_53] (rows=307461 width=1436) + Output:["_col1","_col2","_col3","_col7","_col10","_col12","_col13"],keys:{"0":"_col6","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=1704 width=1910) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_50] (rows=1704 width=1910) + predicate:s_store_sk is not null + TableScan [TS_9] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_store_name","s_company_name"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col6 + Merge Join Operator [MERGEJOIN_52] (rows=279510 width=1436) + Output:["_col1","_col2","_col3","_col6","_col7","_col10"],keys:{"0":"_col4","1":"_col0"} + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=36524 width=1119) + Output:["_col0","_col2"] + Filter Operator [FIL_49] (rows=36524 width=1119) + predicate:((d_year) IN (2000) and d_date_sk is not null) + TableScan [TS_6] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col4 + Merge Join Operator [MERGEJOIN_51] (rows=254100 width=1436) + Output:["_col1","_col2","_col3","_col4","_col6","_col7"],keys:{"0":"_col0","1":"_col1"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=231000 width=1436) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_47] (rows=231000 width=1436) + predicate:((((((i_category) IN ('Home', 'Books', 'Electronics') and (i_class) IN ('wallpaper', 'parenting', 'musical')) or ((i_category) IN ('Shoes', 'Jewelry', 'Men') and (i_class) IN ('womens', 'birdal', 'pants'))) and ((i_category) IN ('Home', 'Books', 'Electronics') or (i_category) IN ('Shoes', 'Jewelry', 'Men'))) and ((i_class) IN ('wallpaper', 'parenting', 'musical') or (i_class) IN ('womens', 'birdal', 'pants'))) and i_item_sk is not null) + TableScan [TS_0] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_brand","i_class","i_category"] + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col1 + Select Operator [SEL_5] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_48] (rows=1 width=0) + predicate:((ss_item_sk is not null and ss_sold_date_sk is not null) and ss_store_sk is not null) + TableScan [TS_3] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_store_sk","ss_sales_price"] diff --git a/ql/src/test/results/clientpositive/perf/query90.q.out b/ql/src/test/results/clientpositive/perf/query90.q.out index d34aaf4..d3bc278 100644 --- a/ql/src/test/results/clientpositive/perf/query90.q.out +++ b/ql/src/test/results/clientpositive/perf/query90.q.out @@ -18,243 +18,131 @@ Reducer 6 <- Reducer 15 (SIMPLE_EDGE), Reducer 5 (SIMPLE_EDGE) Reducer 7 <- Reducer 6 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 7 - File Output Operator [FS_60] - compressed:false - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_59] - Number of rows:100 - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_58] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_57] - key expressions:_col0 (type: decimal(35,20)) - sort order:+ - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_56] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_93] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{} - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 15 [SIMPLE_EDGE] - | Reduce Output Operator [RS_54] - | sort order: - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: bigint) - | Group By Operator [GBY_50] - | | aggregations:["count(VALUE._col0)"] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 14 [SIMPLE_EDGE] - | Reduce Output Operator [RS_49] - | sort order: - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: bigint) - | Group By Operator [GBY_48] - | aggregations:["count()"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_92] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | | Statistics:Num rows: 52272 Data size: 24620112 Basic stats: COMPLETE Column stats: NONE - | |<-Map 18 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_45] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 2301 Data size: 1348089 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_37] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 2301 Data size: 1348089 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_86] - | | predicate:(wp_char_count BETWEEN 5000 AND 5200 and wp_web_page_sk is not null) (type: boolean) - | | Statistics:Num rows: 2301 Data size: 1348089 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_35] - | | alias:web_page - | | Statistics:Num rows: 4602 Data size: 2696178 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 13 [SIMPLE_EDGE] - | Reduce Output Operator [RS_44] - | key expressions:_col2 (type: int) - | Map-reduce partition columns:_col2 (type: int) - | sort order:+ - | Statistics:Num rows: 47520 Data size: 22381920 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_91] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col2"] - | | Statistics:Num rows: 47520 Data size: 22381920 Basic stats: COMPLETE Column stats: NONE - | |<-Map 17 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_42] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 43200 Data size: 20347200 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_34] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 43200 Data size: 20347200 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_85] - | | predicate:(t_hour BETWEEN 14 AND 15 and t_time_sk is not null) (type: boolean) - | | Statistics:Num rows: 43200 Data size: 20347200 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_32] - | | alias:time_dim - | | Statistics:Num rows: 86400 Data size: 40694400 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 12 [SIMPLE_EDGE] - | Reduce Output Operator [RS_41] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 3960 Data size: 423720 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col2 (type: int) - | Merge Join Operator [MERGEJOIN_90] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col0","_col2"] - | | Statistics:Num rows: 3960 Data size: 423720 Basic stats: COMPLETE Column stats: NONE - | |<-Map 11 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_38] - | | key expressions:_col1 (type: int) - | | Map-reduce partition columns:_col1 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col0 (type: int), _col2 (type: int) - | | Select Operator [SEL_28] - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_83] - | | predicate:((ws_ship_hdemo_sk is not null and ws_sold_time_sk is not null) and ws_web_page_sk is not null) (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_26] - | | alias:web_sales - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 16 [SIMPLE_EDGE] - | Reduce Output Operator [RS_39] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_31] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_84] - | predicate:((hd_dep_count = 8) and hd_demo_sk is not null) (type: boolean) - | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_29] - | alias:household_demographics - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_53] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: bigint) - Group By Operator [GBY_24] - | aggregations:["count(VALUE._col0)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_23] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: bigint) - Group By Operator [GBY_22] - aggregations:["count()"] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_89] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | Statistics:Num rows: 52272 Data size: 24620112 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 2301 Data size: 1348089 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_11] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 2301 Data size: 1348089 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_82] - | predicate:(wp_char_count BETWEEN 5000 AND 5200 and wp_web_page_sk is not null) (type: boolean) - | Statistics:Num rows: 2301 Data size: 1348089 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:web_page - | Statistics:Num rows: 4602 Data size: 2696178 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 47520 Data size: 22381920 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_88] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col2"] - | Statistics:Num rows: 47520 Data size: 22381920 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_16] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 43200 Data size: 20347200 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_8] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 43200 Data size: 20347200 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_81] - | predicate:(t_time_sk is not null and t_hour BETWEEN 6 AND 7) (type: boolean) - | Statistics:Num rows: 43200 Data size: 20347200 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:time_dim - | Statistics:Num rows: 86400 Data size: 40694400 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_15] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 3960 Data size: 423720 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: int) - Merge Join Operator [MERGEJOIN_87] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2"] - | Statistics:Num rows: 3960 Data size: 423720 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_12] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col2 (type: int) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_79] - | predicate:((ws_ship_hdemo_sk is not null and ws_sold_time_sk is not null) and ws_web_page_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:web_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_13] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_80] - predicate:((hd_dep_count = 8) and hd_demo_sk is not null) (type: boolean) - Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:household_demographics - Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 7 + File Output Operator [FS_60] + Limit [LIM_59] (rows=1 width=8) + Number of rows:100 + Select Operator [SEL_58] (rows=1 width=8) + Output:["_col0"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_57] + Select Operator [SEL_56] (rows=1 width=8) + Output:["_col0"] + Merge Join Operator [MERGEJOIN_93] (rows=1 width=8) + Output:["_col0","_col1"],keys:{} + <-Reducer 15 [SIMPLE_EDGE] + SHUFFLE [RS_54] + Group By Operator [GBY_50] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Reducer 14 [SIMPLE_EDGE] + SHUFFLE [RS_49] + Group By Operator [GBY_48] (rows=1 width=8) + Output:["_col0"],aggregations:["count()"] + Merge Join Operator [MERGEJOIN_92] (rows=52272 width=471) + keys:{"0":"_col2","1":"_col0"} + <-Map 18 [SIMPLE_EDGE] + SHUFFLE [RS_45] + PartitionCols:_col0 + Select Operator [SEL_37] (rows=2301 width=585) + Output:["_col0"] + Filter Operator [FIL_86] (rows=2301 width=585) + predicate:(wp_char_count BETWEEN 5000 AND 5200 and wp_web_page_sk is not null) + TableScan [TS_35] (rows=4602 width=585) + default@web_page,web_page,Tbl:COMPLETE,Col:NONE,Output:["wp_web_page_sk","wp_char_count"] + <-Reducer 13 [SIMPLE_EDGE] + SHUFFLE [RS_44] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_91] (rows=47520 width=471) + Output:["_col2"],keys:{"0":"_col0","1":"_col0"} + <-Map 17 [SIMPLE_EDGE] + SHUFFLE [RS_42] + PartitionCols:_col0 + Select Operator [SEL_34] (rows=43200 width=471) + Output:["_col0"] + Filter Operator [FIL_85] (rows=43200 width=471) + predicate:(t_hour BETWEEN 14 AND 15 and t_time_sk is not null) + TableScan [TS_32] (rows=86400 width=471) + default@time_dim,time_dim,Tbl:COMPLETE,Col:NONE,Output:["t_time_sk","t_hour"] + <-Reducer 12 [SIMPLE_EDGE] + SHUFFLE [RS_41] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_90] (rows=3960 width=107) + Output:["_col0","_col2"],keys:{"0":"_col1","1":"_col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_38] + PartitionCols:_col1 + Select Operator [SEL_28] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_83] (rows=1 width=0) + predicate:((ws_ship_hdemo_sk is not null and ws_sold_time_sk is not null) and ws_web_page_sk is not null) + TableScan [TS_26] (rows=1 width=0) + default@web_sales,web_sales,Tbl:PARTIAL,Col:NONE,Output:["ws_sold_time_sk","ws_ship_hdemo_sk","ws_web_page_sk"] + <-Map 16 [SIMPLE_EDGE] + SHUFFLE [RS_39] + PartitionCols:_col0 + Select Operator [SEL_31] (rows=3600 width=107) + Output:["_col0"] + Filter Operator [FIL_84] (rows=3600 width=107) + predicate:((hd_dep_count = 8) and hd_demo_sk is not null) + TableScan [TS_29] (rows=7200 width=107) + default@household_demographics,household_demographics,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_dep_count"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_53] + Group By Operator [GBY_24] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_23] + Group By Operator [GBY_22] (rows=1 width=8) + Output:["_col0"],aggregations:["count()"] + Merge Join Operator [MERGEJOIN_89] (rows=52272 width=471) + keys:{"0":"_col2","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=2301 width=585) + Output:["_col0"] + Filter Operator [FIL_82] (rows=2301 width=585) + predicate:(wp_char_count BETWEEN 5000 AND 5200 and wp_web_page_sk is not null) + TableScan [TS_9] (rows=4602 width=585) + default@web_page,web_page,Tbl:COMPLETE,Col:NONE,Output:["wp_web_page_sk","wp_char_count"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_88] (rows=47520 width=471) + Output:["_col2"],keys:{"0":"_col0","1":"_col0"} + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=43200 width=471) + Output:["_col0"] + Filter Operator [FIL_81] (rows=43200 width=471) + predicate:(t_time_sk is not null and t_hour BETWEEN 6 AND 7) + TableScan [TS_6] (rows=86400 width=471) + default@time_dim,time_dim,Tbl:COMPLETE,Col:NONE,Output:["t_time_sk","t_hour"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_87] (rows=3960 width=107) + Output:["_col0","_col2"],keys:{"0":"_col1","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col1 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_79] (rows=1 width=0) + predicate:((ws_ship_hdemo_sk is not null and ws_sold_time_sk is not null) and ws_web_page_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@web_sales,web_sales,Tbl:PARTIAL,Col:NONE,Output:["ws_sold_time_sk","ws_ship_hdemo_sk","ws_web_page_sk"] + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=3600 width=107) + Output:["_col0"] + Filter Operator [FIL_80] (rows=3600 width=107) + predicate:((hd_dep_count = 8) and hd_demo_sk is not null) + TableScan [TS_3] (rows=7200 width=107) + default@household_demographics,household_demographics,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_dep_count"] diff --git a/ql/src/test/results/clientpositive/perf/query91.q.out b/ql/src/test/results/clientpositive/perf/query91.q.out index 54f58e4..943c79f 100644 --- a/ql/src/test/results/clientpositive/perf/query91.q.out +++ b/ql/src/test/results/clientpositive/perf/query91.q.out @@ -15,218 +15,114 @@ Reducer 8 <- Reducer 7 (SIMPLE_EDGE) Reducer 9 <- Reducer 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 9 - File Output Operator [FS_46] - compressed:false - Statistics:Num rows: 58564004 Data size: 50366227250 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_45] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 58564004 Data size: 50366227250 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_44] - key expressions:_col3 (type: decimal(17,2)) - sort order:- - Statistics:Num rows: 58564004 Data size: 50366227250 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string) - Select Operator [SEL_43] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 58564004 Data size: 50366227250 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_42] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: string), KEY._col3 (type: string), KEY._col4 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 58564004 Data size: 50366227250 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_41] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string), _col4 (type: string) - sort order:+++++ - Statistics:Num rows: 117128008 Data size: 100732454500 Basic stats: COMPLETE Column stats: NONE - value expressions:_col5 (type: decimal(17,2)) - Group By Operator [GBY_40] - aggregations:["sum(_col7)"] - keys:_col1 (type: string), _col2 (type: string), _col3 (type: string), _col18 (type: string), _col19 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 117128008 Data size: 100732454500 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_39] - outputColumnNames:["_col1","_col2","_col3","_col18","_col19","_col7"] - Statistics:Num rows: 117128008 Data size: 100732454500 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_86] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col13 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3","_col7","_col18","_col19"] - | Statistics:Num rows: 117128008 Data size: 100732454500 Basic stats: COMPLETE Column stats: NONE - |<-Map 15 [SIMPLE_EDGE] - | Reduce Output Operator [RS_37] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_20] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_80] - | predicate:(hd_demo_sk is not null and (hd_buy_potential like '0-500%')) (type: boolean) - | Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_18] - | alias:household_demographics - | Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_36] - key expressions:_col13 (type: int) - Map-reduce partition columns:_col13 (type: int) - sort order:+ - Statistics:Num rows: 106480005 Data size: 91574956652 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string), _col2 (type: string), _col3 (type: string), _col7 (type: decimal(7,2)), _col18 (type: string), _col19 (type: string) - Merge Join Operator [MERGEJOIN_85] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col12 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3","_col7","_col13","_col18","_col19"] - | Statistics:Num rows: 106480005 Data size: 91574956652 Basic stats: COMPLETE Column stats: NONE - |<-Map 14 [SIMPLE_EDGE] - | Reduce Output Operator [RS_34] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 9900 Data size: 3585529 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string) - | Select Operator [SEL_17] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 9900 Data size: 3585529 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_79] - | predicate:((((((cd_marital_status = 'M') and (cd_education_status = 'Unknown')) or ((cd_marital_status = 'W') and (cd_education_status = 'Advanced Degree'))) and ((cd_education_status = 'Unknown') or (cd_education_status = 'Advanced Degree'))) and ((cd_marital_status = 'M') or (cd_marital_status = 'W'))) and cd_demo_sk is not null) (type: boolean) - | Statistics:Num rows: 9900 Data size: 3585529 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_15] - | alias:customer_demographics - | Statistics:Num rows: 19800 Data size: 7171059 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_33] - key expressions:_col12 (type: int) - Map-reduce partition columns:_col12 (type: int) - sort order:+ - Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string), _col2 (type: string), _col3 (type: string), _col7 (type: decimal(7,2)), _col13 (type: int) - Merge Join Operator [MERGEJOIN_84] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col14 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3","_col7","_col12","_col13"] - | Statistics:Num rows: 96800003 Data size: 83249958789 Basic stats: COMPLETE Column stats: NONE - |<-Map 13 [SIMPLE_EDGE] - | Reduce Output Operator [RS_31] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_14] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_78] - | predicate:((ca_gmt_offset = -7) and ca_address_sk is not null) (type: boolean) - | Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_12] - | alias:customer_address - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_30] - key expressions:_col14 (type: int) - Map-reduce partition columns:_col14 (type: int) - sort order:+ - Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string), _col2 (type: string), _col3 (type: string), _col7 (type: decimal(7,2)), _col12 (type: int), _col13 (type: int) - Merge Join Operator [MERGEJOIN_83] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col5 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3","_col7","_col12","_col13","_col14"] - | Statistics:Num rows: 88000001 Data size: 75681779077 Basic stats: COMPLETE Column stats: NONE - |<-Map 12 [SIMPLE_EDGE] - | Reduce Output Operator [RS_28] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: int), _col2 (type: int), _col3 (type: int) - | Select Operator [SEL_11] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_77] - | predicate:(((c_customer_sk is not null and c_current_addr_sk is not null) and c_current_cdemo_sk is not null) and c_current_hdemo_sk is not null) (type: boolean) - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:customer - | Statistics:Num rows: 80000000 Data size: 68801615852 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_27] - key expressions:_col5 (type: int) - Map-reduce partition columns:_col5 (type: int) - sort order:+ - Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string), _col2 (type: string), _col3 (type: string), _col7 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_82] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col4 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3","_col5","_col7"] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_25] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_8] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_76] - | predicate:(((d_moy = 11) and d_date_sk is not null) and (d_year = 1999)) (type: boolean) - | Statistics:Num rows: 18262 Data size: 20435178 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_24] - key expressions:_col4 (type: int) - Map-reduce partition columns:_col4 (type: int) - sort order:+ - Statistics:Num rows: 66 Data size: 134970 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string), _col2 (type: string), _col3 (type: string), _col5 (type: int), _col7 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_81] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col2 (type: int)"} - | outputColumnNames:["_col1","_col2","_col3","_col4","_col5","_col7"] - | Statistics:Num rows: 66 Data size: 134970 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_21] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 60 Data size: 122700 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string), _col3 (type: string) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 60 Data size: 122700 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_74] - | predicate:cc_call_center_sk is not null (type: boolean) - | Statistics:Num rows: 60 Data size: 122700 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:call_center - | Statistics:Num rows: 60 Data size: 122700 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - Reduce Output Operator [RS_22] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col0 (type: int), _col1 (type: int), _col3 (type: decimal(7,2)) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_75] - predicate:((cr_call_center_sk is not null and cr_returned_date_sk is not null) and cr_returning_customer_sk is not null) (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_3] - alias:catalog_returns - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 9 + File Output Operator [FS_46] + Select Operator [SEL_45] (rows=58564004 width=860) + Output:["_col0","_col1","_col2","_col3"] + <-Reducer 8 [SIMPLE_EDGE] + SHUFFLE [RS_44] + Select Operator [SEL_43] (rows=58564004 width=860) + Output:["_col0","_col1","_col2","_col3"] + Group By Operator [GBY_42] (rows=58564004 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4 + <-Reducer 7 [SIMPLE_EDGE] + SHUFFLE [RS_41] + PartitionCols:_col0, _col1, _col2, _col3, _col4 + Group By Operator [GBY_40] (rows=117128008 width=860) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["sum(_col7)"],keys:_col1, _col2, _col3, _col18, _col19 + Select Operator [SEL_39] (rows=117128008 width=860) + Output:["_col1","_col2","_col3","_col18","_col19","_col7"] + Merge Join Operator [MERGEJOIN_86] (rows=117128008 width=860) + Output:["_col1","_col2","_col3","_col7","_col18","_col19"],keys:{"0":"_col13","1":"_col0"} + <-Map 15 [SIMPLE_EDGE] + SHUFFLE [RS_37] + PartitionCols:_col0 + Select Operator [SEL_20] (rows=3600 width=107) + Output:["_col0"] + Filter Operator [FIL_80] (rows=3600 width=107) + predicate:(hd_demo_sk is not null and (hd_buy_potential like '0-500%')) + TableScan [TS_18] (rows=7200 width=107) + default@household_demographics,household_demographics,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_buy_potential"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_36] + PartitionCols:_col13 + Merge Join Operator [MERGEJOIN_85] (rows=106480005 width=860) + Output:["_col1","_col2","_col3","_col7","_col13","_col18","_col19"],keys:{"0":"_col12","1":"_col0"} + <-Map 14 [SIMPLE_EDGE] + SHUFFLE [RS_34] + PartitionCols:_col0 + Select Operator [SEL_17] (rows=9900 width=362) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_79] (rows=9900 width=362) + predicate:((((((cd_marital_status = 'M') and (cd_education_status = 'Unknown')) or ((cd_marital_status = 'W') and (cd_education_status = 'Advanced Degree'))) and ((cd_education_status = 'Unknown') or (cd_education_status = 'Advanced Degree'))) and ((cd_marital_status = 'M') or (cd_marital_status = 'W'))) and cd_demo_sk is not null) + TableScan [TS_15] (rows=19800 width=362) + default@customer_demographics,customer_demographics,Tbl:COMPLETE,Col:NONE,Output:["cd_demo_sk","cd_marital_status","cd_education_status"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_33] + PartitionCols:_col12 + Merge Join Operator [MERGEJOIN_84] (rows=96800003 width=860) + Output:["_col1","_col2","_col3","_col7","_col12","_col13"],keys:{"0":"_col14","1":"_col0"} + <-Map 13 [SIMPLE_EDGE] + SHUFFLE [RS_31] + PartitionCols:_col0 + Select Operator [SEL_14] (rows=20000000 width=1014) + Output:["_col0"] + Filter Operator [FIL_78] (rows=20000000 width=1014) + predicate:((ca_gmt_offset = -7) and ca_address_sk is not null) + TableScan [TS_12] (rows=40000000 width=1014) + default@customer_address,customer_address,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_gmt_offset"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_30] + PartitionCols:_col14 + Merge Join Operator [MERGEJOIN_83] (rows=88000001 width=860) + Output:["_col1","_col2","_col3","_col7","_col12","_col13","_col14"],keys:{"0":"_col5","1":"_col0"} + <-Map 12 [SIMPLE_EDGE] + SHUFFLE [RS_28] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=80000000 width=860) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_77] (rows=80000000 width=860) + predicate:(((c_customer_sk is not null and c_current_addr_sk is not null) and c_current_cdemo_sk is not null) and c_current_hdemo_sk is not null) + TableScan [TS_9] (rows=80000000 width=860) + default@customer,customer,Tbl:COMPLETE,Col:NONE,Output:["c_customer_sk","c_current_cdemo_sk","c_current_hdemo_sk","c_current_addr_sk"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_27] + PartitionCols:_col5 + Merge Join Operator [MERGEJOIN_82] (rows=20088 width=1119) + Output:["_col1","_col2","_col3","_col5","_col7"],keys:{"0":"_col4","1":"_col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=18262 width=1119) + Output:["_col0"] + Filter Operator [FIL_76] (rows=18262 width=1119) + predicate:(((d_moy = 11) and d_date_sk is not null) and (d_year = 1999)) + TableScan [TS_6] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_year","d_moy"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_24] + PartitionCols:_col4 + Merge Join Operator [MERGEJOIN_81] (rows=66 width=2045) + Output:["_col1","_col2","_col3","_col4","_col5","_col7"],keys:{"0":"_col0","1":"_col2"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_21] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=60 width=2045) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_74] (rows=60 width=2045) + predicate:cc_call_center_sk is not null + TableScan [TS_0] (rows=60 width=2045) + default@call_center,call_center,Tbl:COMPLETE,Col:NONE,Output:["cc_call_center_sk","cc_call_center_id","cc_name","cc_manager"] + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_22] + PartitionCols:_col2 + Select Operator [SEL_5] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_75] (rows=1 width=0) + predicate:((cr_call_center_sk is not null and cr_returned_date_sk is not null) and cr_returning_customer_sk is not null) + TableScan [TS_3] (rows=1 width=0) + default@catalog_returns,catalog_returns,Tbl:PARTIAL,Col:NONE,Output:["cr_returned_date_sk","cr_returning_customer_sk","cr_call_center_sk","cr_net_loss"] diff --git a/ql/src/test/results/clientpositive/perf/query92.q.out b/ql/src/test/results/clientpositive/perf/query92.q.out index 6fb2133..d8b3146 100644 --- a/ql/src/test/results/clientpositive/perf/query92.q.out +++ b/ql/src/test/results/clientpositive/perf/query92.q.out @@ -13,148 +13,81 @@ Reducer 8 <- Map 10 (SIMPLE_EDGE), Map 7 (SIMPLE_EDGE) Reducer 9 <- Reducer 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 5 - File Output Operator [FS_37] - compressed:false - Statistics:Num rows: 1 Data size: 24 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_35] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 24 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_34] - sort order: - Statistics:Num rows: 1 Data size: 24 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: bigint), _col1 (type: bigint), _col2 (type: bigint) - Group By Operator [GBY_33] - aggregations:["sum(_col0)","sum(_col1)","sum(_col2)"] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 24 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_31] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 4909 Data size: 5493875 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_48] - | condition map:[{"":"Outer Join 0 to 1"}] - | keys:{"0":"_col0 (type: int), _col1 (type: int)","1":"_col0 (type: int), _col1 (type: int)"} - | outputColumnNames:["_col0","_col2"] - | Statistics:Num rows: 4909 Data size: 5493875 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - | Reduce Output Operator [RS_28] - | key expressions:_col0 (type: int), _col1 (type: int) - | Map-reduce partition columns:_col0 (type: int), _col1 (type: int) - | sort order:++ - | Statistics:Num rows: 4463 Data size: 4994432 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_13] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 4463 Data size: 4994432 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_12] - | | keys:KEY._col0 (type: int), KEY._col1 (type: int) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 4463 Data size: 4994432 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 2 [SIMPLE_EDGE] - | Reduce Output Operator [RS_11] - | key expressions:_col0 (type: int), _col1 (type: int) - | Map-reduce partition columns:_col0 (type: int), _col1 (type: int) - | sort order:++ - | Statistics:Num rows: 8927 Data size: 9989984 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_10] - | keys:_col1 (type: int), _col2 (type: int) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 8927 Data size: 9989984 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_46] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col2"] - | | Statistics:Num rows: 8927 Data size: 9989984 Basic stats: COMPLETE Column stats: NONE - | |<-Map 1 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_6] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col1 (type: int), _col2 (type: int) - | | Select Operator [SEL_2] - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_42] - | | predicate:ss_sold_date_sk is not null (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_0] - | | alias:ss - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 6 [SIMPLE_EDGE] - | Reduce Output Operator [RS_7] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 8116 Data size: 9081804 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_5] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 8116 Data size: 9081804 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_43] - | predicate:(((d_month_seq <= 1217) and d_date_sk is not null) and (d_month_seq >= 1206)) (type: boolean) - | Statistics:Num rows: 8116 Data size: 9081804 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_3] - | alias:d1 - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 9 [SIMPLE_EDGE] - Reduce Output Operator [RS_29] - key expressions:_col0 (type: int), _col1 (type: int) - Map-reduce partition columns:_col0 (type: int), _col1 (type: int) - sort order:++ - Statistics:Num rows: 4463 Data size: 4994432 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_26] - | keys:KEY._col0 (type: int), KEY._col1 (type: int) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 4463 Data size: 4994432 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_25] - key expressions:_col0 (type: int), _col1 (type: int) - Map-reduce partition columns:_col0 (type: int), _col1 (type: int) - sort order:++ - Statistics:Num rows: 8927 Data size: 9989984 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_24] - keys:_col1 (type: int), _col2 (type: int) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 8927 Data size: 9989984 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_47] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2"] - | Statistics:Num rows: 8927 Data size: 9989984 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_21] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 8116 Data size: 9081804 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_19] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 8116 Data size: 9081804 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_45] - | predicate:(((d_month_seq <= 1217) and d_date_sk is not null) and (d_month_seq >= 1206)) (type: boolean) - | Statistics:Num rows: 8116 Data size: 9081804 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_17] - | alias:d1 - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_20] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col1 (type: int), _col2 (type: int) - Select Operator [SEL_16] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_44] - predicate:cs_sold_date_sk is not null (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_14] - alias:cs - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 5 + File Output Operator [FS_37] + Group By Operator [GBY_35] (rows=1 width=24) + Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_34] + Group By Operator [GBY_33] (rows=1 width=24) + Output:["_col0","_col1","_col2"],aggregations:["sum(_col0)","sum(_col1)","sum(_col2)"] + Select Operator [SEL_31] (rows=4909 width=1119) + Output:["_col0","_col1","_col2"] + Merge Join Operator [MERGEJOIN_48] (rows=4909 width=1119) + Output:["_col0","_col2"],keys:{"0":"_col0, _col1","1":"_col0, _col1"} + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_28] + PartitionCols:_col0, _col1 + Select Operator [SEL_13] (rows=4463 width=1119) + Output:["_col0","_col1"] + Group By Operator [GBY_12] (rows=4463 width=1119) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_11] + PartitionCols:_col0, _col1 + Group By Operator [GBY_10] (rows=8927 width=1119) + Output:["_col0","_col1"],keys:_col1, _col2 + Merge Join Operator [MERGEJOIN_46] (rows=8927 width=1119) + Output:["_col1","_col2"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_6] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_42] (rows=1 width=0) + predicate:ss_sold_date_sk is not null + TableScan [TS_0] (rows=1 width=0) + default@store_sales,ss,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_customer_sk"] + <-Map 6 [SIMPLE_EDGE] + SHUFFLE [RS_7] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=8116 width=1119) + Output:["_col0"] + Filter Operator [FIL_43] (rows=8116 width=1119) + predicate:(((d_month_seq <= 1217) and d_date_sk is not null) and (d_month_seq >= 1206)) + TableScan [TS_3] (rows=73049 width=1119) + default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_month_seq"] + <-Reducer 9 [SIMPLE_EDGE] + SHUFFLE [RS_29] + PartitionCols:_col0, _col1 + Group By Operator [GBY_26] (rows=4463 width=1119) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Reducer 8 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col0, _col1 + Group By Operator [GBY_24] (rows=8927 width=1119) + Output:["_col0","_col1"],keys:_col1, _col2 + Merge Join Operator [MERGEJOIN_47] (rows=8927 width=1119) + Output:["_col1","_col2"],keys:{"0":"_col0","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_21] + PartitionCols:_col0 + Select Operator [SEL_19] (rows=8116 width=1119) + Output:["_col0"] + Filter Operator [FIL_45] (rows=8116 width=1119) + predicate:(((d_month_seq <= 1217) and d_date_sk is not null) and (d_month_seq >= 1206)) + TableScan [TS_17] (rows=73049 width=1119) + default@date_dim,d1,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_month_seq"] + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_20] + PartitionCols:_col0 + Select Operator [SEL_16] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_44] (rows=1 width=0) + predicate:cs_sold_date_sk is not null + TableScan [TS_14] (rows=1 width=0) + default@catalog_sales,cs,Tbl:PARTIAL,Col:NONE,Output:["cs_sold_date_sk","cs_bill_customer_sk","cs_item_sk"] diff --git a/ql/src/test/results/clientpositive/perf/query93.q.out b/ql/src/test/results/clientpositive/perf/query93.q.out index 5255145..2f8248a 100644 --- a/ql/src/test/results/clientpositive/perf/query93.q.out +++ b/ql/src/test/results/clientpositive/perf/query93.q.out @@ -11,104 +11,56 @@ Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 5 - File Output Operator [FS_23] - compressed:false - Statistics:Num rows: 19 Data size: 3858 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_22] - Number of rows:100 - Statistics:Num rows: 19 Data size: 3858 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_21] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 19 Data size: 3858 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_20] - key expressions:_col1 (type: decimal(28,2)), _col0 (type: int) - sort order:++ - Statistics:Num rows: 19 Data size: 3858 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_18] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: int) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 19 Data size: 3858 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_17] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 39 Data size: 7920 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: decimal(28,2)) - Group By Operator [GBY_16] - aggregations:["sum(_col1)"] - keys:_col0 (type: int) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 39 Data size: 7920 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_14] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 39 Data size: 7920 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_33] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col6 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col3","_col4","_col8"] - | Statistics:Num rows: 39 Data size: 7920 Basic stats: COMPLETE Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - | Reduce Output Operator [RS_12] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36 Data size: 7200 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_7] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36 Data size: 7200 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_31] - | predicate:((r_reason_desc = 'Did not like the warranty') and r_reason_sk is not null) (type: boolean) - | Statistics:Num rows: 36 Data size: 7200 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_5] - | alias:reason - | Statistics:Num rows: 72 Data size: 14400 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_11] - key expressions:_col6 (type: int) - Map-reduce partition columns:_col6 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col1 (type: int), _col3 (type: int), _col4 (type: decimal(7,2)), _col8 (type: int) - Merge Join Operator [MERGEJOIN_32] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int), _col2 (type: int)","1":"_col0 (type: int), _col2 (type: int)"} - | outputColumnNames:["_col1","_col3","_col4","_col6","_col8"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_8] - | key expressions:_col0 (type: int), _col2 (type: int) - | Map-reduce partition columns:_col0 (type: int), _col2 (type: int) - | sort order:++ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col1 (type: int), _col3 (type: int), _col4 (type: decimal(7,2)) - | Select Operator [SEL_1] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_9] - key expressions:_col0 (type: int), _col2 (type: int) - Map-reduce partition columns:_col0 (type: int), _col2 (type: int) - sort order:++ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col1 (type: int), _col3 (type: int) - Select Operator [SEL_4] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_30] - predicate:sr_reason_sk is not null (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_2] - alias:store_returns - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 5 + File Output Operator [FS_23] + Limit [LIM_22] (rows=19 width=203) + Number of rows:100 + Select Operator [SEL_21] (rows=19 width=203) + Output:["_col0","_col1"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_20] + Group By Operator [GBY_18] (rows=19 width=203) + Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0 + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_17] + PartitionCols:_col0 + Group By Operator [GBY_16] (rows=39 width=203) + Output:["_col0","_col1"],aggregations:["sum(_col1)"],keys:_col0 + Select Operator [SEL_14] (rows=39 width=203) + Output:["_col0","_col1"] + Merge Join Operator [MERGEJOIN_33] (rows=39 width=203) + Output:["_col1","_col3","_col4","_col8"],keys:{"0":"_col6","1":"_col0"} + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col0 + Select Operator [SEL_7] (rows=36 width=200) + Output:["_col0"] + Filter Operator [FIL_31] (rows=36 width=200) + predicate:((r_reason_desc = 'Did not like the warranty') and r_reason_sk is not null) + TableScan [TS_5] (rows=72 width=200) + default@reason,reason,Tbl:COMPLETE,Col:NONE,Output:["r_reason_sk","r_reason_desc"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_11] + PartitionCols:_col6 + Merge Join Operator [MERGEJOIN_32] (rows=1 width=0) + Output:["_col1","_col3","_col4","_col6","_col8"],keys:{"0":"_col0, _col2","1":"_col0, _col2"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_8] + PartitionCols:_col0, _col2 + Select Operator [SEL_1] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4"] + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_item_sk","ss_customer_sk","ss_ticket_number","ss_quantity","ss_sales_price"] + <-Map 6 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col0, _col2 + Select Operator [SEL_4] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_30] (rows=1 width=0) + predicate:sr_reason_sk is not null + TableScan [TS_2] (rows=1 width=0) + default@store_returns,store_returns,Tbl:PARTIAL,Col:NONE,Output:["sr_item_sk","sr_reason_sk","sr_ticket_number","sr_return_quantity"] diff --git a/ql/src/test/results/clientpositive/perf/query94.q.out b/ql/src/test/results/clientpositive/perf/query94.q.out index 0357835..ddeec2b 100644 --- a/ql/src/test/results/clientpositive/perf/query94.q.out +++ b/ql/src/test/results/clientpositive/perf/query94.q.out @@ -14,215 +14,115 @@ Reducer 7 <- Reducer 6 (SIMPLE_EDGE) Reducer 9 <- Map 10 (SIMPLE_EDGE), Map 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 7 - File Output Operator [FS_49] - compressed:false - Statistics:Num rows: 1 Data size: 344 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_48] - Number of rows:100 - Statistics:Num rows: 1 Data size: 344 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_46] - | aggregations:["count(DISTINCT KEY._col0:0._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 344 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_45] - key expressions:_col0 (type: int) - sort order:+ - Statistics:Num rows: 14641000 Data size: 14858857641 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: decimal(17,2)), _col3 (type: decimal(17,2)) - Group By Operator [GBY_44] - aggregations:["count(DISTINCT _col3)","sum(_col4)","sum(_col5)"] - keys:_col3 (type: int) - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 14641000 Data size: 14858857641 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_43] - outputColumnNames:["_col3","_col4","_col5"] - Statistics:Num rows: 14641000 Data size: 14858857641 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_42] - predicate:_col12 is null (type: boolean) - Statistics:Num rows: 14641000 Data size: 14858857641 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_83] - | condition map:[{"":"Left Outer Join0 to 1"}] - | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col3","_col4","_col5","_col12"] - | Statistics:Num rows: 29282000 Data size: 29717715282 Basic stats: COMPLETE Column stats: NONE - |<-Map 14 [SIMPLE_EDGE] - | Reduce Output Operator [RS_40] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Select Operator [SEL_24] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_23] - | alias:wr1 - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_39] - key expressions:_col3 (type: int) - Map-reduce partition columns:_col3 (type: int) - sort order:+ - Statistics:Num rows: 26620000 Data size: 27016104217 Basic stats: COMPLETE Column stats: NONE - value expressions:_col4 (type: decimal(7,2)), _col5 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_82] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col3","_col4","_col5"] - | Statistics:Num rows: 26620000 Data size: 27016104217 Basic stats: COMPLETE Column stats: NONE - |<-Map 13 [SIMPLE_EDGE] - | Reduce Output Operator [RS_37] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_22] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_76] - | predicate:(d_date BETWEEN '1999-05-01' AND '1999-07-01' and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_20] - | alias:d - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_36] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 24200000 Data size: 24560094211 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: int), _col4 (type: decimal(7,2)), _col5 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_81] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col3","_col4","_col5"] - | Statistics:Num rows: 24200000 Data size: 24560094211 Basic stats: COMPLETE Column stats: NONE - |<-Map 12 [SIMPLE_EDGE] - | Reduce Output Operator [RS_34] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 42 Data size: 77704 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_19] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 42 Data size: 77704 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_75] - | predicate:((web_company_name = 'pri') and web_site_sk is not null) (type: boolean) - | Statistics:Num rows: 42 Data size: 77704 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_17] - | alias:s - | Statistics:Num rows: 84 Data size: 155408 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_33] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col3 (type: int), _col4 (type: decimal(7,2)), _col5 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_80] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_31] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_16] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_74] - | predicate:((ca_state = 'TX') and ca_address_sk is not null) (type: boolean) - | Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_14] - | alias:ca - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_30] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col0 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: decimal(7,2)), _col5 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_79] - | condition map:[{"":"Left Semi Join 0 to 1"}] - | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_27] - | key expressions:_col3 (type: int) - | Map-reduce partition columns:_col3 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col4 (type: decimal(7,2)), _col5 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_71] - | predicate:(((ws_ship_addr_sk is not null and ws_web_site_sk is not null) and ws_ship_date_sk is not null) and ws_order_number is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:ws1 - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Reducer 9 [SIMPLE_EDGE] - Reduce Output Operator [RS_28] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Group By Operator [GBY_26] - keys:_col0 (type: int) - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Select Operator [SEL_13] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_12] - predicate:(_col0 <> _col2) (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Merge Join Operator [MERGEJOIN_78] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col1 (type: int)"} - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_10] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_73] - | predicate:ws_order_number is not null (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_6] - | alias:ws1 - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_9] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col0 (type: int) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_72] - predicate:ws_order_number is not null (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_3] - alias:ws1 - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 7 + File Output Operator [FS_49] + Limit [LIM_48] (rows=1 width=344) + Number of rows:100 + Group By Operator [GBY_46] (rows=1 width=344) + Output:["_col0","_col1","_col2"],aggregations:["count(DISTINCT KEY._col0:0._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_45] + Group By Operator [GBY_44] (rows=14641000 width=1014) + Output:["_col0","_col1","_col2","_col3"],aggregations:["count(DISTINCT _col3)","sum(_col4)","sum(_col5)"],keys:_col3 + Select Operator [SEL_43] (rows=14641000 width=1014) + Output:["_col3","_col4","_col5"] + Filter Operator [FIL_42] (rows=14641000 width=1014) + predicate:_col12 is null + Merge Join Operator [MERGEJOIN_83] (rows=29282000 width=1014) + Output:["_col3","_col4","_col5","_col12"],keys:{"0":"_col3","1":"_col0"} + <-Map 14 [SIMPLE_EDGE] + SHUFFLE [RS_40] + PartitionCols:_col0 + Select Operator [SEL_24] (rows=1 width=0) + Output:["_col0"] + TableScan [TS_23] (rows=1 width=0) + default@web_returns,wr1,Tbl:PARTIAL,Col:NONE,Output:["wr_order_number"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_39] + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_82] (rows=26620000 width=1014) + Output:["_col3","_col4","_col5"],keys:{"0":"_col0","1":"_col0"} + <-Map 13 [SIMPLE_EDGE] + SHUFFLE [RS_37] + PartitionCols:_col0 + Select Operator [SEL_22] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_76] (rows=36524 width=1119) + predicate:(d_date BETWEEN '1999-05-01' AND '1999-07-01' and d_date_sk is not null) + TableScan [TS_20] (rows=73049 width=1119) + default@date_dim,d,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_36] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_81] (rows=24200000 width=1014) + Output:["_col0","_col3","_col4","_col5"],keys:{"0":"_col2","1":"_col0"} + <-Map 12 [SIMPLE_EDGE] + SHUFFLE [RS_34] + PartitionCols:_col0 + Select Operator [SEL_19] (rows=42 width=1850) + Output:["_col0"] + Filter Operator [FIL_75] (rows=42 width=1850) + predicate:((web_company_name = 'pri') and web_site_sk is not null) + TableScan [TS_17] (rows=84 width=1850) + default@web_site,s,Tbl:COMPLETE,Col:NONE,Output:["web_site_sk","web_company_name"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_33] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_80] (rows=22000000 width=1014) + Output:["_col0","_col2","_col3","_col4","_col5"],keys:{"0":"_col1","1":"_col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_31] + PartitionCols:_col0 + Select Operator [SEL_16] (rows=20000000 width=1014) + Output:["_col0"] + Filter Operator [FIL_74] (rows=20000000 width=1014) + predicate:((ca_state = 'TX') and ca_address_sk is not null) + TableScan [TS_14] (rows=40000000 width=1014) + default@customer_address,ca,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_state"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_30] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_79] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],keys:{"0":"_col3","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_27] + PartitionCols:_col3 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Filter Operator [FIL_71] (rows=1 width=0) + predicate:(((ws_ship_addr_sk is not null and ws_web_site_sk is not null) and ws_ship_date_sk is not null) and ws_order_number is not null) + TableScan [TS_0] (rows=1 width=0) + default@web_sales,ws1,Tbl:PARTIAL,Col:NONE,Output:["ws_ship_date_sk","ws_ship_addr_sk","ws_web_site_sk","ws_order_number","ws_ext_ship_cost","ws_net_profit"] + <-Reducer 9 [SIMPLE_EDGE] + SHUFFLE [RS_28] + PartitionCols:_col0 + Group By Operator [GBY_26] (rows=1 width=0) + Output:["_col0"],keys:_col0 + Select Operator [SEL_13] (rows=1 width=0) + Output:["_col0"] + Filter Operator [FIL_12] (rows=1 width=0) + predicate:(_col0 <> _col2) + Merge Join Operator [MERGEJOIN_78] (rows=1 width=0) + Output:["_col0","_col1","_col2"],keys:{"0":"_col1","1":"_col1"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_10] + PartitionCols:_col1 + Select Operator [SEL_8] (rows=1 width=0) + Output:["_col0","_col1"] + Filter Operator [FIL_73] (rows=1 width=0) + predicate:ws_order_number is not null + TableScan [TS_6] (rows=1 width=0) + default@web_sales,ws1,Tbl:PARTIAL,Col:NONE,Output:["ws_warehouse_sk","ws_order_number"] + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col1 + Select Operator [SEL_5] (rows=1 width=0) + Output:["_col0","_col1"] + Filter Operator [FIL_72] (rows=1 width=0) + predicate:ws_order_number is not null + TableScan [TS_3] (rows=1 width=0) + default@web_sales,ws1,Tbl:PARTIAL,Col:NONE,Output:["ws_warehouse_sk","ws_order_number"] diff --git a/ql/src/test/results/clientpositive/perf/query95.q.out b/ql/src/test/results/clientpositive/perf/query95.q.out index a7c6a98..3088a7a 100644 --- a/ql/src/test/results/clientpositive/perf/query95.q.out +++ b/ql/src/test/results/clientpositive/perf/query95.q.out @@ -15,261 +15,140 @@ Reducer 6 <- Reducer 5 (SIMPLE_EDGE) Reducer 8 <- Map 7 (SIMPLE_EDGE), Map 9 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 6 - File Output Operator [FS_63] - compressed:false - Statistics:Num rows: 1 Data size: 344 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_61] - | aggregations:["count(DISTINCT KEY._col0:0._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 344 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_60] - key expressions:_col0 (type: int) - sort order:+ - Statistics:Num rows: 26620000 Data size: 27016104217 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: decimal(17,2)), _col3 (type: decimal(17,2)) - Group By Operator [GBY_59] - aggregations:["count(DISTINCT _col3)","sum(_col4)","sum(_col5)"] - keys:_col3 (type: int) - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 26620000 Data size: 27016104217 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_122] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col3","_col4","_col5"] - | Statistics:Num rows: 26620000 Data size: 27016104217 Basic stats: COMPLETE Column stats: NONE - |<-Map 17 [SIMPLE_EDGE] - | Reduce Output Operator [RS_56] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_40] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_115] - | predicate:(d_date BETWEEN '2002-05-01' AND '2002-06-30' and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_38] - | alias:d - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_55] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 24200000 Data size: 24560094211 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: int), _col4 (type: decimal(7,2)), _col5 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_121] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col3","_col4","_col5"] - | Statistics:Num rows: 24200000 Data size: 24560094211 Basic stats: COMPLETE Column stats: NONE - |<-Map 16 [SIMPLE_EDGE] - | Reduce Output Operator [RS_53] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 42 Data size: 77704 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_37] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 42 Data size: 77704 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_114] - | predicate:((web_company_name = 'pri') and web_site_sk is not null) (type: boolean) - | Statistics:Num rows: 42 Data size: 77704 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_35] - | alias:s - | Statistics:Num rows: 84 Data size: 155408 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_52] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col3 (type: int), _col4 (type: decimal(7,2)), _col5 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_120] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 22000000 Data size: 22327357890 Basic stats: COMPLETE Column stats: NONE - |<-Map 15 [SIMPLE_EDGE] - | Reduce Output Operator [RS_50] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_34] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_113] - | predicate:((ca_state = 'GA') and ca_address_sk is not null) (type: boolean) - | Statistics:Num rows: 20000000 Data size: 20297597642 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_32] - | alias:ca - | Statistics:Num rows: 40000000 Data size: 40595195284 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_49] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 2 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col0 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: decimal(7,2)), _col5 (type: decimal(7,2)) - Merge Join Operator [MERGEJOIN_119] - | condition map:[{"":"Left Semi Join 0 to 1"},{"":"Left Semi Join 0 to 2"}] - | keys:{"0":"_col3 (type: int)","1":"_col0 (type: int)","2":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 2 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_45] - | key expressions:_col3 (type: int) - | Map-reduce partition columns:_col3 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col1 (type: int), _col2 (type: int), _col4 (type: decimal(7,2)), _col5 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_107] - | predicate:(((ws_ship_addr_sk is not null and ws_web_site_sk is not null) and ws_ship_date_sk is not null) and ws_order_number is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:ws1 - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Reducer 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_47] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Group By Operator [GBY_44] - | keys:_col0 (type: int) - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Merge Join Operator [MERGEJOIN_118] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 10 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_28] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Select Operator [SEL_16] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_110] - | | predicate:wr_order_number is not null (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_14] - | | alias:wr - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Reducer 13 [SIMPLE_EDGE] - | Reduce Output Operator [RS_29] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Select Operator [SEL_27] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_26] - | predicate:(_col0 <> _col2) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Merge Join Operator [MERGEJOIN_117] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: int)","1":"_col1 (type: int)"} - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 12 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_23] - | | key expressions:_col1 (type: int) - | | Map-reduce partition columns:_col1 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col0 (type: int) - | | Select Operator [SEL_19] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_111] - | | predicate:ws_order_number is not null (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_17] - | | alias:ws1 - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 14 [SIMPLE_EDGE] - | Reduce Output Operator [RS_24] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int) - | Select Operator [SEL_22] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_112] - | predicate:ws_order_number is not null (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_20] - | alias:ws1 - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Reducer 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_46] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Group By Operator [GBY_42] - keys:_col0 (type: int) - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Select Operator [SEL_13] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_12] - predicate:(_col0 <> _col2) (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Merge Join Operator [MERGEJOIN_116] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col1 (type: int)"} - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - | Reduce Output Operator [RS_9] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int) - | Select Operator [SEL_5] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_108] - | predicate:ws_order_number is not null (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_3] - | alias:ws1 - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - key expressions:_col1 (type: int) - Map-reduce partition columns:_col1 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col0 (type: int) - Select Operator [SEL_8] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_109] - predicate:ws_order_number is not null (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_6] - alias:ws1 - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 6 + File Output Operator [FS_63] + Group By Operator [GBY_61] (rows=1 width=344) + Output:["_col0","_col1","_col2"],aggregations:["count(DISTINCT KEY._col0:0._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_60] + Group By Operator [GBY_59] (rows=26620000 width=1014) + Output:["_col0","_col1","_col2","_col3"],aggregations:["count(DISTINCT _col3)","sum(_col4)","sum(_col5)"],keys:_col3 + Merge Join Operator [MERGEJOIN_122] (rows=26620000 width=1014) + Output:["_col3","_col4","_col5"],keys:{"0":"_col0","1":"_col0"} + <-Map 17 [SIMPLE_EDGE] + SHUFFLE [RS_56] + PartitionCols:_col0 + Select Operator [SEL_40] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_115] (rows=36524 width=1119) + predicate:(d_date BETWEEN '2002-05-01' AND '2002-06-30' and d_date_sk is not null) + TableScan [TS_38] (rows=73049 width=1119) + default@date_dim,d,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_55] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_121] (rows=24200000 width=1014) + Output:["_col0","_col3","_col4","_col5"],keys:{"0":"_col2","1":"_col0"} + <-Map 16 [SIMPLE_EDGE] + SHUFFLE [RS_53] + PartitionCols:_col0 + Select Operator [SEL_37] (rows=42 width=1850) + Output:["_col0"] + Filter Operator [FIL_114] (rows=42 width=1850) + predicate:((web_company_name = 'pri') and web_site_sk is not null) + TableScan [TS_35] (rows=84 width=1850) + default@web_site,s,Tbl:COMPLETE,Col:NONE,Output:["web_site_sk","web_company_name"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_52] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_120] (rows=22000000 width=1014) + Output:["_col0","_col2","_col3","_col4","_col5"],keys:{"0":"_col1","1":"_col0"} + <-Map 15 [SIMPLE_EDGE] + SHUFFLE [RS_50] + PartitionCols:_col0 + Select Operator [SEL_34] (rows=20000000 width=1014) + Output:["_col0"] + Filter Operator [FIL_113] (rows=20000000 width=1014) + predicate:((ca_state = 'GA') and ca_address_sk is not null) + TableScan [TS_32] (rows=40000000 width=1014) + default@customer_address,ca,Tbl:COMPLETE,Col:NONE,Output:["ca_address_sk","ca_state"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_49] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_119] (rows=2 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],keys:{"0":"_col3","1":"_col0","2":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_45] + PartitionCols:_col3 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Filter Operator [FIL_107] (rows=1 width=0) + predicate:(((ws_ship_addr_sk is not null and ws_web_site_sk is not null) and ws_ship_date_sk is not null) and ws_order_number is not null) + TableScan [TS_0] (rows=1 width=0) + default@web_sales,ws1,Tbl:PARTIAL,Col:NONE,Output:["ws_ship_date_sk","ws_ship_addr_sk","ws_web_site_sk","ws_order_number","ws_ext_ship_cost","ws_net_profit"] + <-Reducer 11 [SIMPLE_EDGE] + SHUFFLE [RS_47] + PartitionCols:_col0 + Group By Operator [GBY_44] (rows=1 width=0) + Output:["_col0"],keys:_col0 + Merge Join Operator [MERGEJOIN_118] (rows=1 width=0) + Output:["_col0"],keys:{"0":"_col0","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_28] + PartitionCols:_col0 + Select Operator [SEL_16] (rows=1 width=0) + Output:["_col0"] + Filter Operator [FIL_110] (rows=1 width=0) + predicate:wr_order_number is not null + TableScan [TS_14] (rows=1 width=0) + default@web_returns,wr,Tbl:PARTIAL,Col:NONE,Output:["wr_order_number"] + <-Reducer 13 [SIMPLE_EDGE] + SHUFFLE [RS_29] + PartitionCols:_col0 + Select Operator [SEL_27] (rows=1 width=0) + Output:["_col0"] + Filter Operator [FIL_26] (rows=1 width=0) + predicate:(_col0 <> _col2) + Merge Join Operator [MERGEJOIN_117] (rows=1 width=0) + Output:["_col0","_col1","_col2"],keys:{"0":"_col1","1":"_col1"} + <-Map 12 [SIMPLE_EDGE] + SHUFFLE [RS_23] + PartitionCols:_col1 + Select Operator [SEL_19] (rows=1 width=0) + Output:["_col0","_col1"] + Filter Operator [FIL_111] (rows=1 width=0) + predicate:ws_order_number is not null + TableScan [TS_17] (rows=1 width=0) + default@web_sales,ws1,Tbl:PARTIAL,Col:NONE,Output:["ws_warehouse_sk","ws_order_number"] + <-Map 14 [SIMPLE_EDGE] + SHUFFLE [RS_24] + PartitionCols:_col1 + Select Operator [SEL_22] (rows=1 width=0) + Output:["_col0","_col1"] + Filter Operator [FIL_112] (rows=1 width=0) + predicate:ws_order_number is not null + TableScan [TS_20] (rows=1 width=0) + default@web_sales,ws1,Tbl:PARTIAL,Col:NONE,Output:["ws_warehouse_sk","ws_order_number"] + <-Reducer 8 [SIMPLE_EDGE] + SHUFFLE [RS_46] + PartitionCols:_col0 + Group By Operator [GBY_42] (rows=1 width=0) + Output:["_col0"],keys:_col0 + Select Operator [SEL_13] (rows=1 width=0) + Output:["_col0"] + Filter Operator [FIL_12] (rows=1 width=0) + predicate:(_col0 <> _col2) + Merge Join Operator [MERGEJOIN_116] (rows=1 width=0) + Output:["_col0","_col1","_col2"],keys:{"0":"_col1","1":"_col1"} + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col1 + Select Operator [SEL_5] (rows=1 width=0) + Output:["_col0","_col1"] + Filter Operator [FIL_108] (rows=1 width=0) + predicate:ws_order_number is not null + TableScan [TS_3] (rows=1 width=0) + default@web_sales,ws1,Tbl:PARTIAL,Col:NONE,Output:["ws_warehouse_sk","ws_order_number"] + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_10] + PartitionCols:_col1 + Select Operator [SEL_8] (rows=1 width=0) + Output:["_col0","_col1"] + Filter Operator [FIL_109] (rows=1 width=0) + predicate:ws_order_number is not null + TableScan [TS_6] (rows=1 width=0) + default@web_sales,ws1,Tbl:PARTIAL,Col:NONE,Output:["ws_warehouse_sk","ws_order_number"] diff --git a/ql/src/test/results/clientpositive/perf/query96.q.out b/ql/src/test/results/clientpositive/perf/query96.q.out index bba8965..7b98a64 100644 --- a/ql/src/test/results/clientpositive/perf/query96.q.out +++ b/ql/src/test/results/clientpositive/perf/query96.q.out @@ -12,124 +12,69 @@ Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Reducer 6 <- Reducer 5 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 6 - File Output Operator [FS_29] - compressed:false - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_28] - Number of rows:100 - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_27] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_26] - key expressions:_col0 (type: bigint) - sort order:+ - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_24] - | aggregations:["count(VALUE._col0)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_23] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: bigint) - Group By Operator [GBY_22] - aggregations:["count()"] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_45] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: int)","1":"_col0 (type: int)"} - | Statistics:Num rows: 17424 Data size: 8206704 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_11] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_42] - | predicate:((s_store_name = 'ese') and s_store_sk is not null) (type: boolean) - | Statistics:Num rows: 852 Data size: 1628138 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:store - | Statistics:Num rows: 1704 Data size: 3256276 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col2 (type: int) - Map-reduce partition columns:_col2 (type: int) - sort order:+ - Statistics:Num rows: 15840 Data size: 7460640 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_44] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col2"] - | Statistics:Num rows: 15840 Data size: 7460640 Basic stats: COMPLETE Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - | Reduce Output Operator [RS_16] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_8] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_41] - | predicate:(((t_minute >= 30) and (t_hour = 8)) and t_time_sk is not null) (type: boolean) - | Statistics:Num rows: 14400 Data size: 6782400 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:time_dim - | Statistics:Num rows: 86400 Data size: 40694400 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_15] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 3960 Data size: 423720 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: int) - Merge Join Operator [MERGEJOIN_43] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2"] - | Statistics:Num rows: 3960 Data size: 423720 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_12] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col2 (type: int) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_39] - | predicate:((ss_hdemo_sk is not null and ss_sold_time_sk is not null) and ss_store_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_13] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_40] - predicate:((hd_dep_count = 5) and hd_demo_sk is not null) (type: boolean) - Statistics:Num rows: 3600 Data size: 385200 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:household_demographics - Statistics:Num rows: 7200 Data size: 770400 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 6 + File Output Operator [FS_29] + Limit [LIM_28] (rows=1 width=8) + Number of rows:100 + Select Operator [SEL_27] (rows=1 width=8) + Output:["_col0"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_26] + Group By Operator [GBY_24] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_23] + Group By Operator [GBY_22] (rows=1 width=8) + Output:["_col0"],aggregations:["count()"] + Merge Join Operator [MERGEJOIN_45] (rows=17424 width=471) + keys:{"0":"_col2","1":"_col0"} + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_11] (rows=852 width=1910) + Output:["_col0"] + Filter Operator [FIL_42] (rows=852 width=1910) + predicate:((s_store_name = 'ese') and s_store_sk is not null) + TableScan [TS_9] (rows=1704 width=1910) + default@store,store,Tbl:COMPLETE,Col:NONE,Output:["s_store_sk","s_store_name"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_44] (rows=15840 width=471) + Output:["_col2"],keys:{"0":"_col0","1":"_col0"} + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=14400 width=471) + Output:["_col0"] + Filter Operator [FIL_41] (rows=14400 width=471) + predicate:(((t_minute >= 30) and (t_hour = 8)) and t_time_sk is not null) + TableScan [TS_6] (rows=86400 width=471) + default@time_dim,time_dim,Tbl:COMPLETE,Col:NONE,Output:["t_time_sk","t_hour","t_minute"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_43] (rows=3960 width=107) + Output:["_col0","_col2"],keys:{"0":"_col1","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col1 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_39] (rows=1 width=0) + predicate:((ss_hdemo_sk is not null and ss_sold_time_sk is not null) and ss_store_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_time_sk","ss_hdemo_sk","ss_store_sk"] + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=3600 width=107) + Output:["_col0"] + Filter Operator [FIL_40] (rows=3600 width=107) + predicate:((hd_dep_count = 5) and hd_demo_sk is not null) + TableScan [TS_3] (rows=7200 width=107) + default@household_demographics,household_demographics,Tbl:COMPLETE,Col:NONE,Output:["hd_demo_sk","hd_dep_count"] diff --git a/ql/src/test/results/clientpositive/perf/query97.q.out b/ql/src/test/results/clientpositive/perf/query97.q.out index c4c384d..7fa6f87 100644 --- a/ql/src/test/results/clientpositive/perf/query97.q.out +++ b/ql/src/test/results/clientpositive/perf/query97.q.out @@ -13,151 +13,83 @@ Reducer 8 <- Map 10 (SIMPLE_EDGE), Map 7 (SIMPLE_EDGE) Reducer 9 <- Reducer 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 5 - File Output Operator [FS_38] - compressed:false - Statistics:Num rows: 1 Data size: 24 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_37] - Number of rows:100 - Statistics:Num rows: 1 Data size: 24 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_35] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 24 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_34] - sort order: - Statistics:Num rows: 1 Data size: 24 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: bigint), _col1 (type: bigint), _col2 (type: bigint) - Group By Operator [GBY_33] - aggregations:["sum(_col0)","sum(_col1)","sum(_col2)"] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 24 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_31] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 22096 Data size: 24726566 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_49] - | condition map:[{"":"Outer Join 0 to 1"}] - | keys:{"0":"_col0 (type: int), _col1 (type: int)","1":"_col0 (type: int), _col1 (type: int)"} - | outputColumnNames:["_col0","_col2"] - | Statistics:Num rows: 22096 Data size: 24726566 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - | Reduce Output Operator [RS_28] - | key expressions:_col0 (type: int), _col1 (type: int) - | Map-reduce partition columns:_col0 (type: int), _col1 (type: int) - | sort order:++ - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_13] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_12] - | | keys:KEY._col0 (type: int), KEY._col1 (type: int) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 2 [SIMPLE_EDGE] - | Reduce Output Operator [RS_11] - | key expressions:_col0 (type: int), _col1 (type: int) - | Map-reduce partition columns:_col0 (type: int), _col1 (type: int) - | sort order:++ - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_10] - | keys:_col1 (type: int), _col2 (type: int) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_47] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col1","_col2"] - | | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - | |<-Map 1 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_6] - | | key expressions:_col0 (type: int) - | | Map-reduce partition columns:_col0 (type: int) - | | sort order:+ - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | value expressions:_col1 (type: int), _col2 (type: int) - | | Select Operator [SEL_2] - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | Filter Operator [FIL_43] - | | predicate:ss_sold_date_sk is not null (type: boolean) - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | | TableScan [TS_0] - | | alias:store_sales - | | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | |<-Map 6 [SIMPLE_EDGE] - | Reduce Output Operator [RS_7] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_5] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_44] - | predicate:(d_month_seq BETWEEN 1193 AND 1204 and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_3] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 9 [SIMPLE_EDGE] - Reduce Output Operator [RS_29] - key expressions:_col0 (type: int), _col1 (type: int) - Map-reduce partition columns:_col0 (type: int), _col1 (type: int) - sort order:++ - Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_26] - | keys:KEY._col0 (type: int), KEY._col1 (type: int) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 20088 Data size: 22478696 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_25] - key expressions:_col0 (type: int), _col1 (type: int) - Map-reduce partition columns:_col0 (type: int), _col1 (type: int) - sort order:++ - Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_24] - keys:_col1 (type: int), _col2 (type: int) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_48] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col1","_col2"] - | Statistics:Num rows: 40176 Data size: 44957392 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_21] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_19] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_46] - | predicate:(d_month_seq BETWEEN 1193 AND 1204 and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_17] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_20] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col1 (type: int), _col2 (type: int) - Select Operator [SEL_16] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Filter Operator [FIL_45] - predicate:cs_sold_date_sk is not null (type: boolean) - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_14] - alias:catalog_sales - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 5 + File Output Operator [FS_38] + Limit [LIM_37] (rows=1 width=24) + Number of rows:100 + Group By Operator [GBY_35] (rows=1 width=24) + Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_34] + Group By Operator [GBY_33] (rows=1 width=24) + Output:["_col0","_col1","_col2"],aggregations:["sum(_col0)","sum(_col1)","sum(_col2)"] + Select Operator [SEL_31] (rows=22096 width=1119) + Output:["_col0","_col1","_col2"] + Merge Join Operator [MERGEJOIN_49] (rows=22096 width=1119) + Output:["_col0","_col2"],keys:{"0":"_col0, _col1","1":"_col0, _col1"} + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_28] + PartitionCols:_col0, _col1 + Select Operator [SEL_13] (rows=20088 width=1119) + Output:["_col0","_col1"] + Group By Operator [GBY_12] (rows=20088 width=1119) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_11] + PartitionCols:_col0, _col1 + Group By Operator [GBY_10] (rows=40176 width=1119) + Output:["_col0","_col1"],keys:_col1, _col2 + Merge Join Operator [MERGEJOIN_47] (rows=40176 width=1119) + Output:["_col1","_col2"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_6] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_43] (rows=1 width=0) + predicate:ss_sold_date_sk is not null + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_customer_sk"] + <-Map 6 [SIMPLE_EDGE] + SHUFFLE [RS_7] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_44] (rows=36524 width=1119) + predicate:(d_month_seq BETWEEN 1193 AND 1204 and d_date_sk is not null) + TableScan [TS_3] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_month_seq"] + <-Reducer 9 [SIMPLE_EDGE] + SHUFFLE [RS_29] + PartitionCols:_col0, _col1 + Group By Operator [GBY_26] (rows=20088 width=1119) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Reducer 8 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col0, _col1 + Group By Operator [GBY_24] (rows=40176 width=1119) + Output:["_col0","_col1"],keys:_col1, _col2 + Merge Join Operator [MERGEJOIN_48] (rows=40176 width=1119) + Output:["_col1","_col2"],keys:{"0":"_col0","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_21] + PartitionCols:_col0 + Select Operator [SEL_19] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_46] (rows=36524 width=1119) + predicate:(d_month_seq BETWEEN 1193 AND 1204 and d_date_sk is not null) + TableScan [TS_17] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_month_seq"] + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_20] + PartitionCols:_col0 + Select Operator [SEL_16] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_45] (rows=1 width=0) + predicate:cs_sold_date_sk is not null + TableScan [TS_14] (rows=1 width=0) + default@catalog_sales,catalog_sales,Tbl:PARTIAL,Col:NONE,Output:["cs_sold_date_sk","cs_bill_customer_sk","cs_item_sk"] diff --git a/ql/src/test/results/clientpositive/perf/query98.q.out b/ql/src/test/results/clientpositive/perf/query98.q.out index baff7e0..438b37d 100644 --- a/ql/src/test/results/clientpositive/perf/query98.q.out +++ b/ql/src/test/results/clientpositive/perf/query98.q.out @@ -12,124 +12,67 @@ Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Reducer 6 <- Reducer 5 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 6 - File Output Operator [FS_27] - compressed:false - Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_26] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - | Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_25] - key expressions:_col1 (type: string), _col2 (type: string), _col4 (type: string), _col0 (type: string), _col6 (type: decimal(38,23)) - sort order:+++++ - Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: decimal(7,2)), _col5 (type: decimal(17,2)) - Select Operator [SEL_23] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - PTF Operator [PTF_22] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col3","partition by:":"_col3"}] - Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_21] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_20] - key expressions:_col3 (type: string) - Map-reduce partition columns:_col3 (type: string) - sort order:+ - Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col4 (type: decimal(7,2)), _col5 (type: decimal(17,2)) - Select Operator [SEL_19] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_18] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: decimal(7,2)), KEY._col3 (type: string), KEY._col4 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 139755 Data size: 200727046 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_17] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: decimal(7,2)), _col3 (type: string), _col4 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: decimal(7,2)), _col3 (type: string), _col4 (type: string) - sort order:+++++ - Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - value expressions:_col5 (type: decimal(17,2)) - Group By Operator [GBY_16] - aggregations:["sum(_col2)"] - keys:_col4 (type: string), _col5 (type: string), _col6 (type: decimal(7,2)), _col7 (type: string), _col8 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_15] - outputColumnNames:["_col4","_col5","_col6","_col7","_col8","_col2"] - Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_37] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col2","_col4","_col5","_col6","_col7","_col8"] - | Statistics:Num rows: 279510 Data size: 401454092 Basic stats: COMPLETE Column stats: NONE - |<-Map 8 [SIMPLE_EDGE] - | Reduce Output Operator [RS_13] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_8] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_35] - | predicate:(d_date BETWEEN 2001-01-12 AND 2001-02-11 and d_date_sk is not null) (type: boolean) - | Statistics:Num rows: 36524 Data size: 40870356 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:date_dim - | Statistics:Num rows: 73049 Data size: 81741831 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_12] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: decimal(7,2)), _col4 (type: string), _col5 (type: string), _col6 (type: decimal(7,2)), _col7 (type: string), _col8 (type: string) - Merge Join Operator [MERGEJOIN_36] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col2","_col4","_col5","_col6","_col7","_col8"] - | Statistics:Num rows: 254100 Data size: 364958258 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_9] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | value expressions:_col0 (type: int), _col2 (type: decimal(7,2)) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | Filter Operator [FIL_33] - | predicate:(ss_item_sk is not null and ss_sold_date_sk is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - | TableScan [TS_0] - | alias:store_sales - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string), _col2 (type: string), _col3 (type: decimal(7,2)), _col4 (type: string), _col5 (type: string) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_34] - predicate:((i_category) IN ('Jewelry', 'Sports', 'Books') and i_item_sk is not null) (type: boolean) - Statistics:Num rows: 231000 Data size: 331780228 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:item - Statistics:Num rows: 462000 Data size: 663560457 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 6 + File Output Operator [FS_27] + Select Operator [SEL_26] (rows=139755 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_25] + Select Operator [SEL_23] (rows=139755 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + PTF Operator [PTF_22] (rows=139755 width=1436) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col3","partition by:":"_col3"}] + Select Operator [SEL_21] (rows=139755 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_20] + PartitionCols:_col3 + Select Operator [SEL_19] (rows=139755 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Group By Operator [GBY_18] (rows=139755 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2, KEY._col3, KEY._col4 + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_17] + PartitionCols:_col0, _col1, _col2, _col3, _col4 + Group By Operator [GBY_16] (rows=279510 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["sum(_col2)"],keys:_col4, _col5, _col6, _col7, _col8 + Select Operator [SEL_15] (rows=279510 width=1436) + Output:["_col4","_col5","_col6","_col7","_col8","_col2"] + Merge Join Operator [MERGEJOIN_37] (rows=279510 width=1436) + Output:["_col2","_col4","_col5","_col6","_col7","_col8"],keys:{"0":"_col0","1":"_col0"} + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=36524 width=1119) + Output:["_col0"] + Filter Operator [FIL_35] (rows=36524 width=1119) + predicate:(d_date BETWEEN 2001-01-12 AND 2001-02-11 and d_date_sk is not null) + TableScan [TS_6] (rows=73049 width=1119) + default@date_dim,date_dim,Tbl:COMPLETE,Col:NONE,Output:["d_date_sk","d_date"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_36] (rows=254100 width=1436) + Output:["_col0","_col2","_col4","_col5","_col6","_col7","_col8"],keys:{"0":"_col1","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col1 + Select Operator [SEL_2] (rows=1 width=0) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_33] (rows=1 width=0) + predicate:(ss_item_sk is not null and ss_sold_date_sk is not null) + TableScan [TS_0] (rows=1 width=0) + default@store_sales,store_sales,Tbl:PARTIAL,Col:NONE,Output:["ss_sold_date_sk","ss_item_sk","ss_ext_sales_price"] + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_10] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=231000 width=1436) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Filter Operator [FIL_34] (rows=231000 width=1436) + predicate:((i_category) IN ('Jewelry', 'Sports', 'Books') and i_item_sk is not null) + TableScan [TS_3] (rows=462000 width=1436) + default@item,item,Tbl:COMPLETE,Col:NONE,Output:["i_item_sk","i_item_id","i_item_desc","i_current_price","i_class","i_category"] diff --git a/ql/src/test/results/clientpositive/tez/explainuser_1.q.out b/ql/src/test/results/clientpositive/tez/explainuser_1.q.out index 8c78fd9..53beeac 100644 --- a/ql/src/test/results/clientpositive/tez/explainuser_1.q.out +++ b/ql/src/test/results/clientpositive/tez/explainuser_1.q.out @@ -3,12 +3,8 @@ PREHOOK: type: CREATETABLE POSTHOOK: query: explain create table src_orc_merge_test_part(key int, value string) partitioned by (ds string, ts string) stored as orc POSTHOOK: type: CREATETABLE Stage-0 - Create Table Operator: - columns:["key int","value string"] - input format:org.apache.hadoop.hive.ql.io.orc.OrcInputFormat - name:default.src_orc_merge_test_part - output format:org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat - partition columns:["ds string","ts string"] + Create Table Operator: + name:default.src_orc_merge_test_part PREHOOK: query: create table src_orc_merge_test_part(key int, value string) partitioned by (ds string, ts string) stored as orc PREHOOK: type: CREATETABLE @@ -50,25 +46,20 @@ POSTHOOK: type: QUERY Plan optimized by CBO. Stage-3 - Stats-Aggr Operator - Stage-0 - Move Operator - partition:{"ds":"2012-01-03","ts":"2012-01-03+14:46:31"} - table:{"input format:":"org.apache.hadoop.hive.ql.io.orc.OrcInputFormat","output format:":"org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat","serde:":"org.apache.hadoop.hive.ql.io.orc.OrcSerde","name:":"default.src_orc_merge_test_part"} - Stage-2 - Dependency Collection{} - Stage-1 - Map 1 - File Output Operator [FS_3] - compressed:false - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.hive.ql.io.orc.OrcInputFormat","output format:":"org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat","serde:":"org.apache.hadoop.hive.ql.io.orc.OrcSerde","name:":"default.src_orc_merge_test_part"} - Select Operator [SEL_1] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_0] - alias:src - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Stats-Aggr Operator + Stage-0 + Move Operator + table:{"name:":"default.src_orc_merge_test_part"} + Stage-2 + Dependency Collection{} + Stage-1 + Map 1 + File Output Operator [FS_3] + table:{"name:":"default.src_orc_merge_test_part"} + Select Operator [SEL_1] (rows=500 width=10) + Output:["_col0","_col1"] + TableScan [TS_0] (rows=500 width=10) + default@src,src,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: insert overwrite table src_orc_merge_test_part partition(ds='2012-01-03', ts='2012-01-03+14:46:31') select * from src PREHOOK: type: QUERY @@ -90,42 +81,30 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE) Stage-3 - Stats-Aggr Operator - Stage-0 - Move Operator - partition:{"ds":"2012-01-03","ts":"2012-01-03+14:46:31"} - table:{"input format:":"org.apache.hadoop.hive.ql.io.orc.OrcInputFormat","output format:":"org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat","serde:":"org.apache.hadoop.hive.ql.io.orc.OrcSerde","name:":"default.src_orc_merge_test_part"} - Stage-2 - Dependency Collection{} - Stage-1 - Reducer 2 - File Output Operator [FS_7] - compressed:false - Statistics:Num rows: 100 Data size: 1000 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.hive.ql.io.orc.OrcInputFormat","output format:":"org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat","serde:":"org.apache.hadoop.hive.ql.io.orc.OrcSerde","name:":"default.src_orc_merge_test_part"} - Select Operator [SEL_6] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 100 Data size: 1000 Basic stats: COMPLETE Column stats: NONE - Limit [LIM_5] - Number of rows:100 - Statistics:Num rows: 100 Data size: 1000 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_4] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 100 Data size: 1000 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - sort order: - Statistics:Num rows: 100 Data size: 1000 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: string), _col1 (type: string) - Limit [LIM_2] - Number of rows:100 - Statistics:Num rows: 100 Data size: 1000 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_1] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_0] - alias:src - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Stats-Aggr Operator + Stage-0 + Move Operator + table:{"name:":"default.src_orc_merge_test_part"} + Stage-2 + Dependency Collection{} + Stage-1 + Reducer 2 + File Output Operator [FS_7] + table:{"name:":"default.src_orc_merge_test_part"} + Select Operator [SEL_6] (rows=100 width=10) + Output:["_col0","_col1"] + Limit [LIM_5] (rows=100 width=10) + Number of rows:100 + Select Operator [SEL_4] (rows=100 width=10) + Output:["_col0","_col1"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_3] + Limit [LIM_2] (rows=100 width=10) + Number of rows:100 + Select Operator [SEL_1] (rows=500 width=10) + Output:["_col0","_col1"] + TableScan [TS_0] (rows=500 width=10) + default@src,src,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: explain select count(1) from src_orc_merge_test_part where ds='2012-01-03' and ts='2012-01-03+14:46:31' PREHOOK: type: QUERY @@ -137,32 +116,20 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_8] - compressed:false - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_6] - | aggregations:["count(VALUE._col0)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_5] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: bigint) - Group By Operator [GBY_4] - aggregations:["count(1)"] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_2] - Statistics:Num rows: 500 Data size: 47000 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_0] - alias:src_orc_merge_test_part - Statistics:Num rows: 500 Data size: 47000 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_8] + Group By Operator [GBY_6] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_5] + Group By Operator [GBY_4] (rows=1 width=8) + Output:["_col0"],aggregations:["count(1)"] + Select Operator [SEL_2] (rows=500 width=94) + TableScan [TS_0] (rows=500 width=94) + default@src_orc_merge_test_part,src_orc_merge_test_part,Tbl:COMPLETE,Col:NONE PREHOOK: query: explain select sum(hash(key)), sum(hash(value)) from src_orc_merge_test_part where ds='2012-01-03' and ts='2012-01-03+14:46:31' PREHOOK: type: QUERY @@ -174,33 +141,21 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_8] - compressed:false - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_6] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_5] - sort order: - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: bigint), _col1 (type: bigint) - Group By Operator [GBY_4] - aggregations:["sum(_col0)","sum(_col1)"] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_2] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 500 Data size: 47000 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_0] - alias:src_orc_merge_test_part - Statistics:Num rows: 500 Data size: 47000 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_8] + Group By Operator [GBY_6] (rows=1 width=16) + Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_5] + Group By Operator [GBY_4] (rows=1 width=16) + Output:["_col0","_col1"],aggregations:["sum(_col0)","sum(_col1)"] + Select Operator [SEL_2] (rows=500 width=94) + Output:["_col0","_col1"] + TableScan [TS_0] (rows=500 width=94) + default@src_orc_merge_test_part,src_orc_merge_test_part,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: alter table src_orc_merge_test_part partition (ds='2012-01-03', ts='2012-01-03+14:46:31') concatenate PREHOOK: type: ALTER_PARTITION_MERGE @@ -220,32 +175,20 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_8] - compressed:false - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_6] - | aggregations:["count(VALUE._col0)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_5] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: bigint) - Group By Operator [GBY_4] - aggregations:["count(1)"] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_2] - Statistics:Num rows: 1 Data size: 2515 Basic stats: PARTIAL Column stats: NONE - TableScan [TS_0] - alias:src_orc_merge_test_part - Statistics:Num rows: 1 Data size: 2515 Basic stats: PARTIAL Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_8] + Group By Operator [GBY_6] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_5] + Group By Operator [GBY_4] (rows=1 width=8) + Output:["_col0"],aggregations:["count(1)"] + Select Operator [SEL_2] (rows=1 width=2515) + TableScan [TS_0] (rows=1 width=2515) + default@src_orc_merge_test_part,src_orc_merge_test_part,Tbl:PARTIAL,Col:NONE PREHOOK: query: explain select sum(hash(key)), sum(hash(value)) from src_orc_merge_test_part where ds='2012-01-03' and ts='2012-01-03+14:46:31' PREHOOK: type: QUERY @@ -257,33 +200,21 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_8] - compressed:false - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_6] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_5] - sort order: - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: bigint), _col1 (type: bigint) - Group By Operator [GBY_4] - aggregations:["sum(_col0)","sum(_col1)"] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_2] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 24 Data size: 2515 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_0] - alias:src_orc_merge_test_part - Statistics:Num rows: 24 Data size: 2515 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_8] + Group By Operator [GBY_6] (rows=1 width=16) + Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_5] + Group By Operator [GBY_4] (rows=1 width=16) + Output:["_col0","_col1"],aggregations:["sum(_col0)","sum(_col1)"] + Select Operator [SEL_2] (rows=24 width=104) + Output:["_col0","_col1"] + TableScan [TS_0] (rows=24 width=104) + default@src_orc_merge_test_part,src_orc_merge_test_part,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: drop table src_orc_merge_test_part PREHOOK: type: DROPTABLE @@ -322,63 +253,37 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 3 - File Output Operator [FS_17] - compressed:false - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_15] - | aggregations:["sum(VALUE._col0)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_14] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: bigint) - Group By Operator [GBY_13] - aggregations:["sum(hash(_col0,_col1,_col2,_col3))"] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_11] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 182 Data size: 1939 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string) - sort order:++++ - Statistics:Num rows: 182 Data size: 1939 Basic stats: COMPLETE Column stats: NONE - Map Join Operator [MAPJOIN_20] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{} - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 182 Data size: 1939 Basic stats: COMPLETE Column stats: NONE - |<-Map 4 [BROADCAST_EDGE] - | Reduce Output Operator [RS_7] - | sort order: - | Statistics:Num rows: 166 Data size: 1763 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: string), _col1 (type: string) - | Select Operator [SEL_5] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 166 Data size: 1763 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_19] - | predicate:(key < 10) (type: boolean) - | Statistics:Num rows: 166 Data size: 1763 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_3] - | alias:src - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Select Operator [SEL_2] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 166 Data size: 1763 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_18] - predicate:(key < 10) (type: boolean) - Statistics:Num rows: 166 Data size: 1763 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_0] - alias:src - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 3 + File Output Operator [FS_17] + Group By Operator [GBY_15] (rows=1 width=8) + Output:["_col0"],aggregations:["sum(VALUE._col0)"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_14] + Group By Operator [GBY_13] (rows=1 width=8) + Output:["_col0"],aggregations:["sum(hash(_col0,_col1,_col2,_col3))"] + Select Operator [SEL_11] (rows=182 width=10) + Output:["_col0","_col1","_col2","_col3"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_10] + Map Join Operator [MAPJOIN_20] (rows=182 width=10) + Output:["_col0","_col1","_col2","_col3"],keys:{} + <-Map 4 [BROADCAST_EDGE] + BROADCAST [RS_7] + Select Operator [SEL_5] (rows=166 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_19] (rows=166 width=10) + predicate:(key < 10) + TableScan [TS_3] (rows=500 width=10) + default@src,src,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Select Operator [SEL_2] (rows=166 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_18] (rows=166 width=10) + predicate:(key < 10) + TableScan [TS_0] (rows=500 width=10) + default@src,src,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: explain select key, (c_int+1)+2 as x, sum(c_int) from cbo_t1 group by c_float, cbo_t1.c_int, key PREHOOK: type: QUERY @@ -390,40 +295,24 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_7] - compressed:false - Statistics:Num rows: 10 Data size: 885 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 10 Data size: 885 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_4] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: float) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 10 Data size: 917 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: float) - Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: float) - sort order:+++ - Statistics:Num rows: 10 Data size: 917 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col3 (type: bigint) - Group By Operator [GBY_2] - aggregations:["sum(c_int)"] - keys:key (type: string), c_int (type: int), c_float (type: float) - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 10 Data size: 917 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_1] - outputColumnNames:["key","c_int","c_float"] - Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_0] - alias:cbo_t1 - Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_7] + Select Operator [SEL_5] (rows=10 width=88) + Output:["_col0","_col1","_col2"] + Group By Operator [GBY_4] (rows=10 width=91) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_3] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_2] (rows=10 width=91) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(c_int)"],keys:key, c_int, c_float + Select Operator [SEL_1] (rows=20 width=83) + Output:["key","c_int","c_float"] + TableScan [TS_0] (rows=20 width=83) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] PREHOOK: query: explain select x, y, count(*) from (select key, (c_int+c_float+1+2) as x, sum(c_int) as y from cbo_t1 group by c_float, cbo_t1.c_int, key) R group by y, x PREHOOK: type: QUERY @@ -436,60 +325,33 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 3 - File Output Operator [FS_12] - compressed:false - Statistics:Num rows: 5 Data size: 100 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_11] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 5 Data size: 100 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_10] - | aggregations:["count(VALUE._col0)"] - | keys:KEY._col0 (type: bigint), KEY._col1 (type: float) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 5 Data size: 100 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_9] - key expressions:_col0 (type: bigint), _col1 (type: float) - Map-reduce partition columns:_col0 (type: bigint), _col1 (type: float) - sort order:++ - Statistics:Num rows: 5 Data size: 100 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col2 (type: bigint) - Group By Operator [GBY_8] - aggregations:["count()"] - keys:_col0 (type: bigint), _col1 (type: float) - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 5 Data size: 100 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 10 Data size: 917 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_4] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: float) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 10 Data size: 917 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: float) - Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: float) - sort order:+++ - Statistics:Num rows: 10 Data size: 917 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col3 (type: bigint) - Group By Operator [GBY_2] - aggregations:["sum(c_int)"] - keys:key (type: string), c_int (type: int), c_float (type: float) - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 10 Data size: 917 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_1] - outputColumnNames:["key","c_int","c_float"] - Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_0] - alias:cbo_t1 - Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 3 + File Output Operator [FS_12] + Select Operator [SEL_11] (rows=5 width=20) + Output:["_col0","_col1","_col2"] + Group By Operator [GBY_10] (rows=5 width=20) + Output:["_col0","_col1","_col2"],aggregations:["count(VALUE._col0)"],keys:KEY._col0, KEY._col1 + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col0, _col1 + Group By Operator [GBY_8] (rows=5 width=20) + Output:["_col0","_col1","_col2"],aggregations:["count()"],keys:_col0, _col1 + Select Operator [SEL_5] (rows=10 width=91) + Output:["_col0","_col1"] + Group By Operator [GBY_4] (rows=10 width=91) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_3] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_2] (rows=10 width=91) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(c_int)"],keys:key, c_int, c_float + Select Operator [SEL_1] (rows=20 width=83) + Output:["key","c_int","c_float"] + TableScan [TS_0] (rows=20 width=83) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] PREHOOK: query: explain select cbo_t3.c_int, c, count(*) from (select key as a, c_int+1 as b, sum(c_int) as c from cbo_t1 where (cbo_t1.c_int + 1 >= 0) and (cbo_t1.c_int > 0 or cbo_t1.c_float >= 0) group by c_float, cbo_t1.c_int, key order by a) cbo_t1 join (select key as p, c_int+1 as q, sum(c_int) as r from cbo_t2 where (cbo_t2.c_int + 1 >= 0) and (cbo_t2.c_int > 0 or cbo_t2.c_float >= 0) group by c_float, cbo_t2.c_int, key order by q/10 desc, r asc) cbo_t2 on cbo_t1.a=p join cbo_t3 on cbo_t1.a=key where (b + cbo_t2.q >= 0) and (b > 0 or c_int >= 0) group by cbo_t3.c_int, c order by cbo_t3.c_int+c desc, c PREHOOK: type: QUERY @@ -508,172 +370,88 @@ Reducer 7 <- Reducer 6 (SIMPLE_EDGE) Reducer 9 <- Map 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 7 - File Output Operator [FS_42] - compressed:false - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_41] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_40] - key expressions:(UDFToLong(_col0) + _col1) (type: bigint), _col1 (type: bigint) - sort order:-+ - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: int), _col2 (type: bigint) - Select Operator [SEL_38] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_37] - | aggregations:["count(VALUE._col0)"] - | keys:KEY._col0 (type: bigint), KEY._col1 (type: int) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_36] - key expressions:_col0 (type: bigint), _col1 (type: int) - Map-reduce partition columns:_col0 (type: bigint), _col1 (type: int) - sort order:++ - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col2 (type: bigint) - Group By Operator [GBY_35] - aggregations:["count()"] - keys:_col2 (type: bigint), _col6 (type: int) - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_34] - outputColumnNames:["_col2","_col6"] - Statistics:Num rows: 2 Data size: 32 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_33] - predicate:((_col1 > 0) or (_col6 >= 0)) (type: boolean) - Statistics:Num rows: 2 Data size: 32 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_52] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col1","_col2","_col6"] - | Statistics:Num rows: 3 Data size: 48 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_31] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 18 Data size: 1424 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: int) - | Select Operator [SEL_29] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 18 Data size: 1424 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_50] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 18 Data size: 1424 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_27] - | alias:cbo_t3 - | Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_30] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: int), _col2 (type: bigint) - Select Operator [SEL_26] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_25] - predicate:((_col1 + _col4) >= 0) (type: boolean) - Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_51] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col0","_col1","_col2","_col4"] - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_23] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 1 Data size: 89 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: int) - | Select Operator [SEL_20] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 1 Data size: 89 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Reducer 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col3 (type: double), _col2 (type: bigint) - | sort order:-+ - | Statistics:Num rows: 1 Data size: 105 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col0 (type: string), _col1 (type: int) - | Select Operator [SEL_17] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 105 Basic stats: COMPLETE Column stats: COMPLETE - | Group By Operator [GBY_16] - | | aggregations:["sum(VALUE._col0)"] - | | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: float) - | | outputColumnNames:["_col0","_col1","_col2","_col3"] - | | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Map 8 [SIMPLE_EDGE] - | Reduce Output Operator [RS_15] - | key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: float) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: float) - | sort order:+++ - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col3 (type: bigint) - | Group By Operator [GBY_14] - | aggregations:["sum(c_int)"] - | keys:key (type: string), c_int (type: int), c_float (type: float) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_49] - | predicate:((((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) and key is not null) (type: boolean) - | Statistics:Num rows: 3 Data size: 279 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_11] - | alias:cbo_t2 - | Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_22] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 1 Data size: 97 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: int), _col2 (type: bigint) - Select Operator [SEL_9] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 97 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_8] - key expressions:_col0 (type: string) - sort order:+ - Statistics:Num rows: 1 Data size: 97 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: int), _col2 (type: bigint) - Select Operator [SEL_6] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 97 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_5] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: float) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_4] - key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: float) - Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: float) - sort order:+++ - Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col3 (type: bigint) - Group By Operator [GBY_3] - aggregations:["sum(c_int)"] - keys:key (type: string), c_int (type: int), c_float (type: float) - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_48] - predicate:((((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) and key is not null) (type: boolean) - Statistics:Num rows: 3 Data size: 279 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_0] - alias:cbo_t1 - Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 7 + File Output Operator [FS_42] + Select Operator [SEL_41] (rows=1 width=20) + Output:["_col0","_col1","_col2"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_40] + Select Operator [SEL_38] (rows=1 width=20) + Output:["_col0","_col1","_col2"] + Group By Operator [GBY_37] (rows=1 width=20) + Output:["_col0","_col1","_col2"],aggregations:["count(VALUE._col0)"],keys:KEY._col0, KEY._col1 + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_36] + PartitionCols:_col0, _col1 + Group By Operator [GBY_35] (rows=1 width=20) + Output:["_col0","_col1","_col2"],aggregations:["count()"],keys:_col2, _col6 + Select Operator [SEL_34] (rows=2 width=16) + Output:["_col2","_col6"] + Filter Operator [FIL_33] (rows=2 width=16) + predicate:((_col1 > 0) or (_col6 >= 0)) + Merge Join Operator [MERGEJOIN_52] (rows=3 width=16) + Output:["_col1","_col2","_col6"],keys:{"0":"_col0","1":"_col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_31] + PartitionCols:_col0 + Select Operator [SEL_29] (rows=18 width=79) + Output:["_col0","_col1"] + Filter Operator [FIL_50] (rows=18 width=79) + predicate:key is not null + TableScan [TS_27] (rows=20 width=80) + default@cbo_t3,cbo_t3,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_30] + PartitionCols:_col0 + Select Operator [SEL_26] (rows=1 width=101) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_25] (rows=1 width=101) + predicate:((_col1 + _col4) >= 0) + Merge Join Operator [MERGEJOIN_51] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col4"],keys:{"0":"_col0","1":"_col0"} + <-Reducer 10 [SIMPLE_EDGE] + SHUFFLE [RS_23] + PartitionCols:_col0 + Select Operator [SEL_20] (rows=1 width=89) + Output:["_col0","_col1"] + <-Reducer 9 [SIMPLE_EDGE] + SHUFFLE [RS_19] + Select Operator [SEL_17] (rows=1 width=105) + Output:["_col0","_col1","_col2","_col3"] + Group By Operator [GBY_16] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_14] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(c_int)"],keys:key, c_int, c_float + Filter Operator [FIL_49] (rows=3 width=93) + predicate:((((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) and key is not null) + TableScan [TS_11] (rows=20 width=83) + default@cbo_t2,cbo_t2,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_22] + PartitionCols:_col0 + Select Operator [SEL_9] (rows=1 width=97) + Output:["_col0","_col1","_col2"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_8] + Select Operator [SEL_6] (rows=1 width=97) + Output:["_col0","_col1","_col2"] + Group By Operator [GBY_5] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_3] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(c_int)"],keys:key, c_int, c_float + Filter Operator [FIL_48] (rows=3 width=93) + predicate:((((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) and key is not null) + TableScan [TS_0] (rows=20 width=83) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] PREHOOK: query: explain select cbo_t3.c_int, c, count(*) from (select key as a, c_int+1 as b, sum(c_int) as c from cbo_t1 where (cbo_t1.c_int + 1 >= 0) and (cbo_t1.c_int > 0 or cbo_t1.c_float >= 0) group by c_float, cbo_t1.c_int, key having cbo_t1.c_float > 0 and (c_int >=1 or c_float >= 1) and (c_int + c_float) >= 0 order by b % c asc, b desc) cbo_t1 left outer join (select key as p, c_int+1 as q, sum(c_int) as r from cbo_t2 where (cbo_t2.c_int + 1 >= 0) and (cbo_t2.c_int > 0 or cbo_t2.c_float >= 0) group by c_float, cbo_t2.c_int, key having cbo_t2.c_float > 0 and (c_int >=1 or c_float >= 1) and (c_int + c_float) >= 0) cbo_t2 on cbo_t1.a=p left outer join cbo_t3 on cbo_t1.a=key where (b + cbo_t2.q >= 0) and (b > 0 or c_int >= 0) group by cbo_t3.c_int, c having cbo_t3.c_int > 0 and (c_int >=1 or c >= 1) and (c_int + c) >= 0 order by cbo_t3.c_int % c asc, cbo_t3.c_int desc PREHOOK: type: QUERY @@ -691,160 +469,84 @@ Reducer 7 <- Reducer 6 (SIMPLE_EDGE) Reducer 9 <- Map 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 7 - File Output Operator [FS_39] - compressed:false - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_38] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_37] - key expressions:(UDFToLong(_col0) % _col1) (type: bigint), _col0 (type: int) - sort order:+- - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: bigint), _col2 (type: bigint) - Select Operator [SEL_35] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_34] - | aggregations:["count(VALUE._col0)"] - | keys:KEY._col0 (type: bigint), KEY._col1 (type: int) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_33] - key expressions:_col0 (type: bigint), _col1 (type: int) - Map-reduce partition columns:_col0 (type: bigint), _col1 (type: int) - sort order:++ - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col2 (type: bigint) - Group By Operator [GBY_32] - aggregations:["count()"] - keys:_col2 (type: bigint), _col6 (type: int) - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_31] - outputColumnNames:["_col2","_col6"] - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_30] - predicate:(((_col1 > 0) or (_col6 >= 0)) and ((_col6 >= 1) or (_col2 >= 1)) and ((UDFToLong(_col6) + _col2) >= 0)) (type: boolean) - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_48] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col1","_col2","_col6"] - | Statistics:Num rows: 2 Data size: 32 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_28] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 5 Data size: 356 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: int) - | Select Operator [SEL_26] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 5 Data size: 356 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_46] - | predicate:((c_int > 0) and key is not null) (type: boolean) - | Statistics:Num rows: 5 Data size: 356 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_24] - | alias:cbo_t3 - | Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_27] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: int), _col2 (type: bigint) - Select Operator [SEL_23] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_22] - predicate:((_col1 + _col4) >= 0) (type: boolean) - Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_47] - | condition map:[{"":"Left Outer Join0 to 1"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col0","_col1","_col2","_col4"] - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 3 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 1 Data size: 97 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: int), _col2 (type: bigint) - | Select Operator [SEL_9] - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 1 Data size: 97 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Reducer 2 [SIMPLE_EDGE] - | Reduce Output Operator [RS_8] - | key expressions:_col3 (type: bigint), _col1 (type: int) - | sort order:+- - | Statistics:Num rows: 1 Data size: 105 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col0 (type: string), _col2 (type: bigint) - | Select Operator [SEL_6] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 105 Basic stats: COMPLETE Column stats: COMPLETE - | Group By Operator [GBY_5] - | | aggregations:["sum(VALUE._col0)"] - | | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: float) - | | outputColumnNames:["_col0","_col1","_col2","_col3"] - | | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_4] - | key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: float) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: float) - | sort order:+++ - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col3 (type: bigint) - | Group By Operator [GBY_3] - | aggregations:["sum(c_int)"] - | keys:key (type: string), c_int (type: int), c_float (type: float) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_44] - | predicate:(((((((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) and (c_float > 0.0)) and ((c_int >= 1) or (c_float >= 1.0))) and ((UDFToFloat(c_int) + c_float) >= 0.0)) and key is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 93 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:cbo_t1 - | Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 9 [SIMPLE_EDGE] - Reduce Output Operator [RS_20] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 1 Data size: 89 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: int) - Select Operator [SEL_17] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 89 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_16] - | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: float) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 93 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_15] - key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: float) - Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: float) - sort order:+++ - Statistics:Num rows: 1 Data size: 93 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_14] - keys:key (type: string), c_int (type: int), c_float (type: float) - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 93 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_45] - predicate:((((((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) and (c_float > 0.0)) and ((c_int >= 1) or (c_float >= 1.0))) and ((UDFToFloat(c_int) + c_float) >= 0.0)) (type: boolean) - Statistics:Num rows: 1 Data size: 93 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_11] - alias:cbo_t2 - Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 7 + File Output Operator [FS_39] + Select Operator [SEL_38] (rows=1 width=20) + Output:["_col0","_col1","_col2"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_37] + Select Operator [SEL_35] (rows=1 width=20) + Output:["_col0","_col1","_col2"] + Group By Operator [GBY_34] (rows=1 width=20) + Output:["_col0","_col1","_col2"],aggregations:["count(VALUE._col0)"],keys:KEY._col0, KEY._col1 + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_33] + PartitionCols:_col0, _col1 + Group By Operator [GBY_32] (rows=1 width=20) + Output:["_col0","_col1","_col2"],aggregations:["count()"],keys:_col2, _col6 + Select Operator [SEL_31] (rows=1 width=16) + Output:["_col2","_col6"] + Filter Operator [FIL_30] (rows=1 width=16) + predicate:(((_col1 > 0) or (_col6 >= 0)) and ((_col6 >= 1) or (_col2 >= 1)) and ((UDFToLong(_col6) + _col2) >= 0)) + Merge Join Operator [MERGEJOIN_48] (rows=2 width=16) + Output:["_col1","_col2","_col6"],keys:{"0":"_col0","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_28] + PartitionCols:_col0 + Select Operator [SEL_26] (rows=5 width=71) + Output:["_col0","_col1"] + Filter Operator [FIL_46] (rows=5 width=71) + predicate:((c_int > 0) and key is not null) + TableScan [TS_24] (rows=20 width=80) + default@cbo_t3,cbo_t3,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_27] + PartitionCols:_col0 + Select Operator [SEL_23] (rows=1 width=101) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_22] (rows=1 width=101) + predicate:((_col1 + _col4) >= 0) + Merge Join Operator [MERGEJOIN_47] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col4"],keys:{"0":"_col0","1":"_col0"} + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_9] (rows=1 width=97) + Output:["_col0","_col1","_col2"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_8] + Select Operator [SEL_6] (rows=1 width=105) + Output:["_col0","_col1","_col2","_col3"] + Group By Operator [GBY_5] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_3] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(c_int)"],keys:key, c_int, c_float + Filter Operator [FIL_44] (rows=1 width=93) + predicate:(((((((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) and (c_float > 0.0)) and ((c_int >= 1) or (c_float >= 1.0))) and ((UDFToFloat(c_int) + c_float) >= 0.0)) and key is not null) + TableScan [TS_0] (rows=20 width=83) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] + <-Reducer 9 [SIMPLE_EDGE] + SHUFFLE [RS_20] + PartitionCols:_col0 + Select Operator [SEL_17] (rows=1 width=89) + Output:["_col0","_col1"] + Group By Operator [GBY_16] (rows=1 width=93) + Output:["_col0","_col1","_col2"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_14] (rows=1 width=93) + Output:["_col0","_col1","_col2"],keys:key, c_int, c_float + Filter Operator [FIL_45] (rows=1 width=93) + predicate:((((((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) and (c_float > 0.0)) and ((c_int >= 1) or (c_float >= 1.0))) and ((UDFToFloat(c_int) + c_float) >= 0.0)) + TableScan [TS_11] (rows=20 width=83) + default@cbo_t2,cbo_t2,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] PREHOOK: query: explain select cbo_t3.c_int, c, count(*) from (select key as a, c_int+1 as b, sum(c_int) as c from cbo_t1 where (cbo_t1.c_int + 1 >= 0) and (cbo_t1.c_int > 0 or cbo_t1.c_float >= 0) group by c_float, cbo_t1.c_int, key having cbo_t1.c_float > 0 and (c_int >=1 or c_float >= 1) and (c_int + c_float) >= 0 order by b+c, a desc) cbo_t1 right outer join (select key as p, c_int+1 as q, sum(c_int) as r from cbo_t2 where (cbo_t2.c_int + 1 >= 0) and (cbo_t2.c_int > 0 or cbo_t2.c_float >= 0) group by c_float, cbo_t2.c_int, key having cbo_t2.c_float > 0 and (c_int >=1 or c_float >= 1) and (c_int + c_float) >= 0) cbo_t2 on cbo_t1.a=p right outer join cbo_t3 on cbo_t1.a=key where (b + cbo_t2.q >= 2) and (b > 0 or c_int >= 0) group by cbo_t3.c_int, c PREHOOK: type: QUERY @@ -860,130 +562,69 @@ Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Reducer 7 <- Map 6 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 5 - File Output Operator [FS_31] - compressed:false - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_30] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_29] - | aggregations:["count(VALUE._col0)"] - | keys:KEY._col0 (type: bigint), KEY._col1 (type: int) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_28] - key expressions:_col0 (type: bigint), _col1 (type: int) - Map-reduce partition columns:_col0 (type: bigint), _col1 (type: int) - sort order:++ - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col2 (type: bigint) - Group By Operator [GBY_27] - aggregations:["count()"] - keys:_col2 (type: bigint), _col6 (type: int) - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_26] - outputColumnNames:["_col2","_col6"] - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_25] - predicate:(((_col1 + _col4) >= 2) and ((_col1 > 0) or (_col6 >= 0))) (type: boolean) - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_36] - | condition map:[{"":"Right Outer Join0 to 1"},{"":"Right Outer Join0 to 2"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)","2":"_col0 (type: string)"} - | outputColumnNames:["_col1","_col2","_col4","_col6"] - | Statistics:Num rows: 4 Data size: 80 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 8 [SIMPLE_EDGE] - | Reduce Output Operator [RS_23] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: int) - | Select Operator [SEL_20] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_19] - | alias:cbo_t3 - | Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 3 [SIMPLE_EDGE] - | Reduce Output Operator [RS_21] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 1 Data size: 97 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: int), _col2 (type: bigint) - | Select Operator [SEL_9] - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 1 Data size: 97 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Reducer 2 [SIMPLE_EDGE] - | Reduce Output Operator [RS_8] - | key expressions:_col3 (type: bigint), _col0 (type: string) - | sort order:+- - | Statistics:Num rows: 1 Data size: 105 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: int), _col2 (type: bigint) - | Select Operator [SEL_6] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 105 Basic stats: COMPLETE Column stats: COMPLETE - | Group By Operator [GBY_5] - | | aggregations:["sum(VALUE._col0)"] - | | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: float) - | | outputColumnNames:["_col0","_col1","_col2","_col3"] - | | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_4] - | key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: float) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: float) - | sort order:+++ - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col3 (type: bigint) - | Group By Operator [GBY_3] - | aggregations:["sum(c_int)"] - | keys:key (type: string), c_int (type: int), c_float (type: float) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_34] - | predicate:((((((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) and (c_float > 0.0)) and ((c_int >= 1) or (c_float >= 1.0))) and ((UDFToFloat(c_int) + c_float) >= 0.0)) (type: boolean) - | Statistics:Num rows: 1 Data size: 93 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:cbo_t1 - | Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_22] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 1 Data size: 89 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: int) - Select Operator [SEL_17] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 89 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_16] - | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: float) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 93 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_15] - key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: float) - Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: float) - sort order:+++ - Statistics:Num rows: 1 Data size: 93 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_14] - keys:key (type: string), c_int (type: int), c_float (type: float) - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 93 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_35] - predicate:((((((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) and (c_float > 0.0)) and ((c_int >= 1) or (c_float >= 1.0))) and ((UDFToFloat(c_int) + c_float) >= 0.0)) (type: boolean) - Statistics:Num rows: 1 Data size: 93 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_11] - alias:cbo_t2 - Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 5 + File Output Operator [FS_31] + Select Operator [SEL_30] (rows=1 width=20) + Output:["_col0","_col1","_col2"] + Group By Operator [GBY_29] (rows=1 width=20) + Output:["_col0","_col1","_col2"],aggregations:["count(VALUE._col0)"],keys:KEY._col0, KEY._col1 + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_28] + PartitionCols:_col0, _col1 + Group By Operator [GBY_27] (rows=1 width=20) + Output:["_col0","_col1","_col2"],aggregations:["count()"],keys:_col2, _col6 + Select Operator [SEL_26] (rows=1 width=20) + Output:["_col2","_col6"] + Filter Operator [FIL_25] (rows=1 width=20) + predicate:(((_col1 + _col4) >= 2) and ((_col1 > 0) or (_col6 >= 0))) + Merge Join Operator [MERGEJOIN_36] (rows=4 width=20) + Output:["_col1","_col2","_col4","_col6"],keys:{"0":"_col0","1":"_col0","2":"_col0"} + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_23] + PartitionCols:_col0 + Select Operator [SEL_20] (rows=20 width=80) + Output:["_col0","_col1"] + TableScan [TS_19] (rows=20 width=80) + default@cbo_t3,cbo_t3,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_21] + PartitionCols:_col0 + Select Operator [SEL_9] (rows=1 width=97) + Output:["_col0","_col1","_col2"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_8] + Select Operator [SEL_6] (rows=1 width=105) + Output:["_col0","_col1","_col2","_col3"] + Group By Operator [GBY_5] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_3] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(c_int)"],keys:key, c_int, c_float + Filter Operator [FIL_34] (rows=1 width=93) + predicate:((((((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) and (c_float > 0.0)) and ((c_int >= 1) or (c_float >= 1.0))) and ((UDFToFloat(c_int) + c_float) >= 0.0)) + TableScan [TS_0] (rows=20 width=83) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] + <-Reducer 7 [SIMPLE_EDGE] + SHUFFLE [RS_22] + PartitionCols:_col0 + Select Operator [SEL_17] (rows=1 width=89) + Output:["_col0","_col1"] + Group By Operator [GBY_16] (rows=1 width=93) + Output:["_col0","_col1","_col2"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Map 6 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_14] (rows=1 width=93) + Output:["_col0","_col1","_col2"],keys:key, c_int, c_float + Filter Operator [FIL_35] (rows=1 width=93) + predicate:((((((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) and (c_float > 0.0)) and ((c_int >= 1) or (c_float >= 1.0))) and ((UDFToFloat(c_int) + c_float) >= 0.0)) + TableScan [TS_11] (rows=20 width=83) + default@cbo_t2,cbo_t2,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] PREHOOK: query: explain select cbo_t3.c_int, c, count(*) from (select key as a, c_int+1 as b, sum(c_int) as c from cbo_t1 where (cbo_t1.c_int + 1 >= 0) and (cbo_t1.c_int > 0 or cbo_t1.c_float >= 0) group by c_float, cbo_t1.c_int, key having cbo_t1.c_float > 0 and (c_int >=1 or c_float >= 1) and (c_int + c_float) >= 0 order by c+a desc) cbo_t1 full outer join (select key as p, c_int+1 as q, sum(c_int) as r from cbo_t2 where (cbo_t2.c_int + 1 >= 0) and (cbo_t2.c_int > 0 or cbo_t2.c_float >= 0) group by c_float, cbo_t2.c_int, key having cbo_t2.c_float > 0 and (c_int >=1 or c_float >= 1) and (c_int + c_float) >= 0 order by p+q desc, r asc) cbo_t2 on cbo_t1.a=p full outer join cbo_t3 on cbo_t1.a=key where (b + cbo_t2.q >= 0) and (b > 0 or c_int >= 0) group by cbo_t3.c_int, c having cbo_t3.c_int > 0 and (c_int >=1 or c >= 1) and (c_int + c) >= 0 order by cbo_t3.c_int PREHOOK: type: QUERY @@ -1001,154 +642,79 @@ Reducer 8 <- Map 7 (SIMPLE_EDGE) Reducer 9 <- Reducer 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 6 - File Output Operator [FS_37] - compressed:false - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_36] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_35] - key expressions:_col0 (type: int) - sort order:+ - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: bigint), _col2 (type: bigint) - Select Operator [SEL_34] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_33] - | aggregations:["count(VALUE._col0)"] - | keys:KEY._col0 (type: bigint), KEY._col1 (type: int) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_32] - key expressions:_col0 (type: bigint), _col1 (type: int) - Map-reduce partition columns:_col0 (type: bigint), _col1 (type: int) - sort order:++ - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col2 (type: bigint) - Group By Operator [GBY_31] - aggregations:["count()"] - keys:_col2 (type: bigint), _col6 (type: int) - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_30] - outputColumnNames:["_col2","_col6"] - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_29] - predicate:(((_col1 + _col4) >= 0) and ((_col1 > 0) or (_col6 >= 0)) and ((_col6 >= 1) or (_col2 >= 1)) and ((UDFToLong(_col6) + _col2) >= 0)) (type: boolean) - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_42] - | condition map:[{"":"Outer Join 0 to 1"},{"":"Right Outer Join0 to 2"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)","2":"_col0 (type: string)"} - | outputColumnNames:["_col1","_col2","_col4","_col6"] - | Statistics:Num rows: 3 Data size: 60 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_27] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 6 Data size: 445 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: int) - | Select Operator [SEL_24] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 6 Data size: 445 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_41] - | predicate:(c_int > 0) (type: boolean) - | Statistics:Num rows: 6 Data size: 445 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_22] - | alias:cbo_t3 - | Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 3 [SIMPLE_EDGE] - | Reduce Output Operator [RS_25] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 1 Data size: 97 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: int), _col2 (type: bigint) - | Select Operator [SEL_9] - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 1 Data size: 97 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Reducer 2 [SIMPLE_EDGE] - | Reduce Output Operator [RS_8] - | key expressions:_col3 (type: double) - | sort order:- - | Statistics:Num rows: 1 Data size: 105 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col0 (type: string), _col1 (type: int), _col2 (type: bigint) - | Select Operator [SEL_6] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 105 Basic stats: COMPLETE Column stats: COMPLETE - | Group By Operator [GBY_5] - | | aggregations:["sum(VALUE._col0)"] - | | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: float) - | | outputColumnNames:["_col0","_col1","_col2","_col3"] - | | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_4] - | key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: float) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: float) - | sort order:+++ - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col3 (type: bigint) - | Group By Operator [GBY_3] - | aggregations:["sum(c_int)"] - | keys:key (type: string), c_int (type: int), c_float (type: float) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_39] - | predicate:((((((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) and (c_float > 0.0)) and ((c_int >= 1) or (c_float >= 1.0))) and ((UDFToFloat(c_int) + c_float) >= 0.0)) (type: boolean) - | Statistics:Num rows: 1 Data size: 93 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:cbo_t1 - | Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 9 [SIMPLE_EDGE] - Reduce Output Operator [RS_26] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 1 Data size: 89 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: int) - Select Operator [SEL_20] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 89 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_19] - key expressions:_col3 (type: double), _col2 (type: bigint) - sort order:-+ - Statistics:Num rows: 1 Data size: 105 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: string), _col1 (type: int) - Select Operator [SEL_17] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 1 Data size: 105 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_16] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: float) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_15] - key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: float) - Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: float) - sort order:+++ - Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col3 (type: bigint) - Group By Operator [GBY_14] - aggregations:["sum(c_int)"] - keys:key (type: string), c_int (type: int), c_float (type: float) - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_40] - predicate:((((((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) and (c_float > 0.0)) and ((c_int >= 1) or (c_float >= 1.0))) and ((UDFToFloat(c_int) + c_float) >= 0.0)) (type: boolean) - Statistics:Num rows: 1 Data size: 93 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_11] - alias:cbo_t2 - Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 6 + File Output Operator [FS_37] + Select Operator [SEL_36] (rows=1 width=20) + Output:["_col0","_col1","_col2"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_35] + Select Operator [SEL_34] (rows=1 width=20) + Output:["_col0","_col1","_col2"] + Group By Operator [GBY_33] (rows=1 width=20) + Output:["_col0","_col1","_col2"],aggregations:["count(VALUE._col0)"],keys:KEY._col0, KEY._col1 + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_32] + PartitionCols:_col0, _col1 + Group By Operator [GBY_31] (rows=1 width=20) + Output:["_col0","_col1","_col2"],aggregations:["count()"],keys:_col2, _col6 + Select Operator [SEL_30] (rows=1 width=20) + Output:["_col2","_col6"] + Filter Operator [FIL_29] (rows=1 width=20) + predicate:(((_col1 + _col4) >= 0) and ((_col1 > 0) or (_col6 >= 0)) and ((_col6 >= 1) or (_col2 >= 1)) and ((UDFToLong(_col6) + _col2) >= 0)) + Merge Join Operator [MERGEJOIN_42] (rows=3 width=20) + Output:["_col1","_col2","_col4","_col6"],keys:{"0":"_col0","1":"_col0","2":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_27] + PartitionCols:_col0 + Select Operator [SEL_24] (rows=6 width=74) + Output:["_col0","_col1"] + Filter Operator [FIL_41] (rows=6 width=74) + predicate:(c_int > 0) + TableScan [TS_22] (rows=20 width=80) + default@cbo_t3,cbo_t3,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col0 + Select Operator [SEL_9] (rows=1 width=97) + Output:["_col0","_col1","_col2"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_8] + Select Operator [SEL_6] (rows=1 width=105) + Output:["_col0","_col1","_col2","_col3"] + Group By Operator [GBY_5] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_3] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(c_int)"],keys:key, c_int, c_float + Filter Operator [FIL_39] (rows=1 width=93) + predicate:((((((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) and (c_float > 0.0)) and ((c_int >= 1) or (c_float >= 1.0))) and ((UDFToFloat(c_int) + c_float) >= 0.0)) + TableScan [TS_0] (rows=20 width=83) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] + <-Reducer 9 [SIMPLE_EDGE] + SHUFFLE [RS_26] + PartitionCols:_col0 + Select Operator [SEL_20] (rows=1 width=89) + Output:["_col0","_col1"] + <-Reducer 8 [SIMPLE_EDGE] + SHUFFLE [RS_19] + Select Operator [SEL_17] (rows=1 width=105) + Output:["_col0","_col1","_col2","_col3"] + Group By Operator [GBY_16] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_14] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(c_int)"],keys:key, c_int, c_float + Filter Operator [FIL_40] (rows=1 width=93) + predicate:((((((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) and (c_float > 0.0)) and ((c_int >= 1) or (c_float >= 1.0))) and ((UDFToFloat(c_int) + c_float) >= 0.0)) + TableScan [TS_11] (rows=20 width=83) + default@cbo_t2,cbo_t2,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] PREHOOK: query: explain select cbo_t3.c_int, c, count(*) from (select key as a, c_int+1 as b, sum(c_int) as c from cbo_t1 where (cbo_t1.c_int + 1 >= 0) and (cbo_t1.c_int > 0 or cbo_t1.c_float >= 0) group by c_float, cbo_t1.c_int, key having cbo_t1.c_float > 0 and (c_int >=1 or c_float >= 1) and (c_int + c_float) >= 0) cbo_t1 join (select key as p, c_int+1 as q, sum(c_int) as r from cbo_t2 where (cbo_t2.c_int + 1 >= 0) and (cbo_t2.c_int > 0 or cbo_t2.c_float >= 0) group by c_float, cbo_t2.c_int, key having cbo_t2.c_float > 0 and (c_int >=1 or c_float >= 1) and (c_int + c_float) >= 0) cbo_t2 on cbo_t1.a=p join cbo_t3 on cbo_t1.a=key where (b + cbo_t2.q >= 0) and (b > 0 or c_int >= 0) group by cbo_t3.c_int, c PREHOOK: type: QUERY @@ -1164,142 +730,76 @@ Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Reducer 7 <- Map 6 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 5 - File Output Operator [FS_33] - compressed:false - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_32] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_31] - | aggregations:["count(VALUE._col0)"] - | keys:KEY._col0 (type: bigint), KEY._col1 (type: int) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_30] - key expressions:_col0 (type: bigint), _col1 (type: int) - Map-reduce partition columns:_col0 (type: bigint), _col1 (type: int) - sort order:++ - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col2 (type: bigint) - Group By Operator [GBY_29] - aggregations:["count()"] - keys:_col2 (type: bigint), _col6 (type: int) - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_28] - outputColumnNames:["_col2","_col6"] - Statistics:Num rows: 2 Data size: 32 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_27] - predicate:((_col1 > 0) or (_col6 >= 0)) (type: boolean) - Statistics:Num rows: 2 Data size: 32 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_43] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col1","_col2","_col6"] - | Statistics:Num rows: 3 Data size: 48 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 8 [SIMPLE_EDGE] - | Reduce Output Operator [RS_25] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 18 Data size: 1424 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: int) - | Select Operator [SEL_23] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 18 Data size: 1424 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_41] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 18 Data size: 1424 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_21] - | alias:cbo_t3 - | Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_24] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: int), _col2 (type: bigint) - Select Operator [SEL_20] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_19] - predicate:((_col1 + _col4) >= 0) (type: boolean) - Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_42] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col0","_col1","_col2","_col4"] - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - | Reduce Output Operator [RS_16] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 1 Data size: 97 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: int), _col2 (type: bigint) - | Select Operator [SEL_6] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 97 Basic stats: COMPLETE Column stats: COMPLETE - | Group By Operator [GBY_5] - | | aggregations:["sum(VALUE._col0)"] - | | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: float) - | | outputColumnNames:["_col0","_col1","_col2","_col3"] - | | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_4] - | key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: float) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: float) - | sort order:+++ - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col3 (type: bigint) - | Group By Operator [GBY_3] - | aggregations:["sum(c_int)"] - | keys:key (type: string), c_int (type: int), c_float (type: float) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_39] - | predicate:(((((((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) and (c_float > 0.0)) and ((c_int >= 1) or (c_float >= 1.0))) and ((UDFToFloat(c_int) + c_float) >= 0.0)) and key is not null) (type: boolean) - | Statistics:Num rows: 1 Data size: 93 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:cbo_t1 - | Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_17] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 1 Data size: 89 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: int) - Select Operator [SEL_14] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 89 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_13] - | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: float) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 93 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_12] - key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: float) - Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: float) - sort order:+++ - Statistics:Num rows: 1 Data size: 93 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_11] - keys:key (type: string), c_int (type: int), c_float (type: float) - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 93 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_40] - predicate:(((((((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) and (c_float > 0.0)) and ((c_int >= 1) or (c_float >= 1.0))) and ((UDFToFloat(c_int) + c_float) >= 0.0)) and key is not null) (type: boolean) - Statistics:Num rows: 1 Data size: 93 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_8] - alias:cbo_t2 - Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 5 + File Output Operator [FS_33] + Select Operator [SEL_32] (rows=1 width=20) + Output:["_col0","_col1","_col2"] + Group By Operator [GBY_31] (rows=1 width=20) + Output:["_col0","_col1","_col2"],aggregations:["count(VALUE._col0)"],keys:KEY._col0, KEY._col1 + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_30] + PartitionCols:_col0, _col1 + Group By Operator [GBY_29] (rows=1 width=20) + Output:["_col0","_col1","_col2"],aggregations:["count()"],keys:_col2, _col6 + Select Operator [SEL_28] (rows=2 width=16) + Output:["_col2","_col6"] + Filter Operator [FIL_27] (rows=2 width=16) + predicate:((_col1 > 0) or (_col6 >= 0)) + Merge Join Operator [MERGEJOIN_43] (rows=3 width=16) + Output:["_col1","_col2","_col6"],keys:{"0":"_col0","1":"_col0"} + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col0 + Select Operator [SEL_23] (rows=18 width=79) + Output:["_col0","_col1"] + Filter Operator [FIL_41] (rows=18 width=79) + predicate:key is not null + TableScan [TS_21] (rows=20 width=80) + default@cbo_t3,cbo_t3,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_24] + PartitionCols:_col0 + Select Operator [SEL_20] (rows=1 width=101) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_19] (rows=1 width=101) + predicate:((_col1 + _col4) >= 0) + Merge Join Operator [MERGEJOIN_42] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col4"],keys:{"0":"_col0","1":"_col0"} + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0 + Select Operator [SEL_6] (rows=1 width=97) + Output:["_col0","_col1","_col2"] + Group By Operator [GBY_5] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_3] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(c_int)"],keys:key, c_int, c_float + Filter Operator [FIL_39] (rows=1 width=93) + predicate:(((((((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) and (c_float > 0.0)) and ((c_int >= 1) or (c_float >= 1.0))) and ((UDFToFloat(c_int) + c_float) >= 0.0)) and key is not null) + TableScan [TS_0] (rows=20 width=83) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] + <-Reducer 7 [SIMPLE_EDGE] + SHUFFLE [RS_17] + PartitionCols:_col0 + Select Operator [SEL_14] (rows=1 width=89) + Output:["_col0","_col1"] + Group By Operator [GBY_13] (rows=1 width=93) + Output:["_col0","_col1","_col2"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Map 6 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_11] (rows=1 width=93) + Output:["_col0","_col1","_col2"],keys:key, c_int, c_float + Filter Operator [FIL_40] (rows=1 width=93) + predicate:(((((((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) and (c_float > 0.0)) and ((c_int >= 1) or (c_float >= 1.0))) and ((UDFToFloat(c_int) + c_float) >= 0.0)) and key is not null) + TableScan [TS_8] (rows=20 width=83) + default@cbo_t2,cbo_t2,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] PREHOOK: query: explain select unionsrc.key FROM (select 'tst1' as key, count(1) as value from src) unionsrc PREHOOK: type: QUERY @@ -1311,36 +811,23 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_7] - compressed:false - Statistics:Num rows: 1 Data size: 88 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 88 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_4] - | aggregations:["count(VALUE._col0)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: bigint) - Group By Operator [GBY_2] - aggregations:["count(key)"] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_1] - outputColumnNames:["key"] - Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_0] - alias:src - Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_7] + Select Operator [SEL_5] (rows=1 width=88) + Output:["_col0"] + Group By Operator [GBY_4] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_3] + Group By Operator [GBY_2] (rows=1 width=8) + Output:["_col0"],aggregations:["count(key)"] + Select Operator [SEL_1] (rows=500 width=87) + Output:["key"] + TableScan [TS_0] (rows=500 width=87) + default@src,src,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] PREHOOK: query: explain select unionsrc.key FROM (select 'max' as key, max(c_int) as value from cbo_t3 s1 UNION ALL @@ -1363,99 +850,56 @@ Reducer 6 <- Map 5 (SIMPLE_EDGE), Union 3 (CONTAINS) Reducer 8 <- Map 7 (SIMPLE_EDGE), Union 3 (CONTAINS) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 4 - File Output Operator [FS_26] - compressed:false - Statistics:Num rows: 3 Data size: 261 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_25] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 3 Data size: 261 Basic stats: COMPLETE Column stats: COMPLETE - |<-Union 3 [SIMPLE_EDGE] - |<-Reducer 2 [CONTAINS] - | Reduce Output Operator [RS_24] - | key expressions:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 3 Data size: 261 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_5] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 87 Basic stats: COMPLETE Column stats: COMPLETE - | Group By Operator [GBY_4] - | | aggregations:["count(VALUE._col0)"] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_3] - | sort order: - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col0 (type: bigint) - | Group By Operator [GBY_2] - | aggregations:["count(key)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_1] - | outputColumnNames:["key"] - | Statistics:Num rows: 20 Data size: 1530 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:s1 - | Statistics:Num rows: 20 Data size: 1530 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 6 [CONTAINS] - | Reduce Output Operator [RS_24] - | key expressions:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 3 Data size: 261 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_12] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 87 Basic stats: COMPLETE Column stats: COMPLETE - | Group By Operator [GBY_11] - | | aggregations:["count(VALUE._col0)"] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Map 5 [SIMPLE_EDGE] - | Reduce Output Operator [RS_10] - | sort order: - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col0 (type: bigint) - | Group By Operator [GBY_9] - | aggregations:["count(key)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_8] - | outputColumnNames:["key"] - | Statistics:Num rows: 20 Data size: 1530 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_7] - | alias:s1 - | Statistics:Num rows: 20 Data size: 1530 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 8 [CONTAINS] - Reduce Output Operator [RS_24] - key expressions:_col0 (type: string) - sort order:+ - Statistics:Num rows: 3 Data size: 261 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_21] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 87 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_20] - | aggregations:["count(VALUE._col0)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_19] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: bigint) - Group By Operator [GBY_18] - aggregations:["count(key)"] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_17] - outputColumnNames:["key"] - Statistics:Num rows: 20 Data size: 1530 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_16] - alias:s1 - Statistics:Num rows: 20 Data size: 1530 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 4 + File Output Operator [FS_26] + Select Operator [SEL_25] (rows=3 width=87) + Output:["_col0"] + <-Union 3 [SIMPLE_EDGE] + <-Reducer 2 [CONTAINS] + Reduce Output Operator [RS_24] + Select Operator [SEL_5] (rows=1 width=87) + Output:["_col0"] + Group By Operator [GBY_4] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_3] + Group By Operator [GBY_2] (rows=1 width=8) + Output:["_col0"],aggregations:["count(key)"] + Select Operator [SEL_1] (rows=20 width=76) + Output:["key"] + TableScan [TS_0] (rows=20 width=76) + default@cbo_t3,s1,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] + <-Reducer 6 [CONTAINS] + Reduce Output Operator [RS_24] + Select Operator [SEL_12] (rows=1 width=87) + Output:["_col0"] + Group By Operator [GBY_11] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Map 5 [SIMPLE_EDGE] + SHUFFLE [RS_10] + Group By Operator [GBY_9] (rows=1 width=8) + Output:["_col0"],aggregations:["count(key)"] + Select Operator [SEL_8] (rows=20 width=76) + Output:["key"] + TableScan [TS_7] (rows=20 width=76) + default@cbo_t3,s1,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] + <-Reducer 8 [CONTAINS] + Reduce Output Operator [RS_24] + Select Operator [SEL_21] (rows=1 width=87) + Output:["_col0"] + Group By Operator [GBY_20] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_19] + Group By Operator [GBY_18] (rows=1 width=8) + Output:["_col0"],aggregations:["count(key)"] + Select Operator [SEL_17] (rows=20 width=76) + Output:["key"] + TableScan [TS_16] (rows=20 width=76) + default@cbo_t3,s1,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] PREHOOK: query: explain select unionsrc.key, count(1) FROM (select 'max' as key, max(c_int) as value from cbo_t3 s1 UNION ALL @@ -1479,131 +923,69 @@ Reducer 7 <- Map 6 (SIMPLE_EDGE), Union 3 (CONTAINS) Reducer 9 <- Map 8 (SIMPLE_EDGE), Union 3 (CONTAINS) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 5 - File Output Operator [FS_31] - compressed:false - Statistics:Num rows: 1 Data size: 95 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_30] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 95 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_29] - key expressions:_col0 (type: string) - sort order:+ - Statistics:Num rows: 1 Data size: 95 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: bigint) - Group By Operator [GBY_27] - | aggregations:["count(VALUE._col0)"] - | keys:KEY._col0 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 95 Basic stats: COMPLETE Column stats: COMPLETE - |<-Union 3 [SIMPLE_EDGE] - |<-Reducer 2 [CONTAINS] - | Reduce Output Operator [RS_26] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 1 Data size: 95 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: bigint) - | Group By Operator [GBY_25] - | aggregations:["count(1)"] - | keys:_col0 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 95 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_5] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 87 Basic stats: COMPLETE Column stats: COMPLETE - | Group By Operator [GBY_4] - | | aggregations:["count(VALUE._col0)"] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_3] - | sort order: - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col0 (type: bigint) - | Group By Operator [GBY_2] - | aggregations:["count(key)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_1] - | outputColumnNames:["key"] - | Statistics:Num rows: 20 Data size: 1530 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:s1 - | Statistics:Num rows: 20 Data size: 1530 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 7 [CONTAINS] - | Reduce Output Operator [RS_26] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 1 Data size: 95 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: bigint) - | Group By Operator [GBY_25] - | aggregations:["count(1)"] - | keys:_col0 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 95 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_12] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 87 Basic stats: COMPLETE Column stats: COMPLETE - | Group By Operator [GBY_11] - | | aggregations:["count(VALUE._col0)"] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Map 6 [SIMPLE_EDGE] - | Reduce Output Operator [RS_10] - | sort order: - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col0 (type: bigint) - | Group By Operator [GBY_9] - | aggregations:["count(key)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_8] - | outputColumnNames:["key"] - | Statistics:Num rows: 20 Data size: 1530 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_7] - | alias:s1 - | Statistics:Num rows: 20 Data size: 1530 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 9 [CONTAINS] - Reduce Output Operator [RS_26] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 1 Data size: 95 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: bigint) - Group By Operator [GBY_25] - aggregations:["count(1)"] - keys:_col0 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 95 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_21] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 87 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_20] - | aggregations:["count(VALUE._col0)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_19] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: bigint) - Group By Operator [GBY_18] - aggregations:["count(key)"] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_17] - outputColumnNames:["key"] - Statistics:Num rows: 20 Data size: 1530 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_16] - alias:s1 - Statistics:Num rows: 20 Data size: 1530 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 5 + File Output Operator [FS_31] + Select Operator [SEL_30] (rows=1 width=95) + Output:["_col0","_col1"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_29] + Group By Operator [GBY_27] (rows=1 width=95) + Output:["_col0","_col1"],aggregations:["count(VALUE._col0)"],keys:KEY._col0 + <-Union 3 [SIMPLE_EDGE] + <-Reducer 2 [CONTAINS] + Reduce Output Operator [RS_26] + PartitionCols:_col0 + Group By Operator [GBY_25] (rows=1 width=95) + Output:["_col0","_col1"],aggregations:["count(1)"],keys:_col0 + Select Operator [SEL_5] (rows=1 width=87) + Output:["_col0"] + Group By Operator [GBY_4] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_3] + Group By Operator [GBY_2] (rows=1 width=8) + Output:["_col0"],aggregations:["count(key)"] + Select Operator [SEL_1] (rows=20 width=76) + Output:["key"] + TableScan [TS_0] (rows=20 width=76) + default@cbo_t3,s1,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] + <-Reducer 7 [CONTAINS] + Reduce Output Operator [RS_26] + PartitionCols:_col0 + Group By Operator [GBY_25] (rows=1 width=95) + Output:["_col0","_col1"],aggregations:["count(1)"],keys:_col0 + Select Operator [SEL_12] (rows=1 width=87) + Output:["_col0"] + Group By Operator [GBY_11] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Map 6 [SIMPLE_EDGE] + SHUFFLE [RS_10] + Group By Operator [GBY_9] (rows=1 width=8) + Output:["_col0"],aggregations:["count(key)"] + Select Operator [SEL_8] (rows=20 width=76) + Output:["key"] + TableScan [TS_7] (rows=20 width=76) + default@cbo_t3,s1,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] + <-Reducer 9 [CONTAINS] + Reduce Output Operator [RS_26] + PartitionCols:_col0 + Group By Operator [GBY_25] (rows=1 width=95) + Output:["_col0","_col1"],aggregations:["count(1)"],keys:_col0 + Select Operator [SEL_21] (rows=1 width=87) + Output:["_col0"] + Group By Operator [GBY_20] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_19] + Group By Operator [GBY_18] (rows=1 width=8) + Output:["_col0"],aggregations:["count(key)"] + Select Operator [SEL_17] (rows=20 width=76) + Output:["key"] + TableScan [TS_16] (rows=20 width=76) + default@cbo_t3,s1,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] PREHOOK: query: explain select cbo_t1.key from cbo_t1 join cbo_t3 where cbo_t1.key=cbo_t3.key and cbo_t1.key >= 1 PREHOOK: type: QUERY @@ -1615,49 +997,31 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_10] - compressed:false - Statistics:Num rows: 18 Data size: 1530 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Merge Join Operator [MERGEJOIN_15] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col0"] - | Statistics:Num rows: 18 Data size: 1530 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_6] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 6 Data size: 425 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_2] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 6 Data size: 425 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_13] - | predicate:(UDFToDouble(key) >= 1.0) (type: boolean) - | Statistics:Num rows: 6 Data size: 425 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:cbo_t1 - | Statistics:Num rows: 20 Data size: 1530 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_7] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 6 Data size: 425 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 6 Data size: 425 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_14] - predicate:(UDFToDouble(key) >= 1.0) (type: boolean) - Statistics:Num rows: 6 Data size: 425 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_3] - alias:cbo_t3 - Statistics:Num rows: 20 Data size: 1530 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_10] + Merge Join Operator [MERGEJOIN_15] (rows=18 width=85) + Output:["_col0"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_6] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=6 width=70) + Output:["_col0"] + Filter Operator [FIL_13] (rows=6 width=70) + predicate:(UDFToDouble(key) >= 1.0) + TableScan [TS_0] (rows=20 width=76) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_7] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=6 width=70) + Output:["_col0"] + Filter Operator [FIL_14] (rows=6 width=70) + predicate:(UDFToDouble(key) >= 1.0) + TableScan [TS_3] (rows=20 width=76) + default@cbo_t3,cbo_t3,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] PREHOOK: query: explain select cbo_t1.c_int, cbo_t2.c_int from cbo_t1 left outer join cbo_t2 on cbo_t1.key=cbo_t2.key PREHOOK: type: QUERY @@ -1669,48 +1033,29 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_8] - compressed:false - Statistics:Num rows: 100 Data size: 800 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_7] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 100 Data size: 800 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_11] - | condition map:[{"":"Left Outer Join0 to 1"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col1","_col3"] - | Statistics:Num rows: 100 Data size: 800 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_4] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: int) - | Select Operator [SEL_1] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:cbo_t1 - | Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_5] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: int) - Select Operator [SEL_3] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_2] - alias:cbo_t2 - Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_8] + Select Operator [SEL_7] (rows=100 width=8) + Output:["_col0","_col1"] + Merge Join Operator [MERGEJOIN_11] (rows=100 width=8) + Output:["_col1","_col3"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:_col0 + Select Operator [SEL_1] (rows=20 width=80) + Output:["_col0","_col1"] + TableScan [TS_0] (rows=20 width=80) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_5] + PartitionCols:_col0 + Select Operator [SEL_3] (rows=20 width=80) + Output:["_col0","_col1"] + TableScan [TS_2] (rows=20 width=80) + default@cbo_t2,cbo_t2,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int"] PREHOOK: query: explain select cbo_t1.c_int, cbo_t2.c_int from cbo_t1 full outer join cbo_t2 on cbo_t1.key=cbo_t2.key PREHOOK: type: QUERY @@ -1722,48 +1067,29 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_8] - compressed:false - Statistics:Num rows: 100 Data size: 800 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_7] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 100 Data size: 800 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_9] - | condition map:[{"":"Outer Join 0 to 1"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col1","_col3"] - | Statistics:Num rows: 100 Data size: 800 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_4] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: int) - | Select Operator [SEL_1] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:cbo_t1 - | Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_5] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: int) - Select Operator [SEL_3] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_2] - alias:cbo_t2 - Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_8] + Select Operator [SEL_7] (rows=100 width=8) + Output:["_col0","_col1"] + Merge Join Operator [MERGEJOIN_9] (rows=100 width=8) + Output:["_col1","_col3"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:_col0 + Select Operator [SEL_1] (rows=20 width=80) + Output:["_col0","_col1"] + TableScan [TS_0] (rows=20 width=80) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_5] + PartitionCols:_col0 + Select Operator [SEL_3] (rows=20 width=80) + Output:["_col0","_col1"] + TableScan [TS_2] (rows=20 width=80) + default@cbo_t2,cbo_t2,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int"] PREHOOK: query: explain select b, cbo_t1.c, cbo_t2.p, q, cbo_t3.c_int from (select key as a, c_int as b, cbo_t1.c_float as c from cbo_t1) cbo_t1 join (select cbo_t2.key as p, cbo_t2.c_int as q, c_float as r from cbo_t2) cbo_t2 on cbo_t1.a=p join cbo_t3 on cbo_t1.a=key PREHOOK: type: QUERY @@ -1775,70 +1101,42 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_14] - compressed:false - Statistics:Num rows: 291 Data size: 29391 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_13] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - Statistics:Num rows: 291 Data size: 29391 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_24] - | condition map:[{"":"Inner Join 0 to 1"},{"":"Inner Join 0 to 2"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)","2":"_col0 (type: string)"} - | outputColumnNames:["_col1","_col2","_col4","_col5","_col6"] - | Statistics:Num rows: 291 Data size: 29391 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_9] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 18 Data size: 1488 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: int), _col2 (type: float) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 18 Data size: 1488 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_21] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 18 Data size: 1488 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:cbo_t1 - | Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 3 [SIMPLE_EDGE] - | Reduce Output Operator [RS_10] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 18 Data size: 1424 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: int) - | Select Operator [SEL_5] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 18 Data size: 1424 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_22] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 18 Data size: 1424 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_3] - | alias:cbo_t3 - | Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_11] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 18 Data size: 1424 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: int) - Select Operator [SEL_8] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 18 Data size: 1424 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_23] - predicate:key is not null (type: boolean) - Statistics:Num rows: 18 Data size: 1424 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_6] - alias:cbo_t2 - Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_14] + Select Operator [SEL_13] (rows=291 width=101) + Output:["_col0","_col1","_col2","_col3","_col4"] + Merge Join Operator [MERGEJOIN_24] (rows=291 width=101) + Output:["_col1","_col2","_col4","_col5","_col6"],keys:{"0":"_col0","1":"_col0","2":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=18 width=82) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_21] (rows=18 width=82) + predicate:key is not null + TableScan [TS_0] (rows=20 width=83) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_10] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=18 width=79) + Output:["_col0","_col1"] + Filter Operator [FIL_22] (rows=18 width=79) + predicate:key is not null + TableScan [TS_3] (rows=20 width=80) + default@cbo_t3,cbo_t3,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int"] + <-Map 4 [SIMPLE_EDGE] + SHUFFLE [RS_11] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=18 width=79) + Output:["_col0","_col1"] + Filter Operator [FIL_23] (rows=18 width=79) + predicate:key is not null + TableScan [TS_6] (rows=20 width=80) + default@cbo_t2,cbo_t2,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int"] PREHOOK: query: explain select key, cbo_t1.c_int, cbo_t2.p, q from cbo_t1 join (select cbo_t2.key as p, cbo_t2.c_int as q, c_float as r from cbo_t2) cbo_t2 on cbo_t1.key=p join (select key as a, c_int as b, cbo_t3.c_float as c from cbo_t3)cbo_t3 on cbo_t1.key=a PREHOOK: type: QUERY @@ -1850,69 +1148,42 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_14] - compressed:false - Statistics:Num rows: 291 Data size: 51798 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_13] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 291 Data size: 51798 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_24] - | condition map:[{"":"Inner Join 0 to 1"},{"":"Inner Join 0 to 2"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)","2":"_col0 (type: string)"} - | outputColumnNames:["_col0","_col1","_col3","_col4"] - | Statistics:Num rows: 291 Data size: 51798 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_9] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 18 Data size: 1424 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: int) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 18 Data size: 1424 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_21] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 18 Data size: 1424 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:cbo_t1 - | Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 3 [SIMPLE_EDGE] - | Reduce Output Operator [RS_10] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 18 Data size: 1360 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_5] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 18 Data size: 1360 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_22] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 18 Data size: 1360 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_3] - | alias:cbo_t3 - | Statistics:Num rows: 20 Data size: 1530 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_11] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 18 Data size: 1424 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: int) - Select Operator [SEL_8] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 18 Data size: 1424 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_23] - predicate:key is not null (type: boolean) - Statistics:Num rows: 18 Data size: 1424 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_6] - alias:cbo_t2 - Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_14] + Select Operator [SEL_13] (rows=291 width=178) + Output:["_col0","_col1","_col2","_col3"] + Merge Join Operator [MERGEJOIN_24] (rows=291 width=178) + Output:["_col0","_col1","_col3","_col4"],keys:{"0":"_col0","1":"_col0","2":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=18 width=79) + Output:["_col0","_col1"] + Filter Operator [FIL_21] (rows=18 width=79) + predicate:key is not null + TableScan [TS_0] (rows=20 width=80) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_10] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=18 width=75) + Output:["_col0"] + Filter Operator [FIL_22] (rows=18 width=75) + predicate:key is not null + TableScan [TS_3] (rows=20 width=76) + default@cbo_t3,cbo_t3,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] + <-Map 4 [SIMPLE_EDGE] + SHUFFLE [RS_11] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=18 width=79) + Output:["_col0","_col1"] + Filter Operator [FIL_23] (rows=18 width=79) + predicate:key is not null + TableScan [TS_6] (rows=20 width=80) + default@cbo_t2,cbo_t2,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int"] PREHOOK: query: explain select * from (select q, b, cbo_t2.p, cbo_t1.c, cbo_t3.c_int from (select key as a, c_int as b, cbo_t1.c_float as c from cbo_t1 where (cbo_t1.c_int + 1 == 2) and (cbo_t1.c_int > 0 or cbo_t1.c_float >= 0)) cbo_t1 full outer join (select cbo_t2.key as p, cbo_t2.c_int as q, c_float as r from cbo_t2 where (cbo_t2.c_int + 1 == 2) and (cbo_t2.c_int > 0 or cbo_t2.c_float >= 0)) cbo_t2 on cbo_t1.a=p join cbo_t3 on cbo_t1.a=key where (b + cbo_t2.q == 2) and (b > 0 or c_int >= 0)) R where (q + 1 = 2) and (R.b > 0 or c_int >= 0) PREHOOK: type: QUERY @@ -1925,88 +1196,51 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE) Reducer 3 <- Map 5 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 3 - File Output Operator [FS_19] - compressed:false - Statistics:Num rows: 6 Data size: 606 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_18] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - Statistics:Num rows: 6 Data size: 606 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_17] - predicate:((_col1 > 0) or (_col6 >= 0)) (type: boolean) - Statistics:Num rows: 6 Data size: 606 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_28] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col1","_col2","_col3","_col4","_col6"] - | Statistics:Num rows: 10 Data size: 1010 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 5 [SIMPLE_EDGE] - | Reduce Output Operator [RS_15] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 18 Data size: 1424 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: int) - | Select Operator [SEL_13] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 18 Data size: 1424 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_26] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 18 Data size: 1424 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_11] - | alias:cbo_t3 - | Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_14] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 3 Data size: 546 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: int), _col2 (type: float), _col3 (type: string), _col4 (type: int) - Filter Operator [FIL_9] - predicate:(((_col1 + _col4) = 2) and ((_col4 + 1) = 2)) (type: boolean) - Statistics:Num rows: 3 Data size: 546 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_27] - | condition map:[{"":"Left Outer Join0 to 1"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 15 Data size: 2730 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_6] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 5 Data size: 372 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: int), _col2 (type: float) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 5 Data size: 372 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_24] - | predicate:((((c_int + 1) = 2) and ((c_int > 0) or (c_float >= 0.0))) and key is not null) (type: boolean) - | Statistics:Num rows: 5 Data size: 372 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:cbo_t1 - | Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_7] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 6 Data size: 445 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: int) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 6 Data size: 445 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_25] - predicate:(((c_int + 1) = 2) and ((c_int > 0) or (c_float >= 0.0))) (type: boolean) - Statistics:Num rows: 6 Data size: 465 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_3] - alias:cbo_t2 - Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 3 + File Output Operator [FS_19] + Select Operator [SEL_18] (rows=6 width=101) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_17] (rows=6 width=101) + predicate:((_col1 > 0) or (_col6 >= 0)) + Merge Join Operator [MERGEJOIN_28] (rows=10 width=101) + Output:["_col1","_col2","_col3","_col4","_col6"],keys:{"0":"_col0","1":"_col0"} + <-Map 5 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col0 + Select Operator [SEL_13] (rows=18 width=79) + Output:["_col0","_col1"] + Filter Operator [FIL_26] (rows=18 width=79) + predicate:key is not null + TableScan [TS_11] (rows=20 width=80) + default@cbo_t3,cbo_t3,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_14] + PartitionCols:_col0 + Filter Operator [FIL_9] (rows=3 width=182) + predicate:(((_col1 + _col4) = 2) and ((_col4 + 1) = 2)) + Merge Join Operator [MERGEJOIN_27] (rows=15 width=182) + Output:["_col0","_col1","_col2","_col3","_col4"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_6] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=5 width=74) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_24] (rows=5 width=74) + predicate:((((c_int + 1) = 2) and ((c_int > 0) or (c_float >= 0.0))) and key is not null) + TableScan [TS_0] (rows=20 width=83) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] + <-Map 4 [SIMPLE_EDGE] + SHUFFLE [RS_7] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=6 width=74) + Output:["_col0","_col1"] + Filter Operator [FIL_25] (rows=6 width=77) + predicate:(((c_int + 1) = 2) and ((c_int > 0) or (c_float >= 0.0))) + TableScan [TS_3] (rows=20 width=83) + default@cbo_t2,cbo_t2,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] PREHOOK: query: explain select * from (select q, b, cbo_t2.p, cbo_t1.c, cbo_t3.c_int from (select key as a, c_int as b, cbo_t1.c_float as c from cbo_t1 where (cbo_t1.c_int + 1 == 2) and (cbo_t1.c_int > 0 or cbo_t1.c_float >= 0)) cbo_t1 right outer join (select cbo_t2.key as p, cbo_t2.c_int as q, c_float as r from cbo_t2 where (cbo_t2.c_int + 1 == 2) and (cbo_t2.c_int > 0 or cbo_t2.c_float >= 0)) cbo_t2 on cbo_t1.a=p right outer join cbo_t3 on cbo_t1.a=key where (b + cbo_t2.q == 2) and (b > 0 or c_int >= 0)) R where (q + 1 = 2) and (R.b > 0 or c_int >= 0) PREHOOK: type: QUERY @@ -2018,70 +1252,42 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_14] - compressed:false - Statistics:Num rows: 8 Data size: 808 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_13] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - Statistics:Num rows: 8 Data size: 808 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_12] - predicate:(((_col1 + _col4) = 2) and ((_col1 > 0) or (_col6 >= 0)) and ((_col4 + 1) = 2) and ((_col1 > 0) or (_col6 >= 0))) (type: boolean) - Statistics:Num rows: 8 Data size: 808 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_19] - | condition map:[{"":"Right Outer Join0 to 1"},{"":"Right Outer Join0 to 2"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)","2":"_col0 (type: string)"} - | outputColumnNames:["_col1","_col2","_col3","_col4","_col6"] - | Statistics:Num rows: 72 Data size: 7272 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_8] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 6 Data size: 465 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: int), _col2 (type: float) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 6 Data size: 465 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_17] - | predicate:(((c_int + 1) = 2) and ((c_int > 0) or (c_float >= 0.0))) (type: boolean) - | Statistics:Num rows: 6 Data size: 465 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:cbo_t1 - | Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 3 [SIMPLE_EDGE] - | Reduce Output Operator [RS_9] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 6 Data size: 445 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: int) - | Select Operator [SEL_5] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 6 Data size: 445 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_18] - | predicate:(((c_int + 1) = 2) and ((c_int > 0) or (c_float >= 0.0))) (type: boolean) - | Statistics:Num rows: 6 Data size: 465 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_3] - | alias:cbo_t2 - | Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: int) - Select Operator [SEL_7] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_6] - alias:cbo_t3 - Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_14] + Select Operator [SEL_13] (rows=8 width=101) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_12] (rows=8 width=101) + predicate:(((_col1 + _col4) = 2) and ((_col1 > 0) or (_col6 >= 0)) and ((_col4 + 1) = 2) and ((_col1 > 0) or (_col6 >= 0))) + Merge Join Operator [MERGEJOIN_19] (rows=72 width=101) + Output:["_col1","_col2","_col3","_col4","_col6"],keys:{"0":"_col0","1":"_col0","2":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_8] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=6 width=77) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_17] (rows=6 width=77) + predicate:(((c_int + 1) = 2) and ((c_int > 0) or (c_float >= 0.0))) + TableScan [TS_0] (rows=20 width=83) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=6 width=74) + Output:["_col0","_col1"] + Filter Operator [FIL_18] (rows=6 width=77) + predicate:(((c_int + 1) = 2) and ((c_int > 0) or (c_float >= 0.0))) + TableScan [TS_3] (rows=20 width=83) + default@cbo_t2,cbo_t2,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] + <-Map 4 [SIMPLE_EDGE] + SHUFFLE [RS_10] + PartitionCols:_col0 + Select Operator [SEL_7] (rows=20 width=80) + Output:["_col0","_col1"] + TableScan [TS_6] (rows=20 width=80) + default@cbo_t3,cbo_t3,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int"] PREHOOK: query: explain select key, (c_int+1)+2 as x, sum(c_int) from cbo_t1 group by c_float, cbo_t1.c_int, key order by x limit 1 PREHOOK: type: QUERY @@ -2094,52 +1300,30 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:1 - Stage-1 - Reducer 3 - File Output Operator [FS_10] - compressed:false - Statistics:Num rows: 1 Data size: 97 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_9] - Number of rows:1 - Statistics:Num rows: 1 Data size: 97 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 10 Data size: 885 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_7] - key expressions:_col1 (type: int) - sort order:+ - Statistics:Num rows: 10 Data size: 885 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: string), _col2 (type: bigint) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 10 Data size: 885 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_4] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: float) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 10 Data size: 917 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: float) - Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: float) - sort order:+++ - Statistics:Num rows: 10 Data size: 917 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col3 (type: bigint) - Group By Operator [GBY_2] - aggregations:["sum(c_int)"] - keys:key (type: string), c_int (type: int), c_float (type: float) - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 10 Data size: 917 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_1] - outputColumnNames:["key","c_int","c_float"] - Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_0] - alias:cbo_t1 - Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:1 + Stage-1 + Reducer 3 + File Output Operator [FS_10] + Limit [LIM_9] (rows=1 width=97) + Number of rows:1 + Select Operator [SEL_8] (rows=10 width=88) + Output:["_col0","_col1","_col2"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_7] + Select Operator [SEL_5] (rows=10 width=88) + Output:["_col0","_col1","_col2"] + Group By Operator [GBY_4] (rows=10 width=91) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_3] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_2] (rows=10 width=91) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(c_int)"],keys:key, c_int, c_float + Select Operator [SEL_1] (rows=20 width=83) + Output:["key","c_int","c_float"] + TableScan [TS_0] (rows=20 width=83) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] PREHOOK: query: explain select x, y, count(*) from (select key, (c_int+c_float+1+2) as x, sum(c_int) as y from cbo_t1 group by c_float, cbo_t1.c_int, key) R group by y, x order by x,y limit 1 PREHOOK: type: QUERY @@ -2153,72 +1337,39 @@ Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:1 - Stage-1 - Reducer 4 - File Output Operator [FS_15] - compressed:false - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_14] - Number of rows:1 - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_13] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 5 Data size: 100 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_12] - key expressions:_col0 (type: float), _col1 (type: bigint) - sort order:++ - Statistics:Num rows: 5 Data size: 100 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col2 (type: bigint) - Select Operator [SEL_11] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 5 Data size: 100 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_10] - | aggregations:["count(VALUE._col0)"] - | keys:KEY._col0 (type: bigint), KEY._col1 (type: float) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 5 Data size: 100 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_9] - key expressions:_col0 (type: bigint), _col1 (type: float) - Map-reduce partition columns:_col0 (type: bigint), _col1 (type: float) - sort order:++ - Statistics:Num rows: 5 Data size: 100 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col2 (type: bigint) - Group By Operator [GBY_8] - aggregations:["count()"] - keys:_col0 (type: bigint), _col1 (type: float) - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 5 Data size: 100 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 10 Data size: 917 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_4] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: float) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 10 Data size: 917 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: float) - Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: float) - sort order:+++ - Statistics:Num rows: 10 Data size: 917 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col3 (type: bigint) - Group By Operator [GBY_2] - aggregations:["sum(c_int)"] - keys:key (type: string), c_int (type: int), c_float (type: float) - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 10 Data size: 917 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_1] - outputColumnNames:["key","c_int","c_float"] - Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_0] - alias:cbo_t1 - Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:1 + Stage-1 + Reducer 4 + File Output Operator [FS_15] + Limit [LIM_14] (rows=1 width=20) + Number of rows:1 + Select Operator [SEL_13] (rows=5 width=20) + Output:["_col0","_col1","_col2"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_12] + Select Operator [SEL_11] (rows=5 width=20) + Output:["_col0","_col1","_col2"] + Group By Operator [GBY_10] (rows=5 width=20) + Output:["_col0","_col1","_col2"],aggregations:["count(VALUE._col0)"],keys:KEY._col0, KEY._col1 + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col0, _col1 + Group By Operator [GBY_8] (rows=5 width=20) + Output:["_col0","_col1","_col2"],aggregations:["count()"],keys:_col0, _col1 + Select Operator [SEL_5] (rows=10 width=91) + Output:["_col0","_col1"] + Group By Operator [GBY_4] (rows=10 width=91) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_3] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_2] (rows=10 width=91) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(c_int)"],keys:key, c_int, c_float + Select Operator [SEL_1] (rows=20 width=83) + Output:["key","c_int","c_float"] + TableScan [TS_0] (rows=20 width=83) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] PREHOOK: query: explain select key from(select key from (select key from cbo_t1 limit 5)cbo_t2 limit 5)cbo_t3 limit 5 PREHOOK: type: QUERY @@ -2231,51 +1382,33 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:5 - Stage-1 - Reducer 3 - File Output Operator [FS_13] - compressed:false - Statistics:Num rows: 5 Data size: 340 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_12] - Number of rows:5 - Statistics:Num rows: 5 Data size: 340 Basic stats: COMPLETE Column stats: COMPLETE - Limit [LIM_10] + Fetch Operator + limit:5 + Stage-1 + Reducer 3 + File Output Operator [FS_13] + Limit [LIM_12] (rows=5 width=68) + Number of rows:5 + Limit [LIM_10] (rows=5 width=68) + Number of rows:5 + Select Operator [SEL_9] (rows=5 width=68) + Output:["_col0"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_8] + Limit [LIM_7] (rows=5 width=68) Number of rows:5 - Statistics:Num rows: 5 Data size: 340 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_9] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 5 Data size: 340 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_8] - sort order: - Statistics:Num rows: 5 Data size: 340 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: string) - Limit [LIM_7] - Number of rows:5 - Statistics:Num rows: 5 Data size: 340 Basic stats: COMPLETE Column stats: COMPLETE - Limit [LIM_5] - Number of rows:5 - Statistics:Num rows: 5 Data size: 340 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_4] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 5 Data size: 340 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - sort order: - Statistics:Num rows: 5 Data size: 340 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: string) - Limit [LIM_2] - Number of rows:5 - Statistics:Num rows: 5 Data size: 340 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_1] - outputColumnNames:["_col0"] - Statistics:Num rows: 20 Data size: 1530 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_0] - alias:cbo_t1 - Statistics:Num rows: 20 Data size: 1530 Basic stats: COMPLETE Column stats: COMPLETE + Limit [LIM_5] (rows=5 width=68) + Number of rows:5 + Select Operator [SEL_4] (rows=5 width=68) + Output:["_col0"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_3] + Limit [LIM_2] (rows=5 width=68) + Number of rows:5 + Select Operator [SEL_1] (rows=20 width=76) + Output:["_col0"] + TableScan [TS_0] (rows=20 width=76) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] PREHOOK: query: explain select key, c_int from(select key, c_int from (select key, c_int from cbo_t1 order by c_int limit 5)cbo_t1 order by c_int limit 5)cbo_t2 order by c_int limit 5 PREHOOK: type: QUERY @@ -2289,56 +1422,33 @@ Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:5 - Stage-1 - Reducer 4 - File Output Operator [FS_13] - compressed:false - Statistics:Num rows: 5 Data size: 356 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_12] - Number of rows:5 - Statistics:Num rows: 5 Data size: 356 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_11] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 5 Data size: 356 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - key expressions:_col1 (type: int) - sort order:+ - Statistics:Num rows: 5 Data size: 356 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: string) - Limit [LIM_8] - Number of rows:5 - Statistics:Num rows: 5 Data size: 356 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_7] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 5 Data size: 356 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_6] - key expressions:_col1 (type: int) - sort order:+ - Statistics:Num rows: 5 Data size: 356 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: string) - Limit [LIM_4] - Number of rows:5 - Statistics:Num rows: 5 Data size: 356 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_3] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_2] - key expressions:_col1 (type: int) - sort order:+ - Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: string) - Select Operator [SEL_1] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_0] - alias:cbo_t1 - Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:5 + Stage-1 + Reducer 4 + File Output Operator [FS_13] + Limit [LIM_12] (rows=5 width=71) + Number of rows:5 + Select Operator [SEL_11] (rows=5 width=71) + Output:["_col0","_col1"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_10] + Limit [LIM_8] (rows=5 width=71) + Number of rows:5 + Select Operator [SEL_7] (rows=5 width=71) + Output:["_col0","_col1"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_6] + Limit [LIM_4] (rows=5 width=71) + Number of rows:5 + Select Operator [SEL_3] (rows=20 width=80) + Output:["_col0","_col1"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_2] + Select Operator [SEL_1] (rows=20 width=80) + Output:["_col0","_col1"] + TableScan [TS_0] (rows=20 width=80) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int"] PREHOOK: query: explain select cbo_t3.c_int, c, count(*) from (select key as a, c_int+1 as b, sum(c_int) as c from cbo_t1 where (cbo_t1.c_int + 1 >= 0) and (cbo_t1.c_int > 0 or cbo_t1.c_float >= 0) group by c_float, cbo_t1.c_int, key order by a limit 5) cbo_t1 join (select key as p, c_int+1 as q, sum(c_int) as r from cbo_t2 where (cbo_t2.c_int + 1 >= 0) and (cbo_t2.c_int > 0 or cbo_t2.c_float >= 0) group by c_float, cbo_t2.c_int, key order by q/10 desc, r asc limit 5) cbo_t2 on cbo_t1.a=p join cbo_t3 on cbo_t1.a=key where (b + cbo_t2.q >= 0) and (b > 0 or c_int >= 0) group by cbo_t3.c_int, c order by cbo_t3.c_int+c desc, c limit 5 PREHOOK: type: QUERY @@ -2357,187 +1467,98 @@ Reducer 7 <- Reducer 6 (SIMPLE_EDGE) Reducer 9 <- Map 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:5 - Stage-1 - Reducer 7 - File Output Operator [FS_49] - compressed:false - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_48] - Number of rows:5 - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_47] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_46] - key expressions:(UDFToLong(_col0) + _col1) (type: bigint), _col1 (type: bigint) - sort order:-+ - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: int), _col2 (type: bigint) - Select Operator [SEL_44] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_43] - | aggregations:["count(VALUE._col0)"] - | keys:KEY._col0 (type: bigint), KEY._col1 (type: int) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_42] - key expressions:_col0 (type: bigint), _col1 (type: int) - Map-reduce partition columns:_col0 (type: bigint), _col1 (type: int) - sort order:++ - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col2 (type: bigint) - Group By Operator [GBY_41] - aggregations:["count()"] - keys:_col2 (type: bigint), _col6 (type: int) - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_40] - outputColumnNames:["_col2","_col6"] - Statistics:Num rows: 2 Data size: 32 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_39] - predicate:((_col1 > 0) or (_col6 >= 0)) (type: boolean) - Statistics:Num rows: 2 Data size: 32 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_61] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col1","_col2","_col6"] - | Statistics:Num rows: 3 Data size: 48 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_37] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 18 Data size: 1424 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: int) - | Select Operator [SEL_35] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 18 Data size: 1424 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_59] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 18 Data size: 1424 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_33] - | alias:cbo_t3 - | Statistics:Num rows: 20 Data size: 1602 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_36] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: int), _col2 (type: bigint) - Select Operator [SEL_32] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_31] - predicate:((_col1 + _col4) >= 0) (type: boolean) - Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_60] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col0","_col1","_col2","_col4"] - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_29] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 1 Data size: 105 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: int) - | Filter Operator [FIL_26] - | predicate:_col0 is not null (type: boolean) - | Statistics:Num rows: 1 Data size: 105 Basic stats: COMPLETE Column stats: COMPLETE - | Limit [LIM_24] - | Number of rows:5 - | Statistics:Num rows: 1 Data size: 105 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_23] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 1 Data size: 105 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Reducer 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_22] - | key expressions:_col3 (type: double), _col2 (type: bigint) - | sort order:-+ - | Statistics:Num rows: 1 Data size: 105 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col0 (type: string), _col1 (type: int) - | Select Operator [SEL_20] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 105 Basic stats: COMPLETE Column stats: COMPLETE - | Group By Operator [GBY_19] - | | aggregations:["sum(VALUE._col0)"] - | | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: float) - | | outputColumnNames:["_col0","_col1","_col2","_col3"] - | | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Map 8 [SIMPLE_EDGE] - | Reduce Output Operator [RS_18] - | key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: float) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: float) - | sort order:+++ - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col3 (type: bigint) - | Group By Operator [GBY_17] - | aggregations:["sum(c_int)"] - | keys:key (type: string), c_int (type: int), c_float (type: float) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_58] - | predicate:(((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) (type: boolean) - | Statistics:Num rows: 4 Data size: 372 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_14] - | alias:cbo_t2 - | Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_28] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 1 Data size: 97 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: int), _col2 (type: bigint) - Filter Operator [FIL_12] - predicate:_col0 is not null (type: boolean) - Statistics:Num rows: 1 Data size: 97 Basic stats: COMPLETE Column stats: COMPLETE - Limit [LIM_10] - Number of rows:5 - Statistics:Num rows: 1 Data size: 97 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_9] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 97 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_8] - key expressions:_col0 (type: string) - sort order:+ - Statistics:Num rows: 1 Data size: 97 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: int), _col2 (type: bigint) - Select Operator [SEL_6] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 97 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_5] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: float) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_4] - key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: float) - Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: float) - sort order:+++ - Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col3 (type: bigint) - Group By Operator [GBY_3] - aggregations:["sum(c_int)"] - keys:key (type: string), c_int (type: int), c_float (type: float) - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_56] - predicate:(((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) (type: boolean) - Statistics:Num rows: 4 Data size: 372 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_0] - alias:cbo_t1 - Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:5 + Stage-1 + Reducer 7 + File Output Operator [FS_49] + Limit [LIM_48] (rows=1 width=20) + Number of rows:5 + Select Operator [SEL_47] (rows=1 width=20) + Output:["_col0","_col1","_col2"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_46] + Select Operator [SEL_44] (rows=1 width=20) + Output:["_col0","_col1","_col2"] + Group By Operator [GBY_43] (rows=1 width=20) + Output:["_col0","_col1","_col2"],aggregations:["count(VALUE._col0)"],keys:KEY._col0, KEY._col1 + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_42] + PartitionCols:_col0, _col1 + Group By Operator [GBY_41] (rows=1 width=20) + Output:["_col0","_col1","_col2"],aggregations:["count()"],keys:_col2, _col6 + Select Operator [SEL_40] (rows=2 width=16) + Output:["_col2","_col6"] + Filter Operator [FIL_39] (rows=2 width=16) + predicate:((_col1 > 0) or (_col6 >= 0)) + Merge Join Operator [MERGEJOIN_61] (rows=3 width=16) + Output:["_col1","_col2","_col6"],keys:{"0":"_col0","1":"_col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_37] + PartitionCols:_col0 + Select Operator [SEL_35] (rows=18 width=79) + Output:["_col0","_col1"] + Filter Operator [FIL_59] (rows=18 width=79) + predicate:key is not null + TableScan [TS_33] (rows=20 width=80) + default@cbo_t3,cbo_t3,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_36] + PartitionCols:_col0 + Select Operator [SEL_32] (rows=1 width=101) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_31] (rows=1 width=101) + predicate:((_col1 + _col4) >= 0) + Merge Join Operator [MERGEJOIN_60] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col4"],keys:{"0":"_col0","1":"_col0"} + <-Reducer 10 [SIMPLE_EDGE] + SHUFFLE [RS_29] + PartitionCols:_col0 + Filter Operator [FIL_26] (rows=1 width=105) + predicate:_col0 is not null + Limit [LIM_24] (rows=1 width=105) + Number of rows:5 + Select Operator [SEL_23] (rows=1 width=105) + Output:["_col0","_col1"] + <-Reducer 9 [SIMPLE_EDGE] + SHUFFLE [RS_22] + Select Operator [SEL_20] (rows=1 width=105) + Output:["_col0","_col1","_col2","_col3"] + Group By Operator [GBY_19] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Map 8 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_17] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(c_int)"],keys:key, c_int, c_float + Filter Operator [FIL_58] (rows=4 width=93) + predicate:(((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) + TableScan [TS_14] (rows=20 width=83) + default@cbo_t2,cbo_t2,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_28] + PartitionCols:_col0 + Filter Operator [FIL_12] (rows=1 width=97) + predicate:_col0 is not null + Limit [LIM_10] (rows=1 width=97) + Number of rows:5 + Select Operator [SEL_9] (rows=1 width=97) + Output:["_col0","_col1","_col2"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_8] + Select Operator [SEL_6] (rows=1 width=97) + Output:["_col0","_col1","_col2"] + Group By Operator [GBY_5] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_3] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(c_int)"],keys:key, c_int, c_float + Filter Operator [FIL_56] (rows=4 width=93) + predicate:(((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) + TableScan [TS_0] (rows=20 width=83) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] PREHOOK: query: explain select cbo_t1.c_int from cbo_t1 left semi join cbo_t2 on cbo_t1.key=cbo_t2.key where (cbo_t1.c_int + 1 == 2) and (cbo_t1.c_int > 0 or cbo_t1.c_float >= 0) PREHOOK: type: QUERY @@ -2549,57 +1570,35 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_12] - compressed:false - Statistics:Num rows: 7 Data size: 28 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_11] - outputColumnNames:["_col0"] - Statistics:Num rows: 7 Data size: 28 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_17] - | condition map:[{"":"Left Semi Join 0 to 1"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col1"] - | Statistics:Num rows: 7 Data size: 28 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_8] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 6 Data size: 465 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: int) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 6 Data size: 465 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_15] - | predicate:((((c_int + 1) = 2) and key is not null) and ((c_int > 0) or (c_float >= 0.0))) (type: boolean) - | Statistics:Num rows: 6 Data size: 465 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:cbo_t1 - | Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_9] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 5 Data size: 340 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_7] - keys:_col0 (type: string) - outputColumnNames:["_col0"] - Statistics:Num rows: 5 Data size: 340 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 18 Data size: 1360 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_16] - predicate:key is not null (type: boolean) - Statistics:Num rows: 18 Data size: 1360 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_3] - alias:cbo_t2 - Statistics:Num rows: 20 Data size: 1530 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_12] + Select Operator [SEL_11] (rows=7 width=4) + Output:["_col0"] + Merge Join Operator [MERGEJOIN_17] (rows=7 width=4) + Output:["_col1"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_8] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=6 width=77) + Output:["_col0","_col1"] + Filter Operator [FIL_15] (rows=6 width=77) + predicate:((((c_int + 1) = 2) and key is not null) and ((c_int > 0) or (c_float >= 0.0))) + TableScan [TS_0] (rows=20 width=83) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col0 + Group By Operator [GBY_7] (rows=5 width=68) + Output:["_col0"],keys:_col0 + Select Operator [SEL_5] (rows=18 width=75) + Output:["_col0"] + Filter Operator [FIL_16] (rows=18 width=75) + predicate:key is not null + TableScan [TS_3] (rows=20 width=76) + default@cbo_t2,cbo_t2,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] PREHOOK: query: explain select * from (select c, b, a from (select key as a, c_int as b, cbo_t1.c_float as c from cbo_t1 where (cbo_t1.c_int + 1 == 2) and (cbo_t1.c_int > 0 or cbo_t1.c_float >= 0)) cbo_t1 left semi join (select cbo_t2.key as p, cbo_t2.c_int as q, c_float as r from cbo_t2 where (cbo_t2.c_int + 1 == 2) and (cbo_t2.c_int > 0 or cbo_t2.c_float >= 0)) cbo_t2 on cbo_t1.a=p left semi join cbo_t3 on cbo_t1.a=key where (b + 1 == 2) and (b > 0 or c >= 0)) R where (b + 1 = 2) and (R.b > 0 or c >= 0) PREHOOK: type: QUERY @@ -2611,76 +1610,46 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_18] - compressed:false - Statistics:Num rows: 12 Data size: 1116 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_17] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 12 Data size: 1116 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_28] - | condition map:[{"":"Left Semi Join 0 to 1"},{"":"Left Semi Join 0 to 2"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)","2":"_col0 (type: string)"} - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 12 Data size: 1116 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_13] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 5 Data size: 372 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: int), _col2 (type: float) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 5 Data size: 372 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_25] - | predicate:((((c_int + 1) = 2) and ((c_int > 0) or (c_float >= 0.0))) and key is not null) (type: boolean) - | Statistics:Num rows: 5 Data size: 372 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:cbo_t1 - | Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 3 [SIMPLE_EDGE] - | Reduce Output Operator [RS_14] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 2 Data size: 170 Basic stats: COMPLETE Column stats: COMPLETE - | Group By Operator [GBY_10] - | keys:_col0 (type: string) - | outputColumnNames:["_col0"] - | Statistics:Num rows: 2 Data size: 170 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_5] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 5 Data size: 340 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_26] - | predicate:((((c_int + 1) = 2) and ((c_int > 0) or (c_float >= 0.0))) and key is not null) (type: boolean) - | Statistics:Num rows: 5 Data size: 372 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_3] - | alias:cbo_t2 - | Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_15] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 6 Data size: 425 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_12] - keys:_col0 (type: string) - outputColumnNames:["_col0"] - Statistics:Num rows: 6 Data size: 425 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_8] - outputColumnNames:["_col0"] - Statistics:Num rows: 18 Data size: 1360 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_27] - predicate:key is not null (type: boolean) - Statistics:Num rows: 18 Data size: 1360 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_6] - alias:cbo_t3 - Statistics:Num rows: 20 Data size: 1530 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_18] + Select Operator [SEL_17] (rows=12 width=93) + Output:["_col0","_col1","_col2"] + Merge Join Operator [MERGEJOIN_28] (rows=12 width=93) + Output:["_col0","_col1","_col2"],keys:{"0":"_col0","1":"_col0","2":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=5 width=74) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_25] (rows=5 width=74) + predicate:((((c_int + 1) = 2) and ((c_int > 0) or (c_float >= 0.0))) and key is not null) + TableScan [TS_0] (rows=20 width=83) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_14] + PartitionCols:_col0 + Group By Operator [GBY_10] (rows=2 width=85) + Output:["_col0"],keys:_col0 + Select Operator [SEL_5] (rows=5 width=68) + Output:["_col0"] + Filter Operator [FIL_26] (rows=5 width=74) + predicate:((((c_int + 1) = 2) and ((c_int > 0) or (c_float >= 0.0))) and key is not null) + TableScan [TS_3] (rows=20 width=83) + default@cbo_t2,cbo_t2,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] + <-Map 4 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col0 + Group By Operator [GBY_12] (rows=6 width=70) + Output:["_col0"],keys:_col0 + Select Operator [SEL_8] (rows=18 width=75) + Output:["_col0"] + Filter Operator [FIL_27] (rows=18 width=75) + predicate:key is not null + TableScan [TS_6] (rows=20 width=76) + default@cbo_t3,cbo_t3,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] PREHOOK: query: explain select a, c, count(*) from (select key as a, c_int+1 as b, sum(c_int) as c from cbo_t1 where (cbo_t1.c_int + 1 >= 0) and (cbo_t1.c_int > 0 or cbo_t1.c_float >= 0) group by c_float, cbo_t1.c_int, key having cbo_t1.c_float > 0 and (c_int >=1 or c_float >= 1) and (c_int + c_float) >= 0 order by a+b desc, c asc) cbo_t1 left semi join (select key as p, c_int+1 as q, sum(c_int) as r from cbo_t2 where (cbo_t2.c_int + 1 >= 0) and (cbo_t2.c_int > 0 or cbo_t2.c_float >= 0) group by c_float, cbo_t2.c_int, key having cbo_t2.c_float > 0 and (c_int >=1 or c_float >= 1) and (c_int + c_float) >= 0 order by q+r/10 desc, p) cbo_t2 on cbo_t1.a=p left semi join cbo_t3 on cbo_t1.a=key where (b + 1 >= 0) and (b > 0 or a >= 0) group by a, c having a > 0 and (a >=1 or c >= 1) and (a + c) >= 0 order by c, a PREHOOK: type: QUERY @@ -2698,156 +1667,81 @@ Reducer 8 <- Map 7 (SIMPLE_EDGE) Reducer 9 <- Reducer 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 6 - File Output Operator [FS_41] - compressed:false - Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_40] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_39] - key expressions:_col1 (type: bigint), _col0 (type: string) - sort order:++ - Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col2 (type: bigint) - Group By Operator [GBY_37] - | aggregations:["count(VALUE._col0)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: bigint) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_36] - key expressions:_col0 (type: string), _col1 (type: bigint) - Map-reduce partition columns:_col0 (type: string), _col1 (type: bigint) - sort order:++ - Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col2 (type: bigint) - Group By Operator [GBY_35] - aggregations:["count()"] - keys:_col0 (type: string), _col1 (type: bigint) - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_51] - | condition map:[{"":"Left Semi Join 0 to 1"},{"":"Left Semi Join 0 to 2"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)","2":"_col0 (type: string)"} - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 93 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_32] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 3 Data size: 170 Basic stats: COMPLETE Column stats: COMPLETE - | Group By Operator [GBY_29] - | keys:_col0 (type: string) - | outputColumnNames:["_col0"] - | Statistics:Num rows: 3 Data size: 170 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_25] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 6 Data size: 425 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_50] - | predicate:(UDFToDouble(key) > 0.0) (type: boolean) - | Statistics:Num rows: 6 Data size: 425 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_23] - | alias:cbo_t3 - | Statistics:Num rows: 20 Data size: 1530 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 3 [SIMPLE_EDGE] - | Reduce Output Operator [RS_30] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 1 Data size: 93 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: bigint) - | Select Operator [SEL_10] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 1 Data size: 93 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Reducer 2 [SIMPLE_EDGE] - | Reduce Output Operator [RS_9] - | key expressions:_col2 (type: double), _col1 (type: bigint) - | sort order:-+ - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col0 (type: string) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_7] - | predicate:(((UDFToDouble(_col2) >= 1.0) or (_col3 >= 1)) and ((UDFToDouble(_col2) + UDFToDouble(_col3)) >= 0.0)) (type: boolean) - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_6] - | outputColumnNames:["_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - | Group By Operator [GBY_5] - | | aggregations:["sum(VALUE._col0)"] - | | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: float) - | | outputColumnNames:["_col0","_col1","_col2","_col3"] - | | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_4] - | key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: float) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: float) - | sort order:+++ - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col3 (type: bigint) - | Group By Operator [GBY_3] - | aggregations:["sum(c_int)"] - | keys:key (type: string), c_int (type: int), c_float (type: float) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_48] - | predicate:(((((((((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) and (c_float > 0.0)) and ((c_int >= 1) or (c_float >= 1.0))) and ((UDFToFloat(c_int) + c_float) >= 0.0)) and (((c_int + 1) + 1) >= 0)) and (((c_int + 1) > 0) or (UDFToDouble(key) >= 0.0))) and (UDFToDouble(key) > 0.0)) (type: boolean) - | Statistics:Num rows: 1 Data size: 93 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:cbo_t1 - | Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 9 [SIMPLE_EDGE] - Reduce Output Operator [RS_31] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 1 Data size: 85 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_27] - keys:_col0 (type: string) - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 85 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_21] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 85 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_20] - key expressions:_col1 (type: double), _col0 (type: string) - sort order:-+ - Statistics:Num rows: 1 Data size: 93 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_18] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 93 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_17] - | aggregations:["sum(VALUE._col0)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: int), KEY._col2 (type: float) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_16] - key expressions:_col0 (type: string), _col1 (type: int), _col2 (type: float) - Map-reduce partition columns:_col0 (type: string), _col1 (type: int), _col2 (type: float) - sort order:+++ - Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col3 (type: bigint) - Group By Operator [GBY_15] - aggregations:["sum(c_int)"] - keys:key (type: string), c_int (type: int), c_float (type: float) - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 1 Data size: 101 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_49] - predicate:(((((((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) and (c_float > 0.0)) and ((c_int >= 1) or (c_float >= 1.0))) and ((UDFToFloat(c_int) + c_float) >= 0.0)) and (UDFToDouble(key) > 0.0)) (type: boolean) - Statistics:Num rows: 1 Data size: 93 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_12] - alias:cbo_t2 - Statistics:Num rows: 20 Data size: 1674 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 6 + File Output Operator [FS_41] + Select Operator [SEL_40] (rows=1 width=101) + Output:["_col0","_col1","_col2"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_39] + Group By Operator [GBY_37] (rows=1 width=101) + Output:["_col0","_col1","_col2"],aggregations:["count(VALUE._col0)"],keys:KEY._col0, KEY._col1 + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_36] + PartitionCols:_col0, _col1 + Group By Operator [GBY_35] (rows=1 width=101) + Output:["_col0","_col1","_col2"],aggregations:["count()"],keys:_col0, _col1 + Merge Join Operator [MERGEJOIN_51] (rows=1 width=93) + Output:["_col0","_col1"],keys:{"0":"_col0","1":"_col0","2":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_32] + PartitionCols:_col0 + Group By Operator [GBY_29] (rows=3 width=56) + Output:["_col0"],keys:_col0 + Select Operator [SEL_25] (rows=6 width=70) + Output:["_col0"] + Filter Operator [FIL_50] (rows=6 width=70) + predicate:(UDFToDouble(key) > 0.0) + TableScan [TS_23] (rows=20 width=76) + default@cbo_t3,cbo_t3,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_30] + PartitionCols:_col0 + Select Operator [SEL_10] (rows=1 width=93) + Output:["_col0","_col1"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_9] + Select Operator [SEL_8] (rows=1 width=101) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_7] (rows=1 width=101) + predicate:(((UDFToDouble(_col2) >= 1.0) or (_col3 >= 1)) and ((UDFToDouble(_col2) + UDFToDouble(_col3)) >= 0.0)) + Select Operator [SEL_6] (rows=1 width=101) + Output:["_col1","_col2","_col3"] + Group By Operator [GBY_5] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_3] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(c_int)"],keys:key, c_int, c_float + Filter Operator [FIL_48] (rows=1 width=93) + predicate:(((((((((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) and (c_float > 0.0)) and ((c_int >= 1) or (c_float >= 1.0))) and ((UDFToFloat(c_int) + c_float) >= 0.0)) and (((c_int + 1) + 1) >= 0)) and (((c_int + 1) > 0) or (UDFToDouble(key) >= 0.0))) and (UDFToDouble(key) > 0.0)) + TableScan [TS_0] (rows=20 width=83) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] + <-Reducer 9 [SIMPLE_EDGE] + SHUFFLE [RS_31] + PartitionCols:_col0 + Group By Operator [GBY_27] (rows=1 width=85) + Output:["_col0"],keys:_col0 + Select Operator [SEL_21] (rows=1 width=85) + Output:["_col0"] + <-Reducer 8 [SIMPLE_EDGE] + SHUFFLE [RS_20] + Select Operator [SEL_18] (rows=1 width=93) + Output:["_col0","_col1"] + Group By Operator [GBY_17] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(VALUE._col0)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_15] (rows=1 width=101) + Output:["_col0","_col1","_col2","_col3"],aggregations:["sum(c_int)"],keys:key, c_int, c_float + Filter Operator [FIL_49] (rows=1 width=93) + predicate:(((((((c_int + 1) >= 0) and ((c_int > 0) or (c_float >= 0.0))) and (c_float > 0.0)) and ((c_int >= 1) or (c_float >= 1.0))) and ((UDFToFloat(c_int) + c_float) >= 0.0)) and (UDFToDouble(key) > 0.0)) + TableScan [TS_12] (rows=20 width=83) + default@cbo_t2,cbo_t2,Tbl:COMPLETE,Col:COMPLETE,Output:["key","c_int","c_float"] PREHOOK: query: explain select cbo_t1.key as x, c_int as c_int, (((c_int+c_float)*10)+5) as y from cbo_t1 PREHOOK: type: QUERY @@ -2856,12 +1750,12 @@ POSTHOOK: type: QUERY Plan optimized by CBO. Stage-0 - Fetch Operator - limit:-1 - Select Operator [SEL_1] - outputColumnNames:["_col0","_col1","_col2"] - TableScan [TS_0] - alias:cbo_t1 + Fetch Operator + limit:-1 + Select Operator [SEL_1] + Output:["_col0","_col1","_col2"] + TableScan [TS_0] + Output:["key","c_int","c_float"] PREHOOK: query: explain select null from cbo_t1 PREHOOK: type: QUERY @@ -2870,12 +1764,11 @@ POSTHOOK: type: QUERY Plan optimized by CBO. Stage-0 - Fetch Operator - limit:-1 - Select Operator [SEL_1] - outputColumnNames:["_col0"] - TableScan [TS_0] - alias:cbo_t1 + Fetch Operator + limit:-1 + Select Operator [SEL_1] + Output:["_col0"] + TableScan [TS_0] PREHOOK: query: explain select key from cbo_t1 where c_int = -6 or c_int = +6 PREHOOK: type: QUERY @@ -2884,14 +1777,14 @@ POSTHOOK: type: QUERY Plan optimized by CBO. Stage-0 - Fetch Operator - limit:-1 - Select Operator [SEL_2] - outputColumnNames:["_col0"] - Filter Operator [FIL_4] - predicate:((c_int = -6) or (c_int = 6)) (type: boolean) - TableScan [TS_0] - alias:cbo_t1 + Fetch Operator + limit:-1 + Select Operator [SEL_2] + Output:["_col0"] + Filter Operator [FIL_4] + predicate:((c_int = -6) or (c_int = 6)) + TableScan [TS_0] + Output:["key","c_int"] PREHOOK: query: explain select count(cbo_t1.dt) from cbo_t1 join cbo_t2 on cbo_t1.dt = cbo_t2.dt where cbo_t1.dt = '2014' PREHOOK: type: QUERY @@ -2904,52 +1797,31 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 3 - File Output Operator [FS_14] - compressed:false - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_12] - | aggregations:["count(VALUE._col0)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_11] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: bigint) - Group By Operator [GBY_10] - aggregations:["count(_col0)"] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_9] - outputColumnNames:["_col0"] - Statistics:Num rows: 400 Data size: 0 Basic stats: PARTIAL Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_19] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"'2014' (type: string)","1":"'2014' (type: string)"} - | Statistics:Num rows: 400 Data size: 0 Basic stats: PARTIAL Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_6] - | key expressions:'2014' (type: string) - | Map-reduce partition columns:'2014' (type: string) - | sort order:+ - | Statistics:Num rows: 20 Data size: 262 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:cbo_t1 - | Statistics:Num rows: 20 Data size: 262 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_7] - key expressions:'2014' (type: string) - Map-reduce partition columns:'2014' (type: string) - sort order:+ - Statistics:Num rows: 20 Data size: 262 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_3] - alias:cbo_t2 - Statistics:Num rows: 20 Data size: 262 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 3 + File Output Operator [FS_14] + Group By Operator [GBY_12] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_11] + Group By Operator [GBY_10] (rows=1 width=8) + Output:["_col0"],aggregations:["count(_col0)"] + Select Operator [SEL_9] (rows=400 width=0) + Output:["_col0"] + Merge Join Operator [MERGEJOIN_19] (rows=400 width=0) + keys:{"0":"'2014'","1":"'2014'"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_6] + PartitionCols:'2014' + TableScan [TS_0] (rows=20 width=13) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE + <-Map 4 [SIMPLE_EDGE] + SHUFFLE [RS_7] + PartitionCols:'2014' + TableScan [TS_3] (rows=20 width=13) + default@cbo_t2,cbo_t2,Tbl:COMPLETE,Col:COMPLETE PREHOOK: query: explain select * from src_cbo b @@ -2974,67 +1846,40 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE), Reducer 4 (SIMPLE_EDGE) Reducer 4 <- Map 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_14] - compressed:false - Statistics:Num rows: 1 Data size: 178 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_13] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 178 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_12] - predicate:_col3 is null (type: boolean) - Statistics:Num rows: 1 Data size: 269 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_17] - | condition map:[{"":"Left Outer Join0 to 1"}] - | keys:{"0":"_col1 (type: string)","1":"_col1 (type: string)"} - | outputColumnNames:["_col0","_col1","_col3"] - | Statistics:Num rows: 193 Data size: 51917 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_9] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col0 (type: string) - | Select Operator [SEL_1] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:b - | Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - key expressions:_col1 (type: string) - Map-reduce partition columns:_col1 (type: string) - sort order:+ - Statistics:Num rows: 83 Data size: 14774 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_8] - outputColumnNames:["_col1"] - Statistics:Num rows: 83 Data size: 14774 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_7] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 83 Data size: 14774 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_6] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 83 Data size: 14774 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_5] - keys:key (type: string), value (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 83 Data size: 14774 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_16] - predicate:(value > 'val_2') (type: boolean) - Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_2] - alias:b - Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_14] + Select Operator [SEL_13] (rows=1 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_12] (rows=1 width=269) + predicate:_col3 is null + Merge Join Operator [MERGEJOIN_17] (rows=193 width=269) + Output:["_col0","_col1","_col3"],keys:{"0":"_col1","1":"_col1"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col1 + Select Operator [SEL_1] (rows=500 width=178) + Output:["_col0","_col1"] + TableScan [TS_0] (rows=500 width=178) + default@src_cbo,b,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_10] + PartitionCols:_col1 + Select Operator [SEL_8] (rows=83 width=178) + Output:["_col1"] + Group By Operator [GBY_7] (rows=83 width=178) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_6] + PartitionCols:_col0, _col1 + Group By Operator [GBY_5] (rows=83 width=178) + Output:["_col0","_col1"],keys:key, value + Filter Operator [FIL_16] (rows=166 width=178) + predicate:(value > 'val_2') + TableScan [TS_2] (rows=500 width=178) + default@src_cbo,b,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] PREHOOK: query: explain select * from src_cbo b @@ -3061,66 +1906,40 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE) Reducer 3 <- Map 4 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 3 - File Output Operator [FS_14] - compressed:false - Statistics:Num rows: 1 Data size: 178 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_13] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 178 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_12] - predicate:_col3 is null (type: boolean) - Statistics:Num rows: 1 Data size: 265 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_17] - | condition map:[{"":"Left Outer Join0 to 1"}] - | keys:{"0":"_col1 (type: string), _col0 (type: string)","1":"_col0 (type: string), _col1 (type: string)"} - | outputColumnNames:["_col0","_col1","_col3"] - | Statistics:Num rows: 1 Data size: 265 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 4 [SIMPLE_EDGE] - | Reduce Output Operator [RS_10] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_16] - | predicate:(value > 'val_12') (type: boolean) - | Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_6] - | alias:b - | Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_9] - key expressions:_col1 (type: string), _col0 (type: string) - Map-reduce partition columns:_col1 (type: string), _col0 (type: string) - sort order:++ - Statistics:Num rows: 250 Data size: 44500 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_4] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 250 Data size: 44500 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 250 Data size: 44500 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_2] - keys:key (type: string), value (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 250 Data size: 44500 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_1] - outputColumnNames:["key","value"] - Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_0] - alias:b - Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 3 + File Output Operator [FS_14] + Select Operator [SEL_13] (rows=1 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_12] (rows=1 width=265) + predicate:_col3 is null + Merge Join Operator [MERGEJOIN_17] (rows=1 width=265) + Output:["_col0","_col1","_col3"],keys:{"0":"_col1, _col0","1":"_col0, _col1"} + <-Map 4 [SIMPLE_EDGE] + SHUFFLE [RS_10] + PartitionCols:_col0, _col1 + Select Operator [SEL_8] (rows=166 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_16] (rows=166 width=178) + predicate:(value > 'val_12') + TableScan [TS_6] (rows=500 width=178) + default@src_cbo,b,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col1, _col0 + Group By Operator [GBY_4] (rows=250 width=178) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_3] + PartitionCols:_col0, _col1 + Group By Operator [GBY_2] (rows=250 width=178) + Output:["_col0","_col1"],keys:key, value + Select Operator [SEL_1] (rows=500 width=178) + Output:["key","value"] + TableScan [TS_0] (rows=500 width=178) + default@src_cbo,b,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] PREHOOK: query: create view cv1 as select * @@ -3154,53 +1973,33 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_12] - compressed:false - Statistics:Num rows: 2 Data size: 356 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Merge Join Operator [MERGEJOIN_17] - | condition map:[{"":"Left Semi Join 0 to 1"}] - | keys:{"0":"_col1 (type: string), _col0 (type: string)","1":"_col0 (type: string), _col1 (type: string)"} - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 2 Data size: 356 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_8] - | key expressions:_col1 (type: string), _col0 (type: string) - | Map-reduce partition columns:_col1 (type: string), _col0 (type: string) - | sort order:++ - | Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_15] - | predicate:((value > 'val_9') and key is not null) (type: boolean) - | Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:b - | Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_9] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 83 Data size: 14774 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_7] - keys:_col0 (type: string), _col1 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 83 Data size: 14774 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_16] - predicate:((value > 'val_9') and key is not null) (type: boolean) - Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_3] - alias:b - Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_12] + Merge Join Operator [MERGEJOIN_17] (rows=2 width=178) + Output:["_col0","_col1"],keys:{"0":"_col1, _col0","1":"_col0, _col1"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_8] + PartitionCols:_col1, _col0 + Select Operator [SEL_2] (rows=166 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_15] (rows=166 width=178) + predicate:((value > 'val_9') and key is not null) + TableScan [TS_0] (rows=500 width=178) + default@src_cbo,b,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col0, _col1 + Group By Operator [GBY_7] (rows=83 width=178) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_5] (rows=166 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_16] (rows=166 width=178) + predicate:((value > 'val_9') and key is not null) + TableScan [TS_3] (rows=500 width=178) + default@src_cbo,b,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] PREHOOK: query: explain select * from (select * @@ -3226,53 +2025,33 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_12] - compressed:false - Statistics:Num rows: 2 Data size: 356 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Merge Join Operator [MERGEJOIN_17] - | condition map:[{"":"Left Semi Join 0 to 1"}] - | keys:{"0":"_col1 (type: string), _col0 (type: string)","1":"_col0 (type: string), _col1 (type: string)"} - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 2 Data size: 356 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_8] - | key expressions:_col1 (type: string), _col0 (type: string) - | Map-reduce partition columns:_col1 (type: string), _col0 (type: string) - | sort order:++ - | Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_15] - | predicate:((value > 'val_9') and key is not null) (type: boolean) - | Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:b - | Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_9] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 83 Data size: 14774 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_7] - keys:_col0 (type: string), _col1 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 83 Data size: 14774 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_16] - predicate:((value > 'val_9') and key is not null) (type: boolean) - Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_3] - alias:b - Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_12] + Merge Join Operator [MERGEJOIN_17] (rows=2 width=178) + Output:["_col0","_col1"],keys:{"0":"_col1, _col0","1":"_col0, _col1"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_8] + PartitionCols:_col1, _col0 + Select Operator [SEL_2] (rows=166 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_15] (rows=166 width=178) + predicate:((value > 'val_9') and key is not null) + TableScan [TS_0] (rows=500 width=178) + default@src_cbo,b,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col0, _col1 + Group By Operator [GBY_7] (rows=83 width=178) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_5] (rows=166 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_16] (rows=166 width=178) + predicate:((value > 'val_9') and key is not null) + TableScan [TS_3] (rows=500 width=178) + default@src_cbo,b,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] PREHOOK: query: explain select * from src_cbo @@ -3288,54 +2067,33 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_12] - compressed:false - Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Merge Join Operator [MERGEJOIN_17] - | condition map:[{"":"Left Semi Join 0 to 1"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_8] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: string) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_15] - | predicate:(key > '9') (type: boolean) - | Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:src_cbo - | Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_9] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 69 Data size: 6003 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_7] - keys:_col0 (type: string) - outputColumnNames:["_col0"] - Statistics:Num rows: 69 Data size: 6003 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 166 Data size: 14442 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_16] - predicate:(key > '9') (type: boolean) - Statistics:Num rows: 166 Data size: 14442 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_3] - alias:src_cbo - Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_12] + Merge Join Operator [MERGEJOIN_17] (rows=166 width=178) + Output:["_col0","_col1"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_8] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=166 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_15] (rows=166 width=178) + predicate:(key > '9') + TableScan [TS_0] (rows=500 width=178) + default@src_cbo,src_cbo,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col0 + Group By Operator [GBY_7] (rows=69 width=87) + Output:["_col0"],keys:_col0 + Select Operator [SEL_5] (rows=166 width=87) + Output:["_col0"] + Filter Operator [FIL_16] (rows=166 width=87) + predicate:(key > '9') + TableScan [TS_3] (rows=500 width=87) + default@src_cbo,src_cbo,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] PREHOOK: query: explain select p.p_partkey, li.l_suppkey from (select distinct l_partkey as p_partkey from lineitem) p join lineitem li on p.p_partkey = li.l_partkey @@ -3355,95 +2113,54 @@ Reducer 3 <- Reducer 2 (SIMPLE_EDGE), Reducer 6 (SIMPLE_EDGE) Reducer 6 <- Map 5 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 3 - File Output Operator [FS_22] - compressed:false - Statistics:Num rows: 4 Data size: 32 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_21] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 4 Data size: 32 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_32] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col2","_col4"] - | Statistics:Num rows: 4 Data size: 32 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - | Reduce Output Operator [RS_18] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 12 Data size: 96 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col2 (type: int) - | Merge Join Operator [MERGEJOIN_31] - | | condition map:[{"":"Left Semi Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int), _col3 (type: int)","1":"_col0 (type: int), _col1 (type: int)"} - | | outputColumnNames:["_col1","_col2"] - | | Statistics:Num rows: 12 Data size: 96 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Map 1 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_15] - | | key expressions:_col0 (type: int), _col3 (type: int) - | | Map-reduce partition columns:_col0 (type: int), _col3 (type: int) - | | sort order:++ - | | Statistics:Num rows: 16 Data size: 256 Basic stats: COMPLETE Column stats: COMPLETE - | | value expressions:_col1 (type: int), _col2 (type: int) - | | Select Operator [SEL_2] - | | outputColumnNames:["_col0","_col1","_col2","_col3"] - | | Statistics:Num rows: 16 Data size: 256 Basic stats: COMPLETE Column stats: COMPLETE - | | Filter Operator [FIL_28] - | | predicate:(((l_linenumber = 1) and l_partkey is not null) and l_orderkey is not null) (type: boolean) - | | Statistics:Num rows: 16 Data size: 256 Basic stats: COMPLETE Column stats: COMPLETE - | | TableScan [TS_0] - | | alias:lineitem - | | Statistics:Num rows: 100 Data size: 1600 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Map 4 [SIMPLE_EDGE] - | Reduce Output Operator [RS_16] - | key expressions:_col0 (type: int), _col1 (type: int) - | Map-reduce partition columns:_col0 (type: int), _col1 (type: int) - | sort order:++ - | Statistics:Num rows: 4 Data size: 32 Basic stats: COMPLETE Column stats: COMPLETE - | Group By Operator [GBY_14] - | keys:_col0 (type: int), 1 (type: int) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 4 Data size: 32 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_5] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 14 Data size: 56 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_29] - | predicate:(((l_shipmode = 'AIR') and (l_linenumber = 1)) and l_orderkey is not null) (type: boolean) - | Statistics:Num rows: 14 Data size: 1344 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_3] - | alias:lineitem - | Statistics:Num rows: 100 Data size: 9600 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_19] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 50 Data size: 200 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_11] - | keys:KEY._col0 (type: int) - | outputColumnNames:["_col0"] - | Statistics:Num rows: 50 Data size: 200 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 50 Data size: 200 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_9] - keys:l_partkey (type: int) - outputColumnNames:["_col0"] - Statistics:Num rows: 50 Data size: 200 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_30] - predicate:l_partkey is not null (type: boolean) - Statistics:Num rows: 100 Data size: 400 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_6] - alias:lineitem - Statistics:Num rows: 100 Data size: 400 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 3 + File Output Operator [FS_22] + Select Operator [SEL_21] (rows=4 width=8) + Output:["_col0","_col1"] + Merge Join Operator [MERGEJOIN_32] (rows=4 width=8) + Output:["_col2","_col4"],keys:{"0":"_col1","1":"_col0"} + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_31] (rows=12 width=8) + Output:["_col1","_col2"],keys:{"0":"_col0, _col3","1":"_col0, _col1"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_15] + PartitionCols:_col0, _col3 + Select Operator [SEL_2] (rows=16 width=16) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_28] (rows=16 width=16) + predicate:(((l_linenumber = 1) and l_partkey is not null) and l_orderkey is not null) + TableScan [TS_0] (rows=100 width=16) + default@lineitem,lineitem,Tbl:COMPLETE,Col:COMPLETE,Output:["l_orderkey","l_partkey","l_suppkey","l_linenumber"] + <-Map 4 [SIMPLE_EDGE] + SHUFFLE [RS_16] + PartitionCols:_col0, _col1 + Group By Operator [GBY_14] (rows=4 width=8) + Output:["_col0","_col1"],keys:_col0, 1 + Select Operator [SEL_5] (rows=14 width=4) + Output:["_col0"] + Filter Operator [FIL_29] (rows=14 width=96) + predicate:(((l_shipmode = 'AIR') and (l_linenumber = 1)) and l_orderkey is not null) + TableScan [TS_3] (rows=100 width=96) + default@lineitem,lineitem,Tbl:COMPLETE,Col:COMPLETE,Output:["l_orderkey","l_linenumber","l_shipmode"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Group By Operator [GBY_11] (rows=50 width=4) + Output:["_col0"],keys:KEY._col0 + <-Map 5 [SIMPLE_EDGE] + SHUFFLE [RS_10] + PartitionCols:_col0 + Group By Operator [GBY_9] (rows=50 width=4) + Output:["_col0"],keys:l_partkey + Filter Operator [FIL_30] (rows=100 width=4) + predicate:l_partkey is not null + TableScan [TS_6] (rows=100 width=4) + default@lineitem,lineitem,Tbl:COMPLETE,Col:COMPLETE,Output:["l_partkey"] PREHOOK: query: explain select key, value, count(*) from src_cbo b @@ -3466,128 +2183,69 @@ Reducer 4 <- Reducer 3 (SIMPLE_EDGE), Reducer 7 (SIMPLE_EDGE) Reducer 7 <- Map 6 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 4 - File Output Operator [FS_31] - compressed:false - Statistics:Num rows: 34 Data size: 6324 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Merge Join Operator [MERGEJOIN_44] - | condition map:[{"":"Left Semi Join 0 to 1"}] - | keys:{"0":"_col2 (type: bigint)","1":"_col0 (type: bigint)"} - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 34 Data size: 6324 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 3 [SIMPLE_EDGE] - | Reduce Output Operator [RS_27] - | key expressions:_col2 (type: bigint) - | Map-reduce partition columns:_col2 (type: bigint) - | sort order:+ - | Statistics:Num rows: 83 Data size: 15438 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col0 (type: string), _col1 (type: string) - | Filter Operator [FIL_37] - | predicate:_col2 is not null (type: boolean) - | Statistics:Num rows: 83 Data size: 15438 Basic stats: COMPLETE Column stats: COMPLETE - | Group By Operator [GBY_14] - | | aggregations:["count(VALUE._col0)"] - | | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 83 Data size: 15438 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Reducer 2 [SIMPLE_EDGE] - | Reduce Output Operator [RS_13] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 83 Data size: 15438 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col2 (type: bigint) - | Group By Operator [GBY_12] - | aggregations:["count()"] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 83 Data size: 15438 Basic stats: COMPLETE Column stats: COMPLETE - | Merge Join Operator [MERGEJOIN_43] - | | condition map:[{"":"Left Semi Join 0 to 1"}] - | | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Map 1 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_8] - | | key expressions:_col0 (type: string) - | | Map-reduce partition columns:_col0 (type: string) - | | sort order:+ - | | Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - | | value expressions:_col1 (type: string) - | | Select Operator [SEL_2] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - | | Filter Operator [FIL_38] - | | predicate:(key > '8') (type: boolean) - | | Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - | | TableScan [TS_0] - | | alias:b - | | Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Map 5 [SIMPLE_EDGE] - | Reduce Output Operator [RS_9] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 69 Data size: 6003 Basic stats: COMPLETE Column stats: COMPLETE - | Group By Operator [GBY_7] - | keys:_col0 (type: string) - | outputColumnNames:["_col0"] - | Statistics:Num rows: 69 Data size: 6003 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_5] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 166 Data size: 14442 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_39] - | predicate:(key > '8') (type: boolean) - | Statistics:Num rows: 166 Data size: 14442 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_3] - | alias:b - | Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_28] - key expressions:_col0 (type: bigint) - Map-reduce partition columns:_col0 (type: bigint) - sort order:+ - Statistics:Num rows: 34 Data size: 272 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_26] - keys:_col0 (type: bigint) - outputColumnNames:["_col0"] - Statistics:Num rows: 34 Data size: 272 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_24] - outputColumnNames:["_col0"] - Statistics:Num rows: 69 Data size: 552 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_40] - predicate:_col1 is not null (type: boolean) - Statistics:Num rows: 69 Data size: 552 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_42] - outputColumnNames:["_col1"] - Statistics:Num rows: 69 Data size: 552 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_22] - | aggregations:["count(VALUE._col0)"] - | keys:KEY._col0 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 69 Data size: 6555 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_21] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 69 Data size: 6555 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: bigint) - Group By Operator [GBY_20] - aggregations:["count()"] - keys:key (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 69 Data size: 6555 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_41] - predicate:(key > '9') (type: boolean) - Statistics:Num rows: 166 Data size: 14442 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_17] - alias:b - Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 4 + File Output Operator [FS_31] + Merge Join Operator [MERGEJOIN_44] (rows=34 width=186) + Output:["_col0","_col1","_col2"],keys:{"0":"_col2","1":"_col0"} + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_27] + PartitionCols:_col2 + Filter Operator [FIL_37] (rows=83 width=186) + predicate:_col2 is not null + Group By Operator [GBY_14] (rows=83 width=186) + Output:["_col0","_col1","_col2"],aggregations:["count(VALUE._col0)"],keys:KEY._col0, KEY._col1 + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0, _col1 + Group By Operator [GBY_12] (rows=83 width=186) + Output:["_col0","_col1","_col2"],aggregations:["count()"],keys:_col0, _col1 + Merge Join Operator [MERGEJOIN_43] (rows=166 width=178) + Output:["_col0","_col1"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_8] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=166 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_38] (rows=166 width=178) + predicate:(key > '8') + TableScan [TS_0] (rows=500 width=178) + default@src_cbo,b,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] + <-Map 5 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col0 + Group By Operator [GBY_7] (rows=69 width=87) + Output:["_col0"],keys:_col0 + Select Operator [SEL_5] (rows=166 width=87) + Output:["_col0"] + Filter Operator [FIL_39] (rows=166 width=87) + predicate:(key > '8') + TableScan [TS_3] (rows=500 width=87) + default@src_cbo,b,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] + <-Reducer 7 [SIMPLE_EDGE] + SHUFFLE [RS_28] + PartitionCols:_col0 + Group By Operator [GBY_26] (rows=34 width=8) + Output:["_col0"],keys:_col0 + Select Operator [SEL_24] (rows=69 width=8) + Output:["_col0"] + Filter Operator [FIL_40] (rows=69 width=8) + predicate:_col1 is not null + Select Operator [SEL_42] (rows=69 width=8) + Output:["_col1"] + Group By Operator [GBY_22] (rows=69 width=95) + Output:["_col0","_col1"],aggregations:["count(VALUE._col0)"],keys:KEY._col0 + <-Map 6 [SIMPLE_EDGE] + SHUFFLE [RS_21] + PartitionCols:_col0 + Group By Operator [GBY_20] (rows=69 width=95) + Output:["_col0","_col1"],aggregations:["count()"],keys:key + Filter Operator [FIL_41] (rows=166 width=87) + predicate:(key > '9') + TableScan [TS_17] (rows=500 width=87) + default@src_cbo,b,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] PREHOOK: query: explain select p_mfgr, p_name, avg(p_size) from part @@ -3609,84 +2267,47 @@ Reducer 3 <- Reducer 2 (SIMPLE_EDGE), Reducer 5 (SIMPLE_EDGE) Reducer 5 <- Map 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 3 - File Output Operator [FS_21] - compressed:false - Statistics:Num rows: 6 Data size: 1362 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Merge Join Operator [MERGEJOIN_26] - | condition map:[{"":"Left Semi Join 0 to 1"}] - | keys:{"0":"_col1 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 6 Data size: 1362 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - | Reduce Output Operator [RS_17] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 13 Data size: 2951 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col0 (type: string), _col2 (type: double) - | Select Operator [SEL_6] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 13 Data size: 2951 Basic stats: COMPLETE Column stats: COMPLETE - | Group By Operator [GBY_5] - | | aggregations:["avg(VALUE._col0)"] - | | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 13 Data size: 2951 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_4] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 13 Data size: 2847 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col2 (type: struct) - | Group By Operator [GBY_3] - | aggregations:["avg(p_size)"] - | keys:p_name (type: string), p_mfgr (type: string) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 13 Data size: 2847 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_24] - | predicate:p_name is not null (type: boolean) - | Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:part - | Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 13 Data size: 2392 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_16] - keys:_col0 (type: string) - outputColumnNames:["_col0"] - Statistics:Num rows: 13 Data size: 2392 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_11] - outputColumnNames:["_col0"] - Statistics:Num rows: 26 Data size: 4784 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_25] - predicate:first_value_window_0 is not null (type: boolean) - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_10] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col5","partition by:":"_col2"}] - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_9] - | outputColumnNames:["_col1","_col2","_col5"] - | Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_8] - key expressions:p_mfgr (type: string), p_size (type: int) - Map-reduce partition columns:p_mfgr (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:p_name (type: string) - TableScan [TS_7] - alias:part - Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 3 + File Output Operator [FS_21] + Merge Join Operator [MERGEJOIN_26] (rows=6 width=227) + Output:["_col0","_col1","_col2"],keys:{"0":"_col1","1":"_col0"} + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_17] + PartitionCols:_col1 + Select Operator [SEL_6] (rows=13 width=227) + Output:["_col0","_col1","_col2"] + Group By Operator [GBY_5] (rows=13 width=227) + Output:["_col0","_col1","_col2"],aggregations:["avg(VALUE._col0)"],keys:KEY._col0, KEY._col1 + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:_col0, _col1 + Group By Operator [GBY_3] (rows=13 width=219) + Output:["_col0","_col1","_col2"],aggregations:["avg(p_size)"],keys:p_name, p_mfgr + Filter Operator [FIL_24] (rows=26 width=223) + predicate:p_name is not null + TableScan [TS_0] (rows=26 width=223) + default@part,part,Tbl:COMPLETE,Col:COMPLETE,Output:["p_name","p_mfgr","p_size"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col0 + Group By Operator [GBY_16] (rows=13 width=184) + Output:["_col0"],keys:_col0 + Select Operator [SEL_11] (rows=26 width=184) + Output:["_col0"] + Filter Operator [FIL_25] (rows=26 width=491) + predicate:first_value_window_0 is not null + PTF Operator [PTF_10] (rows=26 width=491) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col5","partition by:":"_col2"}] + Select Operator [SEL_9] (rows=26 width=491) + Output:["_col1","_col2","_col5"] + <-Map 4 [SIMPLE_EDGE] + SHUFFLE [RS_8] + PartitionCols:p_mfgr + TableScan [TS_7] (rows=26 width=223) + default@part,part,Tbl:COMPLETE,Col:COMPLETE,Output:["p_mfgr","p_name","p_size"] PREHOOK: query: explain select * from src_cbo @@ -3711,102 +2332,57 @@ Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Reducer 6 <- Map 5 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 4 - File Output Operator [FS_25] - compressed:false - Statistics:Num rows: 1 Data size: 178 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_24] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 178 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_23] - key expressions:_col0 (type: string) - sort order:+ - Statistics:Num rows: 1 Data size: 178 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: string) - Select Operator [SEL_22] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 178 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_21] - predicate:_col3 is null (type: boolean) - Statistics:Num rows: 1 Data size: 265 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_30] - | condition map:[{"":"Left Outer Join0 to 1"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col0","_col1","_col3"] - | Statistics:Num rows: 404 Data size: 107060 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 7 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 166 Data size: 14442 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_13] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 166 Data size: 14442 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_28] - | predicate:(key > '2') (type: boolean) - | Statistics:Num rows: 166 Data size: 14442 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_11] - | alias:src_cbo - | Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: string) - Merge Join Operator [MERGEJOIN_29] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{} - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_15] - | sort order: - | Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col0 (type: string), _col1 (type: string) - | Select Operator [SEL_1] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:src_cbo - | Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_16] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_10] - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_9] - predicate:(_col0 = 0) (type: boolean) - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_7] - | aggregations:["count(VALUE._col0)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_6] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: bigint) - Group By Operator [GBY_5] - aggregations:["count()"] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_4] - Statistics:Num rows: 1 Data size: 87 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_27] - predicate:((key > '2') and key is null) (type: boolean) - Statistics:Num rows: 1 Data size: 87 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_2] - alias:src_cbo - Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 4 + File Output Operator [FS_25] + Select Operator [SEL_24] (rows=1 width=178) + Output:["_col0","_col1"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_23] + Select Operator [SEL_22] (rows=1 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_21] (rows=1 width=265) + predicate:_col3 is null + Merge Join Operator [MERGEJOIN_30] (rows=404 width=265) + Output:["_col0","_col1","_col3"],keys:{"0":"_col0","1":"_col0"} + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_13] (rows=166 width=87) + Output:["_col0"] + Filter Operator [FIL_28] (rows=166 width=87) + predicate:(key > '2') + TableScan [TS_11] (rows=500 width=87) + default@src_cbo,src_cbo,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_29] (rows=500 width=178) + Output:["_col0","_col1"],keys:{} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_15] + Select Operator [SEL_1] (rows=500 width=178) + Output:["_col0","_col1"] + TableScan [TS_0] (rows=500 width=178) + default@src_cbo,src_cbo,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_16] + Select Operator [SEL_10] (rows=1 width=8) + Filter Operator [FIL_9] (rows=1 width=8) + predicate:(_col0 = 0) + Group By Operator [GBY_7] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Map 5 [SIMPLE_EDGE] + SHUFFLE [RS_6] + Group By Operator [GBY_5] (rows=1 width=8) + Output:["_col0"],aggregations:["count()"] + Select Operator [SEL_4] (rows=1 width=87) + Filter Operator [FIL_27] (rows=1 width=87) + predicate:((key > '2') and key is null) + TableScan [TS_2] (rows=500 width=87) + default@src_cbo,src_cbo,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] PREHOOK: query: explain select p_mfgr, b.p_name, p_size from part b @@ -3832,93 +2408,53 @@ Reducer 3 <- Map 6 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) Reducer 5 <- Map 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 3 - File Output Operator [FS_23] - compressed:false - Statistics:Num rows: 1 Data size: 223 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_22] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 223 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_21] - predicate:_col4 is null (type: boolean) - Statistics:Num rows: 1 Data size: 344 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_28] - | condition map:[{"":"Left Outer Join0 to 1"}] - | keys:{"0":"_col0 (type: string), _col1 (type: string)","1":"_col0 (type: string), _col1 (type: string)"} - | outputColumnNames:["_col0","_col1","_col2","_col4"] - | Statistics:Num rows: 1 Data size: 344 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 6 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 8 Data size: 1752 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_13] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 8 Data size: 1752 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_26] - | predicate:(p_size < 10) (type: boolean) - | Statistics:Num rows: 8 Data size: 1784 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_11] - | alias:b - | Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_18] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col2 (type: int) - Merge Join Operator [MERGEJOIN_27] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{} - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_15] - | sort order: - | Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col0 (type: string), _col1 (type: string), _col2 (type: int) - | Select Operator [SEL_1] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:b - | Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_16] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_10] - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_9] - predicate:(_col0 = 0) (type: boolean) - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_7] - | aggregations:["count(VALUE._col0)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_6] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: bigint) - Group By Operator [GBY_5] - aggregations:["count()"] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_4] - Statistics:Num rows: 1 Data size: 223 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_25] - predicate:((p_size < 10) and (p_name is null or p_mfgr is null)) (type: boolean) - Statistics:Num rows: 1 Data size: 223 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_2] - alias:b - Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 3 + File Output Operator [FS_23] + Select Operator [SEL_22] (rows=1 width=223) + Output:["_col0","_col1","_col2"] + Filter Operator [FIL_21] (rows=1 width=344) + predicate:_col4 is null + Merge Join Operator [MERGEJOIN_28] (rows=1 width=344) + Output:["_col0","_col1","_col2","_col4"],keys:{"0":"_col0, _col1","1":"_col0, _col1"} + <-Map 6 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0, _col1 + Select Operator [SEL_13] (rows=8 width=219) + Output:["_col0","_col1"] + Filter Operator [FIL_26] (rows=8 width=223) + predicate:(p_size < 10) + TableScan [TS_11] (rows=26 width=223) + default@part,b,Tbl:COMPLETE,Col:COMPLETE,Output:["p_name","p_mfgr","p_size"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_18] + PartitionCols:_col0, _col1 + Merge Join Operator [MERGEJOIN_27] (rows=26 width=223) + Output:["_col0","_col1","_col2"],keys:{} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_15] + Select Operator [SEL_1] (rows=26 width=223) + Output:["_col0","_col1","_col2"] + TableScan [TS_0] (rows=26 width=223) + default@part,b,Tbl:COMPLETE,Col:COMPLETE,Output:["p_name","p_mfgr","p_size"] + <-Reducer 5 [SIMPLE_EDGE] + SHUFFLE [RS_16] + Select Operator [SEL_10] (rows=1 width=8) + Filter Operator [FIL_9] (rows=1 width=8) + predicate:(_col0 = 0) + Group By Operator [GBY_7] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Map 4 [SIMPLE_EDGE] + SHUFFLE [RS_6] + Group By Operator [GBY_5] (rows=1 width=8) + Output:["_col0"],aggregations:["count()"] + Select Operator [SEL_4] (rows=1 width=223) + Filter Operator [FIL_25] (rows=1 width=223) + predicate:((p_size < 10) and (p_name is null or p_mfgr is null)) + TableScan [TS_2] (rows=26 width=223) + default@part,b,Tbl:COMPLETE,Col:COMPLETE,Output:["p_name","p_mfgr","p_size"] PREHOOK: query: explain select p_name, p_size from @@ -3946,119 +2482,65 @@ Reducer 6 <- Map 5 (SIMPLE_EDGE) Reducer 8 <- Map 7 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 4 - File Output Operator [FS_36] - compressed:false - Statistics:Num rows: 1 Data size: 125 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_35] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 125 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_34] - key expressions:_col0 (type: string) - sort order:+ - Statistics:Num rows: 1 Data size: 125 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: int) - Select Operator [SEL_33] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 125 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_32] - predicate:_col3 is null (type: boolean) - Statistics:Num rows: 1 Data size: 133 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_42] - | condition map:[{"":"Left Outer Join0 to 1"}] - | keys:{"0":"UDFToDouble(_col1) (type: double)","1":"_col0 (type: double)"} - | outputColumnNames:["_col0","_col1","_col3"] - | Statistics:Num rows: 1 Data size: 133 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - | Reduce Output Operator [RS_29] - | key expressions:UDFToDouble(_col1) (type: double) - | Map-reduce partition columns:UDFToDouble(_col1) (type: double) - | sort order:+ - | Statistics:Num rows: 26 Data size: 3250 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col0 (type: string), _col1 (type: int) - | Merge Join Operator [MERGEJOIN_41] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{} - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 26 Data size: 3250 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Map 1 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_26] - | | sort order: - | | Statistics:Num rows: 26 Data size: 3250 Basic stats: COMPLETE Column stats: COMPLETE - | | value expressions:_col0 (type: string), _col1 (type: int) - | | Select Operator [SEL_1] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 26 Data size: 3250 Basic stats: COMPLETE Column stats: COMPLETE - | | TableScan [TS_0] - | | alias:part - | | Statistics:Num rows: 26 Data size: 3250 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Reducer 6 [SIMPLE_EDGE] - | Reduce Output Operator [RS_27] - | sort order: - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_17] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_16] - | predicate:(_col0 = 0) (type: boolean) - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - | Group By Operator [GBY_14] - | aggregations:["count()"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_10] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_9] - | predicate:_col0 is null (type: boolean) - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - | Group By Operator [GBY_7] - | | aggregations:["avg(VALUE._col0)"] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Map 5 [SIMPLE_EDGE] - | Reduce Output Operator [RS_6] - | sort order: - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: COMPLETE - | value expressions:_col0 (type: struct) - | Group By Operator [GBY_5] - | aggregations:["avg(p_size)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: COMPLETE - | Filter Operator [FIL_38] - | predicate:(p_size < 10) (type: boolean) - | Statistics:Num rows: 8 Data size: 32 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_2] - | alias:part - | Statistics:Num rows: 26 Data size: 104 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_30] - key expressions:_col0 (type: double) - Map-reduce partition columns:_col0 (type: double) - sort order:+ - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_23] - | aggregations:["avg(VALUE._col0)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_22] - sort order: - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: COMPLETE - value expressions:_col0 (type: struct) - Group By Operator [GBY_21] - aggregations:["avg(p_size)"] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: COMPLETE - Filter Operator [FIL_40] - predicate:(p_size < 10) (type: boolean) - Statistics:Num rows: 8 Data size: 32 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_18] - alias:part - Statistics:Num rows: 26 Data size: 104 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 4 + File Output Operator [FS_36] + Select Operator [SEL_35] (rows=1 width=125) + Output:["_col0","_col1"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_34] + Select Operator [SEL_33] (rows=1 width=125) + Output:["_col0","_col1"] + Filter Operator [FIL_32] (rows=1 width=133) + predicate:_col3 is null + Merge Join Operator [MERGEJOIN_42] (rows=1 width=133) + Output:["_col0","_col1","_col3"],keys:{"0":"UDFToDouble(_col1)","1":"_col0"} + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_29] + PartitionCols:UDFToDouble(_col1) + Merge Join Operator [MERGEJOIN_41] (rows=26 width=125) + Output:["_col0","_col1"],keys:{} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_26] + Select Operator [SEL_1] (rows=26 width=125) + Output:["_col0","_col1"] + TableScan [TS_0] (rows=26 width=125) + default@part,part,Tbl:COMPLETE,Col:COMPLETE,Output:["p_name","p_size"] + <-Reducer 6 [SIMPLE_EDGE] + SHUFFLE [RS_27] + Select Operator [SEL_17] (rows=1 width=8) + Filter Operator [FIL_16] (rows=1 width=8) + predicate:(_col0 = 0) + Group By Operator [GBY_14] (rows=1 width=8) + Output:["_col0"],aggregations:["count()"] + Select Operator [SEL_10] (rows=1 width=8) + Filter Operator [FIL_9] (rows=1 width=8) + predicate:_col0 is null + Group By Operator [GBY_7] (rows=1 width=8) + Output:["_col0"],aggregations:["avg(VALUE._col0)"] + <-Map 5 [SIMPLE_EDGE] + SHUFFLE [RS_6] + Group By Operator [GBY_5] (rows=1 width=0) + Output:["_col0"],aggregations:["avg(p_size)"] + Filter Operator [FIL_38] (rows=8 width=4) + predicate:(p_size < 10) + TableScan [TS_2] (rows=26 width=4) + default@part,part,Tbl:COMPLETE,Col:COMPLETE,Output:["p_size"] + <-Reducer 8 [SIMPLE_EDGE] + SHUFFLE [RS_30] + PartitionCols:_col0 + Group By Operator [GBY_23] (rows=1 width=8) + Output:["_col0"],aggregations:["avg(VALUE._col0)"] + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_22] + Group By Operator [GBY_21] (rows=1 width=0) + Output:["_col0"],aggregations:["avg(p_size)"] + Filter Operator [FIL_40] (rows=8 width=4) + predicate:(p_size < 10) + TableScan [TS_18] (rows=26 width=4) + default@part,part,Tbl:COMPLETE,Col:COMPLETE,Output:["p_size"] PREHOOK: query: explain select b.p_mfgr, min(p_retailprice) from part b @@ -4092,155 +2574,80 @@ Reducer 7 <- Map 6 (SIMPLE_EDGE) Reducer 8 <- Reducer 7 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 5 - File Output Operator [FS_38] - compressed:false - Statistics:Num rows: 1 Data size: 106 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_37] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 106 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_36] - key expressions:_col0 (type: string) - sort order:+ - Statistics:Num rows: 1 Data size: 106 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: double) - Select Operator [SEL_35] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 106 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_34] - predicate:_col3 is null (type: boolean) - Statistics:Num rows: 1 Data size: 204 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_43] - | condition map:[{"":"Left Outer Join0 to 1"}] - | keys:{"0":"_col0 (type: string), _col1 (type: double)","1":"_col0 (type: string), _col1 (type: double)"} - | outputColumnNames:["_col0","_col1","_col3"] - | Statistics:Num rows: 1 Data size: 204 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_32] - | key expressions:_col0 (type: string), _col1 (type: double) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: double) - | sort order:++ - | Statistics:Num rows: 1 Data size: 106 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_26] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 106 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_40] - | predicate:((_col2 - _col1) > 600.0) (type: boolean) - | Statistics:Num rows: 1 Data size: 114 Basic stats: COMPLETE Column stats: COMPLETE - | Group By Operator [GBY_24] - | | aggregations:["min(VALUE._col0)","max(VALUE._col1)"] - | | keys:KEY._col0 (type: string) - | | outputColumnNames:["_col0","_col1","_col2"] - | | Statistics:Num rows: 5 Data size: 570 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_23] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 5 Data size: 570 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: double), _col2 (type: double) - | Group By Operator [GBY_22] - | aggregations:["min(p_retailprice)","max(p_retailprice)"] - | keys:p_mfgr (type: string) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 5 Data size: 570 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_20] - | alias:b - | Statistics:Num rows: 26 Data size: 2756 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_31] - key expressions:_col0 (type: string), _col1 (type: double) - Map-reduce partition columns:_col0 (type: string), _col1 (type: double) - sort order:++ - Statistics:Num rows: 5 Data size: 530 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_42] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{} - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 5 Data size: 530 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - | Reduce Output Operator [RS_28] - | sort order: - | Statistics:Num rows: 5 Data size: 530 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col0 (type: string), _col1 (type: double) - | Group By Operator [GBY_4] - | | aggregations:["min(VALUE._col0)"] - | | keys:KEY._col0 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 5 Data size: 530 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_3] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 5 Data size: 530 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: double) - | Group By Operator [GBY_2] - | aggregations:["min(p_retailprice)"] - | keys:p_mfgr (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 5 Data size: 530 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_1] - | outputColumnNames:["p_mfgr","p_retailprice"] - | Statistics:Num rows: 26 Data size: 2756 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:b - | Statistics:Num rows: 26 Data size: 2756 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 8 [SIMPLE_EDGE] - Reduce Output Operator [RS_29] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_19] - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_18] - predicate:(_col0 = 0) (type: boolean) - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_16] - | aggregations:["count(VALUE._col0)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_15] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: bigint) - Group By Operator [GBY_14] - aggregations:["count()"] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_12] - Statistics:Num rows: 1 Data size: 114 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_11] - predicate:(((_col2 - _col1) > 600.0) and (_col0 is null or _col1 is null)) (type: boolean) - Statistics:Num rows: 1 Data size: 114 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_10] - | aggregations:["min(VALUE._col0)","max(VALUE._col1)"] - | keys:KEY._col0 (type: string) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 5 Data size: 570 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_9] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 5 Data size: 570 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: double), _col2 (type: double) - Group By Operator [GBY_8] - aggregations:["min(p_retailprice)","max(p_retailprice)"] - keys:p_mfgr (type: string) - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 5 Data size: 570 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_7] - outputColumnNames:["p_mfgr","p_retailprice"] - Statistics:Num rows: 26 Data size: 2756 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_6] - alias:b - Statistics:Num rows: 26 Data size: 2756 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 5 + File Output Operator [FS_38] + Select Operator [SEL_37] (rows=1 width=106) + Output:["_col0","_col1"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_36] + Select Operator [SEL_35] (rows=1 width=106) + Output:["_col0","_col1"] + Filter Operator [FIL_34] (rows=1 width=204) + predicate:_col3 is null + Merge Join Operator [MERGEJOIN_43] (rows=1 width=204) + Output:["_col0","_col1","_col3"],keys:{"0":"_col0, _col1","1":"_col0, _col1"} + <-Reducer 10 [SIMPLE_EDGE] + SHUFFLE [RS_32] + PartitionCols:_col0, _col1 + Select Operator [SEL_26] (rows=1 width=106) + Output:["_col0","_col1"] + Filter Operator [FIL_40] (rows=1 width=114) + predicate:((_col2 - _col1) > 600.0) + Group By Operator [GBY_24] (rows=5 width=114) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)"],keys:KEY._col0 + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_23] + PartitionCols:_col0 + Group By Operator [GBY_22] (rows=5 width=114) + Output:["_col0","_col1","_col2"],aggregations:["min(p_retailprice)","max(p_retailprice)"],keys:p_mfgr + TableScan [TS_20] (rows=26 width=106) + default@part,b,Tbl:COMPLETE,Col:COMPLETE,Output:["p_mfgr","p_retailprice"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_31] + PartitionCols:_col0, _col1 + Merge Join Operator [MERGEJOIN_42] (rows=5 width=106) + Output:["_col0","_col1"],keys:{} + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_28] + Group By Operator [GBY_4] (rows=5 width=106) + Output:["_col0","_col1"],aggregations:["min(VALUE._col0)"],keys:KEY._col0 + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_3] + PartitionCols:_col0 + Group By Operator [GBY_2] (rows=5 width=106) + Output:["_col0","_col1"],aggregations:["min(p_retailprice)"],keys:p_mfgr + Select Operator [SEL_1] (rows=26 width=106) + Output:["p_mfgr","p_retailprice"] + TableScan [TS_0] (rows=26 width=106) + default@part,b,Tbl:COMPLETE,Col:COMPLETE,Output:["p_mfgr","p_retailprice"] + <-Reducer 8 [SIMPLE_EDGE] + SHUFFLE [RS_29] + Select Operator [SEL_19] (rows=1 width=8) + Filter Operator [FIL_18] (rows=1 width=8) + predicate:(_col0 = 0) + Group By Operator [GBY_16] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Reducer 7 [SIMPLE_EDGE] + SHUFFLE [RS_15] + Group By Operator [GBY_14] (rows=1 width=8) + Output:["_col0"],aggregations:["count()"] + Select Operator [SEL_12] (rows=1 width=114) + Filter Operator [FIL_11] (rows=1 width=114) + predicate:(((_col2 - _col1) > 600.0) and (_col0 is null or _col1 is null)) + Group By Operator [GBY_10] (rows=5 width=114) + Output:["_col0","_col1","_col2"],aggregations:["min(VALUE._col0)","max(VALUE._col1)"],keys:KEY._col0 + <-Map 6 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col0 + Group By Operator [GBY_8] (rows=5 width=114) + Output:["_col0","_col1","_col2"],aggregations:["min(p_retailprice)","max(p_retailprice)"],keys:p_mfgr + Select Operator [SEL_7] (rows=26 width=106) + Output:["p_mfgr","p_retailprice"] + TableScan [TS_6] (rows=26 width=106) + default@part,b,Tbl:COMPLETE,Col:COMPLETE,Output:["p_mfgr","p_retailprice"] PREHOOK: query: explain select count(c_int) over(), sum(c_float) over(), max(c_int) over(), min(c_int) over(), row_number() over(), rank() over(), dense_rank() over(), percent_rank() over(), lead(c_int, 2, c_int) over(), lag(c_float, 2, c_float) over() from cbo_t1 PREHOOK: type: QUERY @@ -4252,33 +2659,22 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_6] - compressed:false - Statistics:Num rows: 20 Data size: 1040 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_4] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] - Statistics:Num rows: 20 Data size: 1040 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_3] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"0","partition by:":"0"}] - Statistics:Num rows: 20 Data size: 9184 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_2] - | outputColumnNames:["_col2","_col3"] - | Statistics:Num rows: 20 Data size: 9184 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_1] - key expressions:0 (type: int) - Map-reduce partition columns:0 (type: int) - sort order:+ - Statistics:Num rows: 20 Data size: 144 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:c_int (type: int), c_float (type: float) - TableScan [TS_0] - alias:cbo_t1 - Statistics:Num rows: 20 Data size: 144 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_6] + Select Operator [SEL_4] (rows=20 width=52) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] + PTF Operator [PTF_3] (rows=20 width=459) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"0","partition by:":"0"}] + Select Operator [SEL_2] (rows=20 width=459) + Output:["_col2","_col3"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_1] + PartitionCols:0 + TableScan [TS_0] (rows=20 width=7) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE,Output:["c_float","c_int"] PREHOOK: query: explain select * from (select count(c_int) over(), sum(c_float) over(), max(c_int) over(), min(c_int) over(), row_number() over(), rank() over(), dense_rank() over(), percent_rank() over(), lead(c_int, 2, c_int) over(), lag(c_float, 2, c_float) over() from cbo_t1) cbo_t1 PREHOOK: type: QUERY @@ -4290,33 +2686,22 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_6] - compressed:false - Statistics:Num rows: 20 Data size: 1040 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_4] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] - Statistics:Num rows: 20 Data size: 1040 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_3] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"0","partition by:":"0"}] - Statistics:Num rows: 20 Data size: 9184 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_2] - | outputColumnNames:["_col2","_col3"] - | Statistics:Num rows: 20 Data size: 9184 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_1] - key expressions:0 (type: int) - Map-reduce partition columns:0 (type: int) - sort order:+ - Statistics:Num rows: 20 Data size: 144 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:c_int (type: int), c_float (type: float) - TableScan [TS_0] - alias:cbo_t1 - Statistics:Num rows: 20 Data size: 144 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_6] + Select Operator [SEL_4] (rows=20 width=52) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9"] + PTF Operator [PTF_3] (rows=20 width=459) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"0","partition by:":"0"}] + Select Operator [SEL_2] (rows=20 width=459) + Output:["_col2","_col3"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_1] + PartitionCols:0 + TableScan [TS_0] (rows=20 width=7) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE,Output:["c_float","c_int"] PREHOOK: query: explain select i, a, h, b, c, d, e, f, g, a as x, a +1 as y from (select max(c_int) over (partition by key order by value range UNBOUNDED PRECEDING) a, min(c_int) over (partition by key order by value range current row) b, count(c_int) over(partition by key order by value range 1 PRECEDING) c, avg(value) over (partition by key order by value range between unbounded preceding and unbounded following) d, sum(value) over (partition by key order by value range between unbounded preceding and current row) e, avg(c_float) over (partition by key order by value range between 1 preceding and unbounded following) f, sum(c_float) over (partition by key order by value range between 1 preceding and current row) g, max(c_float) over (partition by key order by value range between 1 preceding and unbounded following) h, min(c_float) over (partition by key order by value range between 1 preceding and 1 following) i from cbo_t1) cbo_t1 PREHOOK: type: QUERY @@ -4328,33 +2713,22 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_6] - compressed:false - Statistics:Num rows: 20 Data size: 1280 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_4] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10"] - Statistics:Num rows: 20 Data size: 1280 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_3] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col0"}] - Statistics:Num rows: 20 Data size: 12244 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 20 Data size: 12244 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_1] - key expressions:key (type: string), value (type: string) - Map-reduce partition columns:key (type: string) - sort order:++ - Statistics:Num rows: 20 Data size: 3204 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:c_int (type: int), c_float (type: float) - TableScan [TS_0] - alias:cbo_t1 - Statistics:Num rows: 20 Data size: 3204 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_6] + Select Operator [SEL_4] (rows=20 width=64) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8","_col9","_col10"] + PTF Operator [PTF_3] (rows=20 width=612) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col0"}] + Select Operator [SEL_2] (rows=20 width=612) + Output:["_col0","_col1","_col2","_col3"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_1] + PartitionCols:key + TableScan [TS_0] (rows=20 width=160) + default@cbo_t1,cbo_t1,Tbl:COMPLETE,Col:COMPLETE,Output:["c_float","c_int","key","value"] PREHOOK: query: explain select *, rank() over(partition by key order by value) as rr from src1 PREHOOK: type: QUERY @@ -4366,32 +2740,22 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_6] - compressed:false - Statistics:Num rows: 25 Data size: 4475 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_4] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 25 Data size: 4475 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_3] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col0"}] - Statistics:Num rows: 25 Data size: 11075 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 25 Data size: 11075 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_1] - key expressions:key (type: string), value (type: string) - Map-reduce partition columns:key (type: string) - sort order:++ - Statistics:Num rows: 25 Data size: 4375 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_0] - alias:src1 - Statistics:Num rows: 25 Data size: 4375 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_6] + Select Operator [SEL_4] (rows=25 width=179) + Output:["_col0","_col1","_col2"] + PTF Operator [PTF_3] (rows=25 width=443) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col0"}] + Select Operator [SEL_2] (rows=25 width=443) + Output:["_col0","_col1"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_1] + PartitionCols:key + TableScan [TS_0] (rows=25 width=175) + default@src1,src1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] PREHOOK: query: explain select SUM(HASH(tmp.key)), SUM(HASH(tmp.cnt)) @@ -4413,82 +2777,46 @@ Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 4 - File Output Operator [FS_20] - compressed:false - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_18] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_17] - sort order: - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: bigint), _col1 (type: bigint) - Group By Operator [GBY_16] - aggregations:["sum(_col0)","sum(_col1)"] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_14] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 14 Data size: 1316 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_13] - | aggregations:["count(VALUE._col0)"] - | keys:KEY._col0 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 14 Data size: 1316 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_12] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 14 Data size: 1316 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: bigint) - Group By Operator [GBY_11] - aggregations:["count(1)"] - keys:_col0 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 14 Data size: 1316 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_25] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col0"] - | Statistics:Num rows: 60 Data size: 5160 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_6] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_2] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_23] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:x - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_7] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_24] - predicate:key is not null (type: boolean) - Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_3] - alias:y - Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 4 + File Output Operator [FS_20] + Group By Operator [GBY_18] (rows=1 width=16) + Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_17] + Group By Operator [GBY_16] (rows=1 width=16) + Output:["_col0","_col1"],aggregations:["sum(_col0)","sum(_col1)"] + Select Operator [SEL_14] (rows=14 width=94) + Output:["_col0","_col1"] + Group By Operator [GBY_13] (rows=14 width=94) + Output:["_col0","_col1"],aggregations:["count(VALUE._col0)"],keys:KEY._col0 + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col0 + Group By Operator [GBY_11] (rows=14 width=94) + Output:["_col0","_col1"],aggregations:["count(1)"],keys:_col0 + Merge Join Operator [MERGEJOIN_25] (rows=60 width=86) + Output:["_col0"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_6] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=25 width=86) + Output:["_col0"] + Filter Operator [FIL_23] (rows=25 width=86) + predicate:key is not null + TableScan [TS_0] (rows=25 width=86) + default@src1,x,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] + <-Map 5 [SIMPLE_EDGE] + SHUFFLE [RS_7] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=500 width=87) + Output:["_col0"] + Filter Operator [FIL_24] (rows=500 width=87) + predicate:key is not null + TableScan [TS_3] (rows=500 width=87) + default@src,y,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] PREHOOK: query: explain select SUM(HASH(tmp.key)), SUM(HASH(tmp.cnt)) @@ -4510,82 +2838,46 @@ Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 4 - File Output Operator [FS_20] - compressed:false - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_18] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_17] - sort order: - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: bigint), _col1 (type: bigint) - Group By Operator [GBY_16] - aggregations:["sum(_col0)","sum(_col1)"] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_14] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 14 Data size: 1316 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_13] - | aggregations:["count(VALUE._col0)"] - | keys:KEY._col0 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 14 Data size: 1316 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_12] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 14 Data size: 1316 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: bigint) - Group By Operator [GBY_11] - aggregations:["count(1)"] - keys:_col0 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 14 Data size: 1316 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_25] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col0"] - | Statistics:Num rows: 60 Data size: 5160 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_6] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_2] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_23] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:x - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_7] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_24] - predicate:key is not null (type: boolean) - Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_3] - alias:y - Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 4 + File Output Operator [FS_20] + Group By Operator [GBY_18] (rows=1 width=16) + Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_17] + Group By Operator [GBY_16] (rows=1 width=16) + Output:["_col0","_col1"],aggregations:["sum(_col0)","sum(_col1)"] + Select Operator [SEL_14] (rows=14 width=94) + Output:["_col0","_col1"] + Group By Operator [GBY_13] (rows=14 width=94) + Output:["_col0","_col1"],aggregations:["count(VALUE._col0)"],keys:KEY._col0 + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col0 + Group By Operator [GBY_11] (rows=14 width=94) + Output:["_col0","_col1"],aggregations:["count(1)"],keys:_col0 + Merge Join Operator [MERGEJOIN_25] (rows=60 width=86) + Output:["_col0"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_6] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=25 width=86) + Output:["_col0"] + Filter Operator [FIL_23] (rows=25 width=86) + predicate:key is not null + TableScan [TS_0] (rows=25 width=86) + default@src1,x,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] + <-Map 5 [SIMPLE_EDGE] + SHUFFLE [RS_7] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=500 width=87) + Output:["_col0"] + Filter Operator [FIL_24] (rows=500 width=87) + predicate:key is not null + TableScan [TS_3] (rows=500 width=87) + default@src,y,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] PREHOOK: query: explain select SUM(HASH(tmp.key)), SUM(HASH(tmp.cnt)) @@ -4607,77 +2899,43 @@ Reducer 3 <- Map 2 (SIMPLE_EDGE) Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 4 - File Output Operator [FS_20] - compressed:false - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_18] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_17] - sort order: - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: bigint), _col1 (type: bigint) - Group By Operator [GBY_16] - aggregations:["sum(_col0)","sum(_col1)"] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_14] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 14 Data size: 1316 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_13] - | aggregations:["count(VALUE._col0)"] - | keys:KEY._col0 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 14 Data size: 1316 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_12] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 14 Data size: 1316 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: bigint) - Group By Operator [GBY_11] - aggregations:["count(1)"] - keys:_col0 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 14 Data size: 1316 Basic stats: COMPLETE Column stats: COMPLETE - Map Join Operator [MAPJOIN_25] - | condition map:[{"":"Inner Join 0 to 1"}] - | HybridGraceHashJoin:true - | keys:{"Map 1":"_col0 (type: string)","Map 2":"_col0 (type: string)"} - | outputColumnNames:["_col0"] - | Statistics:Num rows: 60 Data size: 5160 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [BROADCAST_EDGE] - | Reduce Output Operator [RS_6] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_2] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_23] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:x - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - |<-Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_24] - predicate:key is not null (type: boolean) - Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_3] - alias:y - Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 4 + File Output Operator [FS_20] + Group By Operator [GBY_18] (rows=1 width=16) + Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_17] + Group By Operator [GBY_16] (rows=1 width=16) + Output:["_col0","_col1"],aggregations:["sum(_col0)","sum(_col1)"] + Select Operator [SEL_14] (rows=14 width=94) + Output:["_col0","_col1"] + Group By Operator [GBY_13] (rows=14 width=94) + Output:["_col0","_col1"],aggregations:["count(VALUE._col0)"],keys:KEY._col0 + <-Map 2 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col0 + Group By Operator [GBY_11] (rows=14 width=94) + Output:["_col0","_col1"],aggregations:["count(1)"],keys:_col0 + Map Join Operator [MAPJOIN_25] (rows=60 width=86) + HybridGraceHashJoin:true,Output:["_col0"],keys:{"RS_6":"_col0","SEL_5":"_col0"} + <-Map 1 [BROADCAST_EDGE] + BROADCAST [RS_6] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=25 width=86) + Output:["_col0"] + Filter Operator [FIL_23] (rows=25 width=86) + predicate:key is not null + TableScan [TS_0] (rows=25 width=86) + default@src1,x,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] + <-Select Operator [SEL_5] (rows=500 width=87) + Output:["_col0"] + Filter Operator [FIL_24] (rows=500 width=87) + predicate:key is not null + TableScan [TS_3] (rows=500 width=87) + default@src,y,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] PREHOOK: query: explain select SUM(HASH(tmp.key)), SUM(HASH(tmp.cnt)) @@ -4699,97 +2957,56 @@ Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 4 - File Output Operator [FS_22] - compressed:false - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_20] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_19] - sort order: - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: bigint), _col1 (type: bigint) - Group By Operator [GBY_18] - aggregations:["sum(_col0)","sum(_col1)"] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_16] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 12 Data size: 1128 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_15] - | aggregations:["count(VALUE._col0)"] - | keys:KEY._col0 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 12 Data size: 1128 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_14] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 12 Data size: 1128 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: bigint) - Group By Operator [GBY_13] - aggregations:["count(1)"] - keys:_col0 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 12 Data size: 1128 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_27] - | condition map:[{"":"Left Semi Join 0 to 1"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col0"] - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_8] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_2] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_25] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:x - | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_9] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 205 Data size: 17835 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_7] - keys:_col0 (type: string) - outputColumnNames:["_col0"] - Statistics:Num rows: 205 Data size: 17835 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_26] - predicate:key is not null (type: boolean) - Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_3] - alias:y - Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 4 + File Output Operator [FS_22] + Group By Operator [GBY_20] (rows=1 width=16) + Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_19] + Group By Operator [GBY_18] (rows=1 width=16) + Output:["_col0","_col1"],aggregations:["sum(_col0)","sum(_col1)"] + Select Operator [SEL_16] (rows=12 width=94) + Output:["_col0","_col1"] + Group By Operator [GBY_15] (rows=12 width=94) + Output:["_col0","_col1"],aggregations:["count(VALUE._col0)"],keys:KEY._col0 + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_14] + PartitionCols:_col0 + Group By Operator [GBY_13] (rows=12 width=94) + Output:["_col0","_col1"],aggregations:["count(1)"],keys:_col0 + Merge Join Operator [MERGEJOIN_27] (rows=25 width=86) + Output:["_col0"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_8] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=25 width=86) + Output:["_col0"] + Filter Operator [FIL_25] (rows=25 width=86) + predicate:key is not null + TableScan [TS_0] (rows=25 width=86) + default@src1,x,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] + <-Map 5 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col0 + Group By Operator [GBY_7] (rows=205 width=87) + Output:["_col0"],keys:_col0 + Select Operator [SEL_5] (rows=500 width=87) + Output:["_col0"] + Filter Operator [FIL_26] (rows=500 width=87) + predicate:key is not null + TableScan [TS_3] (rows=500 width=87) + default@src,y,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] PREHOOK: query: explain create table abcd (a int, b int, c int, d int) PREHOOK: type: CREATETABLE POSTHOOK: query: explain create table abcd (a int, b int, c int, d int) POSTHOOK: type: CREATETABLE Stage-0 - Create Table Operator: - columns:["a int","b int","c int","d int"] - input format:org.apache.hadoop.mapred.TextInputFormat - name:default.abcd - output format:org.apache.hadoop.hive.ql.io.IgnoreKeyTextOutputFormat + Create Table Operator: + name:default.abcd PREHOOK: query: create table abcd (a int, b int, c int, d int) PREHOOK: type: CREATETABLE @@ -4817,37 +3034,22 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_6] - compressed:false - Statistics:Num rows: 2 Data size: 39 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_4] - | aggregations:["count(DISTINCT KEY._col1:0._col0)","count(DISTINCT KEY._col1:1._col0)","sum(VALUE._col2)"] - | keys:KEY._col0 (type: int) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 2 Data size: 39 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - key expressions:_col0 (type: int), _col1 (type: int), _col2 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+++ - Statistics:Num rows: 4 Data size: 78 Basic stats: COMPLETE Column stats: NONE - value expressions:_col5 (type: bigint) - Group By Operator [GBY_2] - aggregations:["count(DISTINCT b)","count(DISTINCT c)","sum(d)"] - keys:a (type: int), b (type: int), c (type: int) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 4 Data size: 78 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_1] - outputColumnNames:["a","b","c","d"] - Statistics:Num rows: 4 Data size: 78 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_0] - alias:abcd - Statistics:Num rows: 4 Data size: 78 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_6] + Group By Operator [GBY_4] (rows=2 width=19) + Output:["_col0","_col1","_col2","_col3"],aggregations:["count(DISTINCT KEY._col1:0._col0)","count(DISTINCT KEY._col1:1._col0)","sum(VALUE._col2)"],keys:KEY._col0 + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_3] + PartitionCols:_col0 + Group By Operator [GBY_2] (rows=4 width=19) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["count(DISTINCT b)","count(DISTINCT c)","sum(d)"],keys:a, b, c + Select Operator [SEL_1] (rows=4 width=19) + Output:["a","b","c","d"] + TableScan [TS_0] (rows=4 width=19) + default@abcd,abcd,Tbl:COMPLETE,Col:NONE,Output:["a","b","c","d"] PREHOOK: query: explain select a, count(distinct b), count(distinct c), sum(d) from abcd group by a PREHOOK: type: QUERY @@ -4859,43 +3061,28 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_5] - compressed:false - Statistics:Num rows: 2 Data size: 39 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_3] - | aggregations:["count(DISTINCT KEY._col1:0._col0)","count(DISTINCT KEY._col1:1._col0)","sum(VALUE._col0)"] - | keys:KEY._col0 (type: int) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 2 Data size: 39 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_2] - key expressions:a (type: int), b (type: int), c (type: int) - Map-reduce partition columns:a (type: int) - sort order:+++ - Statistics:Num rows: 4 Data size: 78 Basic stats: COMPLETE Column stats: NONE - value expressions:d (type: int) - Select Operator [SEL_1] - outputColumnNames:["a","b","c","d"] - Statistics:Num rows: 4 Data size: 78 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_0] - alias:abcd - Statistics:Num rows: 4 Data size: 78 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_5] + Group By Operator [GBY_3] (rows=2 width=19) + Output:["_col0","_col1","_col2","_col3"],aggregations:["count(DISTINCT KEY._col1:0._col0)","count(DISTINCT KEY._col1:1._col0)","sum(VALUE._col0)"],keys:KEY._col0 + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_2] + PartitionCols:a + Select Operator [SEL_1] (rows=4 width=19) + Output:["a","b","c","d"] + TableScan [TS_0] (rows=4 width=19) + default@abcd,abcd,Tbl:COMPLETE,Col:NONE,Output:["a","b","c","d"] PREHOOK: query: explain create table src_rc_merge_test(key int, value string) stored as rcfile PREHOOK: type: CREATETABLE POSTHOOK: query: explain create table src_rc_merge_test(key int, value string) stored as rcfile POSTHOOK: type: CREATETABLE Stage-0 - Create Table Operator: - columns:["key int","value string"] - input format:org.apache.hadoop.hive.ql.io.RCFileInputFormat - name:default.src_rc_merge_test - output format:org.apache.hadoop.hive.ql.io.RCFileOutputFormat + Create Table Operator: + name:default.src_rc_merge_test PREHOOK: query: create table src_rc_merge_test(key int, value string) stored as rcfile PREHOOK: type: CREATETABLE @@ -4918,11 +3105,8 @@ PREHOOK: type: CREATETABLE POSTHOOK: query: explain create table tgt_rc_merge_test(key int, value string) stored as rcfile POSTHOOK: type: CREATETABLE Stage-0 - Create Table Operator: - columns:["key int","value string"] - input format:org.apache.hadoop.hive.ql.io.RCFileInputFormat - name:default.tgt_rc_merge_test - output format:org.apache.hadoop.hive.ql.io.RCFileOutputFormat + Create Table Operator: + name:default.tgt_rc_merge_test PREHOOK: query: create table tgt_rc_merge_test(key int, value string) stored as rcfile PREHOOK: type: CREATETABLE @@ -4969,27 +3153,18 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_6] - compressed:true - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_4] - | aggregations:["count(1)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - sort order: - Statistics:Num rows: 5 Data size: 32 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_1] - Statistics:Num rows: 5 Data size: 32 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_0] - alias:tgt_rc_merge_test - Statistics:Num rows: 5 Data size: 32 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_6] + Group By Operator [GBY_4] (rows=1 width=8) + Output:["_col0"],aggregations:["count(1)"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_3] + Select Operator [SEL_1] (rows=5 width=6) + TableScan [TS_0] (rows=5 width=6) + default@tgt_rc_merge_test,tgt_rc_merge_test,Tbl:COMPLETE,Col:COMPLETE PREHOOK: query: explain select sum(hash(key)), sum(hash(value)) from tgt_rc_merge_test PREHOOK: type: QUERY @@ -5001,29 +3176,19 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_6] - compressed:true - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_4] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - sort order: - Statistics:Num rows: 5 Data size: 32 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col1 (type: int) - Select Operator [SEL_1] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 5 Data size: 32 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_0] - alias:tgt_rc_merge_test - Statistics:Num rows: 5 Data size: 32 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_6] + Group By Operator [GBY_4] (rows=1 width=16) + Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_3] + Select Operator [SEL_1] (rows=5 width=6) + Output:["_col0","_col1"] + TableScan [TS_0] (rows=5 width=6) + default@tgt_rc_merge_test,tgt_rc_merge_test,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: alter table tgt_rc_merge_test concatenate PREHOOK: type: ALTER_TABLE_MERGE @@ -5060,27 +3225,18 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_6] - compressed:true - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_4] - | aggregations:["count(1)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - sort order: - Statistics:Num rows: 1 Data size: 171 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_1] - Statistics:Num rows: 1 Data size: 171 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_0] - alias:tgt_rc_merge_test - Statistics:Num rows: 1 Data size: 171 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_6] + Group By Operator [GBY_4] (rows=1 width=8) + Output:["_col0"],aggregations:["count(1)"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_3] + Select Operator [SEL_1] (rows=1 width=171) + TableScan [TS_0] (rows=1 width=171) + default@tgt_rc_merge_test,tgt_rc_merge_test,Tbl:COMPLETE,Col:COMPLETE PREHOOK: query: explain select sum(hash(key)), sum(hash(value)) from tgt_rc_merge_test PREHOOK: type: QUERY @@ -5092,29 +3248,19 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_6] - compressed:true - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_4] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - sort order: - Statistics:Num rows: 1 Data size: 171 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col1 (type: int) - Select Operator [SEL_1] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 171 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_0] - alias:tgt_rc_merge_test - Statistics:Num rows: 1 Data size: 171 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_6] + Group By Operator [GBY_4] (rows=1 width=16) + Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_3] + Select Operator [SEL_1] (rows=1 width=171) + Output:["_col0","_col1"] + TableScan [TS_0] (rows=1 width=171) + default@tgt_rc_merge_test,tgt_rc_merge_test,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: drop table src_rc_merge_test PREHOOK: type: DROPTABLE @@ -5142,50 +3288,32 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_9] - compressed:true - Statistics:Num rows: 250000 Data size: 21750000 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Merge Join Operator [MERGEJOIN_10] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{} - | outputColumnNames:["_col0"] - | Statistics:Num rows: 250000 Data size: 21750000 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_5] - | sort order: - | Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col0 (type: string) - | Select Operator [SEL_1] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:src - | Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_6] - sort order: - Statistics:Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_3] - Statistics:Num rows: 500 Data size: 2000 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_2] - alias:src - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_9] + Merge Join Operator [MERGEJOIN_10] (rows=250000 width=87) + Output:["_col0"],keys:{} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_5] + Select Operator [SEL_1] (rows=500 width=87) + Output:["_col0"] + TableScan [TS_0] (rows=500 width=87) + default@src,src,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_6] + Select Operator [SEL_3] (rows=500 width=4) + TableScan [TS_2] (rows=500 width=10) + default@src,src,Tbl:COMPLETE,Col:COMPLETE PREHOOK: query: explain create table nzhang_Tmp(a int, b string) PREHOOK: type: CREATETABLE POSTHOOK: query: explain create table nzhang_Tmp(a int, b string) POSTHOOK: type: CREATETABLE Stage-0 - Create Table Operator: - columns:["a int","b string"] - input format:org.apache.hadoop.mapred.TextInputFormat - name:default.nzhang_Tmp - output format:org.apache.hadoop.hive.ql.io.IgnoreKeyTextOutputFormat + Create Table Operator: + name:default.nzhang_Tmp PREHOOK: query: create table nzhang_Tmp(a int, b string) PREHOOK: type: CREATETABLE @@ -5206,52 +3334,35 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Stage-3 - Stats-Aggr Operator - Stage-4 - Create Table Operator: - columns:["k string","value string"] - input format:org.apache.hadoop.mapred.TextInputFormat - name:default.nzhang_CTAS1 - output format:org.apache.hadoop.hive.ql.io.IgnoreKeyTextOutputFormat - Stage-2 - Dependency Collection{} - Stage-1 - Reducer 3 - File Output Operator [FS_8] - compressed:true - Statistics:Num rows: 10 Data size: 1780 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.nzhang_CTAS1"} - Limit [LIM_7] - Number of rows:10 - Statistics:Num rows: 10 Data size: 1780 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_6] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 10 Data size: 1780 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_5] - key expressions:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 10 Data size: 1780 Basic stats: COMPLETE Column stats: COMPLETE - Limit [LIM_4] - Number of rows:10 - Statistics:Num rows: 10 Data size: 1780 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_3] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_2] - key expressions:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_1] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_0] - alias:src - Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - Stage-0 - Move Operator - Please refer to the previous Stage-1 + Stats-Aggr Operator + Stage-4 + Create Table Operator: + name:default.nzhang_CTAS1 + Stage-2 + Dependency Collection{} + Stage-1 + Reducer 3 + File Output Operator [FS_8] + table:{"name:":"default.nzhang_CTAS1"} + Limit [LIM_7] (rows=10 width=178) + Number of rows:10 + Select Operator [SEL_6] (rows=10 width=178) + Output:["_col0","_col1"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_5] + Limit [LIM_4] (rows=10 width=178) + Number of rows:10 + Select Operator [SEL_3] (rows=500 width=178) + Output:["_col0","_col1"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_2] + Select Operator [SEL_1] (rows=500 width=178) + Output:["_col0","_col1"] + TableScan [TS_0] (rows=500 width=178) + default@src,src,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] + Stage-0 + Move Operator + Please refer to the previous Stage-1 PREHOOK: query: create table nzhang_CTAS1 as select key k, value from src sort by k, value limit 10 PREHOOK: type: CREATETABLE_AS_SELECT @@ -5274,52 +3385,35 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Stage-3 - Stats-Aggr Operator - Stage-4 - Create Table Operator: - columns:["half_key double","conb string"] - input format:org.apache.hadoop.hive.ql.io.RCFileInputFormat - name:default.nzhang_ctas3 - output format:org.apache.hadoop.hive.ql.io.RCFileOutputFormat - Stage-2 - Dependency Collection{} - Stage-1 - Reducer 3 - File Output Operator [FS_8] - compressed:true - Statistics:Num rows: 10 Data size: 1920 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.hive.ql.io.RCFileInputFormat","output format:":"org.apache.hadoop.hive.ql.io.RCFileOutputFormat","serde:":"org.apache.hadoop.hive.serde2.columnar.ColumnarSerDe","name:":"default.nzhang_ctas3"} - Limit [LIM_7] - Number of rows:10 - Statistics:Num rows: 10 Data size: 1920 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_6] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 10 Data size: 1920 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_5] - key expressions:_col0 (type: double), _col1 (type: string) - sort order:++ - Statistics:Num rows: 10 Data size: 1920 Basic stats: COMPLETE Column stats: COMPLETE - Limit [LIM_4] - Number of rows:10 - Statistics:Num rows: 10 Data size: 1920 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_3] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 96000 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_2] - key expressions:_col0 (type: double), _col1 (type: string) - sort order:++ - Statistics:Num rows: 500 Data size: 96000 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_1] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 500 Data size: 96000 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_0] - alias:src - Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - Stage-0 - Move Operator - Please refer to the previous Stage-1 + Stats-Aggr Operator + Stage-4 + Create Table Operator: + name:default.nzhang_ctas3 + Stage-2 + Dependency Collection{} + Stage-1 + Reducer 3 + File Output Operator [FS_8] + table:{"name:":"default.nzhang_ctas3"} + Limit [LIM_7] (rows=10 width=192) + Number of rows:10 + Select Operator [SEL_6] (rows=10 width=192) + Output:["_col0","_col1"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_5] + Limit [LIM_4] (rows=10 width=192) + Number of rows:10 + Select Operator [SEL_3] (rows=500 width=192) + Output:["_col0","_col1"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_2] + Select Operator [SEL_1] (rows=500 width=192) + Output:["_col0","_col1"] + TableScan [TS_0] (rows=500 width=178) + default@src,src,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] + Stage-0 + Move Operator + Please refer to the previous Stage-1 PREHOOK: query: create table nzhang_ctas3 row format serde "org.apache.hadoop.hive.serde2.columnar.ColumnarSerDe" stored as RCFile as select key/2 half_key, concat(value, "_con") conb from src sort by half_key, conb limit 10 PREHOOK: type: CREATETABLE_AS_SELECT @@ -5345,13 +3439,8 @@ PREHOOK: type: CREATETABLE POSTHOOK: query: explain create temporary table acid_dtt(a int, b varchar(128)) clustered by (a) into 2 buckets stored as orc TBLPROPERTIES ('transactional'='true') POSTHOOK: type: CREATETABLE Stage-0 - Create Table Operator: - # buckets:2 - bucket columns:["a"] - columns:["a int","b varchar(128)"] - input format:org.apache.hadoop.hive.ql.io.orc.OrcInputFormat - name:default.acid_dtt - output format:org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat + Create Table Operator: + name:default.acid_dtt PREHOOK: query: create temporary table acid_dtt(a int, b varchar(128)) clustered by (a) into 2 buckets stored as orc TBLPROPERTIES ('transactional'='true') PREHOOK: type: CREATETABLE @@ -5384,55 +3473,33 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 3 - File Output Operator [FS_12] - compressed:true - Statistics:Num rows: 27556 Data size: 9809936 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_11] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 27556 Data size: 9809936 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col3 (type: string) - sort order:++++ - Statistics:Num rows: 27556 Data size: 9809936 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_15] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{} - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 27556 Data size: 9809936 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_6] - | sort order: - | Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col0 (type: string), _col1 (type: string) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_13] - | predicate:(key < 10) (type: boolean) - | Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:src - | Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_7] - sort order: - Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: string), _col1 (type: string) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_14] - predicate:(key < 10) (type: boolean) - Statistics:Num rows: 166 Data size: 29548 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_3] - alias:src - Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 3 + File Output Operator [FS_12] + Select Operator [SEL_11] (rows=27556 width=356) + Output:["_col0","_col1","_col2","_col3"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_10] + Merge Join Operator [MERGEJOIN_15] (rows=27556 width=356) + Output:["_col0","_col1","_col2","_col3"],keys:{} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_6] + Select Operator [SEL_2] (rows=166 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_13] (rows=166 width=178) + predicate:(key < 10) + TableScan [TS_0] (rows=500 width=178) + default@src,src,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] + <-Map 4 [SIMPLE_EDGE] + SHUFFLE [RS_7] + Select Operator [SEL_5] (rows=166 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_14] (rows=166 width=178) + predicate:(key < 10) + TableScan [TS_3] (rows=500 width=178) + default@src,src,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] PREHOOK: query: CREATE TABLE myinput1(key int, value int) PREHOOK: type: CREATETABLE @@ -5460,42 +3527,25 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_6] - compressed:true - Statistics:Num rows: 3 Data size: 28 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 3 Data size: 28 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_7] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"key (type: int)","1":"value (type: int)"} - | outputColumnNames:["_col0","_col1","_col5","_col6"] - | Statistics:Num rows: 3 Data size: 28 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_2] - | key expressions:key (type: int) - | Map-reduce partition columns:key (type: int) - | sort order:+ - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - | value expressions:value (type: int) - | TableScan [TS_0] - | alias:a - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - key expressions:value (type: int) - Map-reduce partition columns:value (type: int) - sort order:+ - Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - value expressions:key (type: int) - TableScan [TS_1] - alias:b - Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_6] + Select Operator [SEL_5] (rows=3 width=9) + Output:["_col0","_col1","_col2","_col3"] + Merge Join Operator [MERGEJOIN_7] (rows=3 width=9) + Output:["_col0","_col1","_col5","_col6"],keys:{"0":"key","1":"value"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_2] + PartitionCols:key + TableScan [TS_0] (rows=3 width=8) + default@myinput1,a,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_3] + PartitionCols:value + TableScan [TS_1] (rows=3 width=8) + default@myinput1,b,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: explain select * from myinput1 a join myinput1 b on a.key<=>b.value join myinput1 c on a.key=c.key PREHOOK: type: QUERY @@ -5507,61 +3557,36 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_11] - compressed:true - Statistics:Num rows: 6 Data size: 57 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_10] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 6 Data size: 57 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_21] - | condition map:[{"":"Inner Join 0 to 1"},{"":"Inner Join 0 to 2"}] - | keys:{"0":"key (type: int)","1":"value (type: int)","2":"key (type: int)"} - | outputColumnNames:["_col0","_col1","_col5","_col6","_col10","_col11"] - | Statistics:Num rows: 6 Data size: 57 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_4] - | key expressions:key (type: int) - | Map-reduce partition columns:key (type: int) - | sort order:+ - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - | value expressions:value (type: int) - | Filter Operator [FIL_18] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:a - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - |<-Map 3 [SIMPLE_EDGE] - | Reduce Output Operator [RS_6] - | key expressions:value (type: int) - | Map-reduce partition columns:value (type: int) - | sort order:+ - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - | value expressions:key (type: int) - | Filter Operator [FIL_19] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_1] - | alias:b - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - |<-Map 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_8] - key expressions:key (type: int) - Map-reduce partition columns:key (type: int) - sort order:+ - Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - value expressions:value (type: int) - Filter Operator [FIL_20] - predicate:key is not null (type: boolean) - Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_2] - alias:c - Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_11] + Select Operator [SEL_10] (rows=6 width=9) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Merge Join Operator [MERGEJOIN_21] (rows=6 width=9) + Output:["_col0","_col1","_col5","_col6","_col10","_col11"],keys:{"0":"key","1":"value","2":"key"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:key + Filter Operator [FIL_18] (rows=3 width=8) + predicate:key is not null + TableScan [TS_0] (rows=3 width=8) + default@myinput1,a,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_6] + PartitionCols:value + Filter Operator [FIL_19] (rows=3 width=8) + predicate:value is not null + TableScan [TS_1] (rows=3 width=8) + default@myinput1,b,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map 4 [SIMPLE_EDGE] + SHUFFLE [RS_8] + PartitionCols:key + Filter Operator [FIL_20] (rows=3 width=8) + predicate:key is not null + TableScan [TS_2] (rows=3 width=8) + default@myinput1,c,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: explain select * from myinput1 a join myinput1 b on a.key<=>b.value join myinput1 c on a.key<=>c.key PREHOOK: type: QUERY @@ -5573,52 +3598,30 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_8] - compressed:true - Statistics:Num rows: 6 Data size: 57 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_7] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 6 Data size: 57 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_9] - | condition map:[{"":"Inner Join 0 to 1"},{"":"Inner Join 0 to 2"}] - | keys:{"0":"key (type: int)","1":"value (type: int)","2":"key (type: int)"} - | outputColumnNames:["_col0","_col1","_col5","_col6","_col10","_col11"] - | Statistics:Num rows: 6 Data size: 57 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_3] - | key expressions:key (type: int) - | Map-reduce partition columns:key (type: int) - | sort order:+ - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - | value expressions:value (type: int) - | TableScan [TS_0] - | alias:a - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - |<-Map 3 [SIMPLE_EDGE] - | Reduce Output Operator [RS_4] - | key expressions:value (type: int) - | Map-reduce partition columns:value (type: int) - | sort order:+ - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - | value expressions:key (type: int) - | TableScan [TS_1] - | alias:b - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - |<-Map 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_5] - key expressions:key (type: int) - Map-reduce partition columns:key (type: int) - sort order:+ - Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - value expressions:value (type: int) - TableScan [TS_2] - alias:c - Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_8] + Select Operator [SEL_7] (rows=6 width=9) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Merge Join Operator [MERGEJOIN_9] (rows=6 width=9) + Output:["_col0","_col1","_col5","_col6","_col10","_col11"],keys:{"0":"key","1":"value","2":"key"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_3] + PartitionCols:key + TableScan [TS_0] (rows=3 width=8) + default@myinput1,a,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:value + TableScan [TS_1] (rows=3 width=8) + default@myinput1,b,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map 4 [SIMPLE_EDGE] + SHUFFLE [RS_5] + PartitionCols:key + TableScan [TS_2] (rows=3 width=8) + default@myinput1,c,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: explain select * from myinput1 a join myinput1 b on a.key<=>b.value AND a.value=b.key join myinput1 c on a.key<=>c.key AND a.value=c.value PREHOOK: type: QUERY @@ -5630,58 +3633,36 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_11] - compressed:true - Statistics:Num rows: 6 Data size: 57 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_10] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 6 Data size: 57 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_15] - | condition map:[{"":"Inner Join 0 to 1"},{"":"Inner Join 0 to 2"}] - | keys:{"0":"key (type: int), value (type: int)","1":"value (type: int), key (type: int)","2":"key (type: int), value (type: int)"} - | outputColumnNames:["_col0","_col1","_col5","_col6","_col10","_col11"] - | Statistics:Num rows: 6 Data size: 57 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_4] - | key expressions:key (type: int), value (type: int) - | Map-reduce partition columns:key (type: int), value (type: int) - | sort order:++ - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_12] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:a - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - |<-Map 3 [SIMPLE_EDGE] - | Reduce Output Operator [RS_6] - | key expressions:value (type: int), key (type: int) - | Map-reduce partition columns:value (type: int), key (type: int) - | sort order:++ - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_13] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_1] - | alias:b - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - |<-Map 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_8] - key expressions:key (type: int), value (type: int) - Map-reduce partition columns:key (type: int), value (type: int) - sort order:++ - Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_14] - predicate:value is not null (type: boolean) - Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_2] - alias:c - Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_11] + Select Operator [SEL_10] (rows=6 width=9) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Merge Join Operator [MERGEJOIN_15] (rows=6 width=9) + Output:["_col0","_col1","_col5","_col6","_col10","_col11"],keys:{"0":"key, value","1":"value, key","2":"key, value"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:key, value + Filter Operator [FIL_12] (rows=3 width=8) + predicate:value is not null + TableScan [TS_0] (rows=3 width=8) + default@myinput1,a,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_6] + PartitionCols:value, key + Filter Operator [FIL_13] (rows=3 width=8) + predicate:key is not null + TableScan [TS_1] (rows=3 width=8) + default@myinput1,b,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map 4 [SIMPLE_EDGE] + SHUFFLE [RS_8] + PartitionCols:key, value + Filter Operator [FIL_14] (rows=3 width=8) + predicate:value is not null + TableScan [TS_2] (rows=3 width=8) + default@myinput1,c,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: explain select * from myinput1 a join myinput1 b on a.key<=>b.value AND a.value<=>b.key join myinput1 c on a.key<=>c.key AND a.value<=>c.value PREHOOK: type: QUERY @@ -5693,49 +3674,30 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_8] - compressed:true - Statistics:Num rows: 6 Data size: 57 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_7] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 6 Data size: 57 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_9] - | condition map:[{"":"Inner Join 0 to 1"},{"":"Inner Join 0 to 2"}] - | keys:{"0":"key (type: int), value (type: int)","1":"value (type: int), key (type: int)","2":"key (type: int), value (type: int)"} - | outputColumnNames:["_col0","_col1","_col5","_col6","_col10","_col11"] - | Statistics:Num rows: 6 Data size: 57 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_3] - | key expressions:key (type: int), value (type: int) - | Map-reduce partition columns:key (type: int), value (type: int) - | sort order:++ - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:a - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - |<-Map 3 [SIMPLE_EDGE] - | Reduce Output Operator [RS_4] - | key expressions:value (type: int), key (type: int) - | Map-reduce partition columns:value (type: int), key (type: int) - | sort order:++ - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_1] - | alias:b - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - |<-Map 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_5] - key expressions:key (type: int), value (type: int) - Map-reduce partition columns:key (type: int), value (type: int) - sort order:++ - Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_2] - alias:c - Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_8] + Select Operator [SEL_7] (rows=6 width=9) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Merge Join Operator [MERGEJOIN_9] (rows=6 width=9) + Output:["_col0","_col1","_col5","_col6","_col10","_col11"],keys:{"0":"key, value","1":"value, key","2":"key, value"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_3] + PartitionCols:key, value + TableScan [TS_0] (rows=3 width=8) + default@myinput1,a,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:value, key + TableScan [TS_1] (rows=3 width=8) + default@myinput1,b,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map 4 [SIMPLE_EDGE] + SHUFFLE [RS_5] + PartitionCols:key, value + TableScan [TS_2] (rows=3 width=8) + default@myinput1,c,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: explain select * FROM myinput1 a LEFT OUTER JOIN myinput1 b ON a.key<=>b.value PREHOOK: type: QUERY @@ -5747,42 +3709,25 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_6] - compressed:true - Statistics:Num rows: 3 Data size: 28 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 3 Data size: 28 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_7] - | condition map:[{"":"Left Outer Join0 to 1"}] - | keys:{"0":"key (type: int)","1":"value (type: int)"} - | outputColumnNames:["_col0","_col1","_col5","_col6"] - | Statistics:Num rows: 3 Data size: 28 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_2] - | key expressions:key (type: int) - | Map-reduce partition columns:key (type: int) - | sort order:+ - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - | value expressions:value (type: int) - | TableScan [TS_0] - | alias:a - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - key expressions:value (type: int) - Map-reduce partition columns:value (type: int) - sort order:+ - Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - value expressions:key (type: int) - TableScan [TS_1] - alias:b - Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_6] + Select Operator [SEL_5] (rows=3 width=9) + Output:["_col0","_col1","_col2","_col3"] + Merge Join Operator [MERGEJOIN_7] (rows=3 width=9) + Output:["_col0","_col1","_col5","_col6"],keys:{"0":"key","1":"value"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_2] + PartitionCols:key + TableScan [TS_0] (rows=3 width=8) + default@myinput1,a,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_3] + PartitionCols:value + TableScan [TS_1] (rows=3 width=8) + default@myinput1,b,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: explain select * FROM myinput1 a RIGHT OUTER JOIN myinput1 b ON a.key<=>b.value PREHOOK: type: QUERY @@ -5794,42 +3739,25 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_6] - compressed:true - Statistics:Num rows: 3 Data size: 28 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 3 Data size: 28 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_7] - | condition map:[{"":"Right Outer Join0 to 1"}] - | keys:{"0":"key (type: int)","1":"value (type: int)"} - | outputColumnNames:["_col0","_col1","_col5","_col6"] - | Statistics:Num rows: 3 Data size: 28 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_2] - | key expressions:key (type: int) - | Map-reduce partition columns:key (type: int) - | sort order:+ - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - | value expressions:value (type: int) - | TableScan [TS_0] - | alias:a - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - key expressions:value (type: int) - Map-reduce partition columns:value (type: int) - sort order:+ - Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - value expressions:key (type: int) - TableScan [TS_1] - alias:b - Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_6] + Select Operator [SEL_5] (rows=3 width=9) + Output:["_col0","_col1","_col2","_col3"] + Merge Join Operator [MERGEJOIN_7] (rows=3 width=9) + Output:["_col0","_col1","_col5","_col6"],keys:{"0":"key","1":"value"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_2] + PartitionCols:key + TableScan [TS_0] (rows=3 width=8) + default@myinput1,a,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_3] + PartitionCols:value + TableScan [TS_1] (rows=3 width=8) + default@myinput1,b,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: explain select * FROM myinput1 a FULL OUTER JOIN myinput1 b ON a.key<=>b.value PREHOOK: type: QUERY @@ -5841,42 +3769,25 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_6] - compressed:true - Statistics:Num rows: 3 Data size: 28 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 3 Data size: 28 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_7] - | condition map:[{"":"Outer Join 0 to 1"}] - | keys:{"0":"key (type: int)","1":"value (type: int)"} - | outputColumnNames:["_col0","_col1","_col5","_col6"] - | Statistics:Num rows: 3 Data size: 28 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_2] - | key expressions:key (type: int) - | Map-reduce partition columns:key (type: int) - | sort order:+ - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - | value expressions:value (type: int) - | TableScan [TS_0] - | alias:a - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - key expressions:value (type: int) - Map-reduce partition columns:value (type: int) - sort order:+ - Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - value expressions:key (type: int) - TableScan [TS_1] - alias:b - Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_6] + Select Operator [SEL_5] (rows=3 width=9) + Output:["_col0","_col1","_col2","_col3"] + Merge Join Operator [MERGEJOIN_7] (rows=3 width=9) + Output:["_col0","_col1","_col5","_col6"],keys:{"0":"key","1":"value"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_2] + PartitionCols:key + TableScan [TS_0] (rows=3 width=8) + default@myinput1,a,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_3] + PartitionCols:value + TableScan [TS_1] (rows=3 width=8) + default@myinput1,b,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: explain select /*+ MAPJOIN(b) */ * FROM myinput1 a JOIN myinput1 b ON a.key<=>b.value PREHOOK: type: QUERY @@ -5888,42 +3799,25 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_6] - compressed:true - Statistics:Num rows: 3 Data size: 28 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 3 Data size: 28 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_7] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"key (type: int)","1":"value (type: int)"} - | outputColumnNames:["_col0","_col1","_col5","_col6"] - | Statistics:Num rows: 3 Data size: 28 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_2] - | key expressions:key (type: int) - | Map-reduce partition columns:key (type: int) - | sort order:+ - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - | value expressions:value (type: int) - | TableScan [TS_0] - | alias:a - | Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - key expressions:value (type: int) - Map-reduce partition columns:value (type: int) - sort order:+ - Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE - value expressions:key (type: int) - TableScan [TS_1] - alias:b - Statistics:Num rows: 3 Data size: 26 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_6] + Select Operator [SEL_5] (rows=3 width=9) + Output:["_col0","_col1","_col2","_col3"] + Merge Join Operator [MERGEJOIN_7] (rows=3 width=9) + Output:["_col0","_col1","_col5","_col6"],keys:{"0":"key","1":"value"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_2] + PartitionCols:key + TableScan [TS_0] (rows=3 width=8) + default@myinput1,a,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_3] + PartitionCols:value + TableScan [TS_1] (rows=3 width=8) + default@myinput1,b,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: CREATE TABLE smb_input(key int, value int) PREHOOK: type: CREATETABLE @@ -6001,42 +3895,25 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_6] - compressed:true - Statistics:Num rows: 28 Data size: 209 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 28 Data size: 209 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_7] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"key (type: int)","1":"key (type: int)"} - | outputColumnNames:["_col0","_col1","_col5","_col6"] - | Statistics:Num rows: 28 Data size: 209 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_2] - | key expressions:key (type: int) - | Map-reduce partition columns:key (type: int) - | sort order:+ - | Statistics:Num rows: 26 Data size: 190 Basic stats: COMPLETE Column stats: NONE - | value expressions:value (type: int) - | TableScan [TS_0] - | alias:a - | Statistics:Num rows: 26 Data size: 190 Basic stats: COMPLETE Column stats: NONE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - key expressions:key (type: int) - Map-reduce partition columns:key (type: int) - sort order:+ - Statistics:Num rows: 26 Data size: 190 Basic stats: COMPLETE Column stats: NONE - value expressions:value (type: int) - TableScan [TS_1] - alias:b - Statistics:Num rows: 26 Data size: 190 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_6] + Select Operator [SEL_5] (rows=28 width=7) + Output:["_col0","_col1","_col2","_col3"] + Merge Join Operator [MERGEJOIN_7] (rows=28 width=7) + Output:["_col0","_col1","_col5","_col6"],keys:{"0":"key","1":"key"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_2] + PartitionCols:key + TableScan [TS_0] (rows=26 width=7) + default@smb_input1,a,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_3] + PartitionCols:key + TableScan [TS_1] (rows=26 width=7) + default@smb_input1,b,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: explain select /*+ MAPJOIN(a) */ * FROM smb_input1 a JOIN smb_input1 b ON a.key <=> b.key AND a.value <=> b.value PREHOOK: type: QUERY @@ -6048,40 +3925,25 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_6] - compressed:true - Statistics:Num rows: 28 Data size: 209 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 28 Data size: 209 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_7] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"key (type: int), value (type: int)","1":"key (type: int), value (type: int)"} - | outputColumnNames:["_col0","_col1","_col5","_col6"] - | Statistics:Num rows: 28 Data size: 209 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_2] - | key expressions:key (type: int), value (type: int) - | Map-reduce partition columns:key (type: int), value (type: int) - | sort order:++ - | Statistics:Num rows: 26 Data size: 190 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:a - | Statistics:Num rows: 26 Data size: 190 Basic stats: COMPLETE Column stats: NONE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - key expressions:key (type: int), value (type: int) - Map-reduce partition columns:key (type: int), value (type: int) - sort order:++ - Statistics:Num rows: 26 Data size: 190 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_1] - alias:b - Statistics:Num rows: 26 Data size: 190 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_6] + Select Operator [SEL_5] (rows=28 width=7) + Output:["_col0","_col1","_col2","_col3"] + Merge Join Operator [MERGEJOIN_7] (rows=28 width=7) + Output:["_col0","_col1","_col5","_col6"],keys:{"0":"key, value","1":"key, value"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_2] + PartitionCols:key, value + TableScan [TS_0] (rows=26 width=7) + default@smb_input1,a,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_3] + PartitionCols:key, value + TableScan [TS_1] (rows=26 width=7) + default@smb_input1,b,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: explain select /*+ MAPJOIN(a) */ * FROM smb_input1 a RIGHT OUTER JOIN smb_input1 b ON a.key <=> b.key PREHOOK: type: QUERY @@ -6093,42 +3955,25 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_6] - compressed:true - Statistics:Num rows: 28 Data size: 209 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 28 Data size: 209 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_7] - | condition map:[{"":"Right Outer Join0 to 1"}] - | keys:{"0":"key (type: int)","1":"key (type: int)"} - | outputColumnNames:["_col0","_col1","_col5","_col6"] - | Statistics:Num rows: 28 Data size: 209 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_2] - | key expressions:key (type: int) - | Map-reduce partition columns:key (type: int) - | sort order:+ - | Statistics:Num rows: 26 Data size: 190 Basic stats: COMPLETE Column stats: NONE - | value expressions:value (type: int) - | TableScan [TS_0] - | alias:a - | Statistics:Num rows: 26 Data size: 190 Basic stats: COMPLETE Column stats: NONE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - key expressions:key (type: int) - Map-reduce partition columns:key (type: int) - sort order:+ - Statistics:Num rows: 26 Data size: 190 Basic stats: COMPLETE Column stats: NONE - value expressions:value (type: int) - TableScan [TS_1] - alias:b - Statistics:Num rows: 26 Data size: 190 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_6] + Select Operator [SEL_5] (rows=28 width=7) + Output:["_col0","_col1","_col2","_col3"] + Merge Join Operator [MERGEJOIN_7] (rows=28 width=7) + Output:["_col0","_col1","_col5","_col6"],keys:{"0":"key","1":"key"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_2] + PartitionCols:key + TableScan [TS_0] (rows=26 width=7) + default@smb_input1,a,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_3] + PartitionCols:key + TableScan [TS_1] (rows=26 width=7) + default@smb_input1,b,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: explain select /*+ MAPJOIN(b) */ * FROM smb_input1 a JOIN smb_input1 b ON a.key <=> b.key PREHOOK: type: QUERY @@ -6140,42 +3985,25 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_6] - compressed:true - Statistics:Num rows: 28 Data size: 209 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 28 Data size: 209 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_7] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"key (type: int)","1":"key (type: int)"} - | outputColumnNames:["_col0","_col1","_col5","_col6"] - | Statistics:Num rows: 28 Data size: 209 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_2] - | key expressions:key (type: int) - | Map-reduce partition columns:key (type: int) - | sort order:+ - | Statistics:Num rows: 26 Data size: 190 Basic stats: COMPLETE Column stats: NONE - | value expressions:value (type: int) - | TableScan [TS_0] - | alias:a - | Statistics:Num rows: 26 Data size: 190 Basic stats: COMPLETE Column stats: NONE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - key expressions:key (type: int) - Map-reduce partition columns:key (type: int) - sort order:+ - Statistics:Num rows: 26 Data size: 190 Basic stats: COMPLETE Column stats: NONE - value expressions:value (type: int) - TableScan [TS_1] - alias:b - Statistics:Num rows: 26 Data size: 190 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_6] + Select Operator [SEL_5] (rows=28 width=7) + Output:["_col0","_col1","_col2","_col3"] + Merge Join Operator [MERGEJOIN_7] (rows=28 width=7) + Output:["_col0","_col1","_col5","_col6"],keys:{"0":"key","1":"key"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_2] + PartitionCols:key + TableScan [TS_0] (rows=26 width=7) + default@smb_input1,a,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_3] + PartitionCols:key + TableScan [TS_1] (rows=26 width=7) + default@smb_input1,b,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: explain select /*+ MAPJOIN(b) */ * FROM smb_input1 a LEFT OUTER JOIN smb_input1 b ON a.key <=> b.key PREHOOK: type: QUERY @@ -6187,42 +4015,25 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_6] - compressed:true - Statistics:Num rows: 28 Data size: 209 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 28 Data size: 209 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_7] - | condition map:[{"":"Left Outer Join0 to 1"}] - | keys:{"0":"key (type: int)","1":"key (type: int)"} - | outputColumnNames:["_col0","_col1","_col5","_col6"] - | Statistics:Num rows: 28 Data size: 209 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_2] - | key expressions:key (type: int) - | Map-reduce partition columns:key (type: int) - | sort order:+ - | Statistics:Num rows: 26 Data size: 190 Basic stats: COMPLETE Column stats: NONE - | value expressions:value (type: int) - | TableScan [TS_0] - | alias:a - | Statistics:Num rows: 26 Data size: 190 Basic stats: COMPLETE Column stats: NONE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - key expressions:key (type: int) - Map-reduce partition columns:key (type: int) - sort order:+ - Statistics:Num rows: 26 Data size: 190 Basic stats: COMPLETE Column stats: NONE - value expressions:value (type: int) - TableScan [TS_1] - alias:b - Statistics:Num rows: 26 Data size: 190 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_6] + Select Operator [SEL_5] (rows=28 width=7) + Output:["_col0","_col1","_col2","_col3"] + Merge Join Operator [MERGEJOIN_7] (rows=28 width=7) + Output:["_col0","_col1","_col5","_col6"],keys:{"0":"key","1":"key"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_2] + PartitionCols:key + TableScan [TS_0] (rows=26 width=7) + default@smb_input1,a,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_3] + PartitionCols:key + TableScan [TS_1] (rows=26 width=7) + default@smb_input1,b,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: drop table sales PREHOOK: type: DROPTABLE @@ -6288,54 +4099,33 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_12] - compressed:true - Statistics:Num rows: 2 Data size: 13 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Merge Join Operator [MERGEJOIN_17] - | condition map:[{"":"Left Semi Join 0 to 1"}] - | keys:{"0":"_col1 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 2 Data size: 13 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_8] - | key expressions:_col1 (type: int) - | Map-reduce partition columns:_col1 (type: int) - | sort order:+ - | Statistics:Num rows: 1 Data size: 13 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: string) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 13 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_15] - | predicate:id is not null (type: boolean) - | Statistics:Num rows: 1 Data size: 13 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:sales - | Statistics:Num rows: 1 Data size: 13 Basic stats: COMPLETE Column stats: NONE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_9] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 2 Data size: 12 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_7] - keys:_col0 (type: int) - outputColumnNames:["_col0"] - Statistics:Num rows: 2 Data size: 12 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 2 Data size: 12 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_16] - predicate:id is not null (type: boolean) - Statistics:Num rows: 2 Data size: 12 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:things - Statistics:Num rows: 2 Data size: 12 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_12] + Merge Join Operator [MERGEJOIN_17] (rows=2 width=6) + Output:["_col0","_col1"],keys:{"0":"_col1","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_8] + PartitionCols:_col1 + Select Operator [SEL_2] (rows=1 width=13) + Output:["_col0","_col1"] + Filter Operator [FIL_15] (rows=1 width=13) + predicate:id is not null + TableScan [TS_0] (rows=1 width=13) + default@sales,sales,Tbl:COMPLETE,Col:NONE,Output:["name","id"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col0 + Group By Operator [GBY_7] (rows=2 width=6) + Output:["_col0"],keys:_col0 + Select Operator [SEL_5] (rows=2 width=6) + Output:["_col0"] + Filter Operator [FIL_16] (rows=2 width=6) + predicate:id is not null + TableScan [TS_3] (rows=2 width=6) + default@things,things,Tbl:COMPLETE,Col:NONE,Output:["id"] PREHOOK: query: drop table sales PREHOOK: type: DROPTABLE @@ -6364,71 +4154,42 @@ Map 1 <- Map 3 (BROADCAST_EDGE) Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_16] - compressed:true - Statistics:Num rows: 555 Data size: 48285 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Merge Join Operator [MERGEJOIN_26] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col0"] - | Statistics:Num rows: 555 Data size: 48285 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_12] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 241 Data size: 42898 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col0 (type: string) - | Map Join Operator [MAPJOIN_25] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | HybridGraceHashJoin:true - | | keys:{"Map 1":"_col0 (type: string)","Map 3":"_col0 (type: string)"} - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 241 Data size: 42898 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Map 3 [BROADCAST_EDGE] - | | Reduce Output Operator [RS_10] - | | key expressions:_col0 (type: string) - | | Map-reduce partition columns:_col0 (type: string) - | | sort order:+ - | | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | | Select Operator [SEL_5] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | | Filter Operator [FIL_23] - | | predicate:key is not null (type: boolean) - | | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | | TableScan [TS_3] - | | alias:src1 - | | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 666 Data size: 118548 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_22] - | predicate:((value > 'val_450') and key is not null) (type: boolean) - | Statistics:Num rows: 666 Data size: 118548 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:srcpart - | Statistics:Num rows: 2000 Data size: 356000 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_13] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_8] - outputColumnNames:["_col0"] - Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_24] - predicate:(value > 'val_450') (type: boolean) - Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_6] - alias:src - Statistics:Num rows: 500 Data size: 45500 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_16] + Merge Join Operator [MERGEJOIN_26] (rows=555 width=87) + Output:["_col0"],keys:{"0":"_col1","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col1 + Map Join Operator [MAPJOIN_25] (rows=241 width=178) + HybridGraceHashJoin:true,Output:["_col0","_col1"],keys:{"SEL_2":"_col0","RS_10":"_col0"} + <-Map 3 [BROADCAST_EDGE] + BROADCAST [RS_10] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=25 width=86) + Output:["_col0"] + Filter Operator [FIL_23] (rows=25 width=86) + predicate:key is not null + TableScan [TS_3] (rows=25 width=86) + default@src1,src1,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] + <-Select Operator [SEL_2] (rows=666 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_22] (rows=666 width=178) + predicate:((value > 'val_450') and key is not null) + TableScan [TS_0] (rows=2000 width=178) + default@srcpart,srcpart,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] + <-Map 4 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=166 width=91) + Output:["_col0"] + Filter Operator [FIL_24] (rows=166 width=91) + predicate:(value > 'val_450') + TableScan [TS_6] (rows=500 width=91) + default@src,src,Tbl:COMPLETE,Col:COMPLETE,Output:["value"] PREHOOK: query: explain select srcpart.key from srcpart join src on (srcpart.value=src.value) join src1 on (srcpart.key=src1.key) where srcpart.value > 'val_450' PREHOOK: type: QUERY @@ -6441,71 +4202,42 @@ Map 1 <- Map 3 (BROADCAST_EDGE) Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_16] - compressed:true - Statistics:Num rows: 555 Data size: 48285 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Merge Join Operator [MERGEJOIN_26] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col0"] - | Statistics:Num rows: 555 Data size: 48285 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_12] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 241 Data size: 42898 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col0 (type: string) - | Map Join Operator [MAPJOIN_25] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | HybridGraceHashJoin:true - | | keys:{"Map 1":"_col0 (type: string)","Map 3":"_col0 (type: string)"} - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 241 Data size: 42898 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Map 3 [BROADCAST_EDGE] - | | Reduce Output Operator [RS_10] - | | key expressions:_col0 (type: string) - | | Map-reduce partition columns:_col0 (type: string) - | | sort order:+ - | | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | | Select Operator [SEL_5] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | | Filter Operator [FIL_23] - | | predicate:key is not null (type: boolean) - | | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | | TableScan [TS_3] - | | alias:src1 - | | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 666 Data size: 118548 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_22] - | predicate:((value > 'val_450') and key is not null) (type: boolean) - | Statistics:Num rows: 666 Data size: 118548 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:srcpart - | Statistics:Num rows: 2000 Data size: 356000 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_13] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_8] - outputColumnNames:["_col0"] - Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_24] - predicate:(value > 'val_450') (type: boolean) - Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_6] - alias:src - Statistics:Num rows: 500 Data size: 45500 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_16] + Merge Join Operator [MERGEJOIN_26] (rows=555 width=87) + Output:["_col0"],keys:{"0":"_col1","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col1 + Map Join Operator [MAPJOIN_25] (rows=241 width=178) + HybridGraceHashJoin:true,Output:["_col0","_col1"],keys:{"SEL_2":"_col0","RS_10":"_col0"} + <-Map 3 [BROADCAST_EDGE] + BROADCAST [RS_10] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=25 width=86) + Output:["_col0"] + Filter Operator [FIL_23] (rows=25 width=86) + predicate:key is not null + TableScan [TS_3] (rows=25 width=86) + default@src1,src1,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] + <-Select Operator [SEL_2] (rows=666 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_22] (rows=666 width=178) + predicate:((value > 'val_450') and key is not null) + TableScan [TS_0] (rows=2000 width=178) + default@srcpart,srcpart,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] + <-Map 4 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=166 width=91) + Output:["_col0"] + Filter Operator [FIL_24] (rows=166 width=91) + predicate:(value > 'val_450') + TableScan [TS_6] (rows=500 width=91) + default@src,src,Tbl:COMPLETE,Col:COMPLETE,Output:["value"] PREHOOK: query: explain select srcpart.key from srcpart join src on (srcpart.value=src.value) join src1 on (srcpart.key=src1.key) where srcpart.value > 'val_450' PREHOOK: type: QUERY @@ -6518,71 +4250,42 @@ Map 1 <- Map 3 (BROADCAST_EDGE) Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_16] - compressed:true - Statistics:Num rows: 555 Data size: 48285 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Merge Join Operator [MERGEJOIN_26] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col0"] - | Statistics:Num rows: 555 Data size: 48285 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_12] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 241 Data size: 42898 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col0 (type: string) - | Map Join Operator [MAPJOIN_25] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | HybridGraceHashJoin:true - | | keys:{"Map 1":"_col0 (type: string)","Map 3":"_col0 (type: string)"} - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 241 Data size: 42898 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Map 3 [BROADCAST_EDGE] - | | Reduce Output Operator [RS_10] - | | key expressions:_col0 (type: string) - | | Map-reduce partition columns:_col0 (type: string) - | | sort order:+ - | | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | | Select Operator [SEL_5] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | | Filter Operator [FIL_23] - | | predicate:key is not null (type: boolean) - | | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | | TableScan [TS_3] - | | alias:src1 - | | Statistics:Num rows: 25 Data size: 2150 Basic stats: COMPLETE Column stats: COMPLETE - | |<-Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 666 Data size: 118548 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_22] - | predicate:((value > 'val_450') and key is not null) (type: boolean) - | Statistics:Num rows: 666 Data size: 118548 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:srcpart - | Statistics:Num rows: 2000 Data size: 356000 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_13] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_8] - outputColumnNames:["_col0"] - Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_24] - predicate:(value > 'val_450') (type: boolean) - Statistics:Num rows: 166 Data size: 15106 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_6] - alias:src - Statistics:Num rows: 500 Data size: 45500 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_16] + Merge Join Operator [MERGEJOIN_26] (rows=555 width=87) + Output:["_col0"],keys:{"0":"_col1","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col1 + Map Join Operator [MAPJOIN_25] (rows=241 width=178) + HybridGraceHashJoin:true,Output:["_col0","_col1"],keys:{"SEL_2":"_col0","RS_10":"_col0"} + <-Map 3 [BROADCAST_EDGE] + BROADCAST [RS_10] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=25 width=86) + Output:["_col0"] + Filter Operator [FIL_23] (rows=25 width=86) + predicate:key is not null + TableScan [TS_3] (rows=25 width=86) + default@src1,src1,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] + <-Select Operator [SEL_2] (rows=666 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_22] (rows=666 width=178) + predicate:((value > 'val_450') and key is not null) + TableScan [TS_0] (rows=2000 width=178) + default@srcpart,srcpart,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] + <-Map 4 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=166 width=91) + Output:["_col0"] + Filter Operator [FIL_24] (rows=166 width=91) + predicate:(value > 'val_450') + TableScan [TS_6] (rows=500 width=91) + default@src,src,Tbl:COMPLETE,Col:COMPLETE,Output:["value"] PREHOOK: query: explain select p_mfgr, p_name, p_size, @@ -6611,46 +4314,29 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 3 - File Output Operator [FS_9] - compressed:true - Statistics:Num rows: 26 Data size: 6214 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_7] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 26 Data size: 6214 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_6] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col2"}] - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_5] - | outputColumnNames:["_col1","_col2","_col5","_col7"] - | Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_4] - key expressions:_col2 (type: string), _col1 (type: string) - Map-reduce partition columns:_col2 (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col5 (type: int), _col7 (type: double) - PTF Operator [PTF_3] - Function definitions:[{"Input definition":{"type:":"TABLE"}},{"Partition table definition":{"name:":"noop","order by:":"_col1","partition by:":"_col2"}}] - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_2] - | outputColumnNames:["_col1","_col2","_col5","_col7"] - | Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_1] - key expressions:p_mfgr (type: string), p_name (type: string) - Map-reduce partition columns:p_mfgr (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 6006 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:p_size (type: int), p_retailprice (type: double) - TableScan [TS_0] - alias:part - Statistics:Num rows: 26 Data size: 6006 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 3 + File Output Operator [FS_9] + Select Operator [SEL_7] (rows=26 width=239) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + PTF Operator [PTF_6] (rows=26 width=499) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col2"}] + Select Operator [SEL_5] (rows=26 width=499) + Output:["_col1","_col2","_col5","_col7"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:_col2 + PTF Operator [PTF_3] (rows=26 width=499) + Function definitions:[{},{"Partition table definition":{"name:":"noop","order by:":"_col1","partition by:":"_col2"}}] + Select Operator [SEL_2] (rows=26 width=499) + Output:["_col1","_col2","_col5","_col7"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_1] + PartitionCols:p_mfgr + TableScan [TS_0] (rows=26 width=231) + default@part,part,Tbl:COMPLETE,Col:COMPLETE,Output:["p_mfgr","p_name","p_retailprice","p_size"] PREHOOK: query: explain select p_mfgr, p_name, @@ -6674,67 +4360,40 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 3 - File Output Operator [FS_16] - compressed:true - Statistics:Num rows: 29 Data size: 6583 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_14] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 29 Data size: 6583 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_13] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col2"}] - Statistics:Num rows: 29 Data size: 6467 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_12] - | outputColumnNames:["_col1","_col2","_col5"] - | Statistics:Num rows: 29 Data size: 6467 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_11] - key expressions:_col2 (type: string), _col1 (type: string) - Map-reduce partition columns:_col2 (type: string) - sort order:++ - Statistics:Num rows: 29 Data size: 6467 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col5 (type: int) - PTF Operator [PTF_10] - Function definitions:[{"Input definition":{"type:":"SUBQUERY"}},{"Partition table definition":{"name:":"noop","order by:":"_col1","partition by:":"_col2"}}] - Statistics:Num rows: 29 Data size: 6467 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_9] - | outputColumnNames:["_col1","_col2","_col5"] - | Statistics:Num rows: 29 Data size: 6467 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_8] - key expressions:_col2 (type: string), _col1 (type: string) - Map-reduce partition columns:_col2 (type: string) - sort order:++ - Statistics:Num rows: 29 Data size: 6467 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col5 (type: int) - Map Join Operator [MAPJOIN_21] - | condition map:[{"":"Inner Join 0 to 1"}] - | HybridGraceHashJoin:true - | keys:{"Map 1":"p_partkey (type: int)","Map 4":"p_partkey (type: int)"} - | outputColumnNames:["_col1","_col2","_col5"] - | Statistics:Num rows: 29 Data size: 6467 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 4 [BROADCAST_EDGE] - | Reduce Output Operator [RS_5] - | key expressions:p_partkey (type: int) - | Map-reduce partition columns:p_partkey (type: int) - | sort order:+ - | Statistics:Num rows: 26 Data size: 104 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_20] - | predicate:p_partkey is not null (type: boolean) - | Statistics:Num rows: 26 Data size: 104 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_1] - | alias:p2 - | Statistics:Num rows: 26 Data size: 104 Basic stats: COMPLETE Column stats: COMPLETE - |<-Filter Operator [FIL_19] - predicate:p_partkey is not null (type: boolean) - Statistics:Num rows: 26 Data size: 5902 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_0] - alias:p1 - Statistics:Num rows: 26 Data size: 5902 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 3 + File Output Operator [FS_16] + Select Operator [SEL_14] (rows=29 width=227) + Output:["_col0","_col1","_col2","_col3"] + PTF Operator [PTF_13] (rows=29 width=223) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col2"}] + Select Operator [SEL_12] (rows=29 width=223) + Output:["_col1","_col2","_col5"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_11] + PartitionCols:_col2 + PTF Operator [PTF_10] (rows=29 width=223) + Function definitions:[{},{"Partition table definition":{"name:":"noop","order by:":"_col1","partition by:":"_col2"}}] + Select Operator [SEL_9] (rows=29 width=223) + Output:["_col1","_col2","_col5"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_8] + PartitionCols:_col2 + Map Join Operator [MAPJOIN_21] (rows=29 width=223) + HybridGraceHashJoin:true,Output:["_col1","_col2","_col5"],keys:{"FIL_19":"p_partkey","RS_5":"p_partkey"} + <-Map 4 [BROADCAST_EDGE] + BROADCAST [RS_5] + PartitionCols:p_partkey + Filter Operator [FIL_20] (rows=26 width=4) + predicate:p_partkey is not null + TableScan [TS_1] (rows=26 width=4) + default@part,p2,Tbl:COMPLETE,Col:COMPLETE,Output:["p_partkey"] + <-Filter Operator [FIL_19] (rows=26 width=227) + predicate:p_partkey is not null + TableScan [TS_0] (rows=26 width=227) + default@part,p1,Tbl:COMPLETE,Col:COMPLETE,Output:["p_partkey","p_name","p_mfgr","p_size"] PREHOOK: query: explain select p_mfgr, p_name, p_size, @@ -6763,46 +4422,29 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 3 - File Output Operator [FS_9] - compressed:true - Statistics:Num rows: 26 Data size: 6214 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_7] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 26 Data size: 6214 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_6] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col2"}] - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_5] - | outputColumnNames:["_col1","_col2","_col5","_col7"] - | Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_4] - key expressions:_col2 (type: string), _col1 (type: string) - Map-reduce partition columns:_col2 (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col5 (type: int), _col7 (type: double) - PTF Operator [PTF_3] - Function definitions:[{"Input definition":{"type:":"TABLE"}},{"Partition table definition":{"name:":"noop","order by:":"_col1","partition by:":"_col2"}}] - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_2] - | outputColumnNames:["_col1","_col2","_col5","_col7"] - | Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_1] - key expressions:p_mfgr (type: string), p_name (type: string) - Map-reduce partition columns:p_mfgr (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 6006 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:p_size (type: int), p_retailprice (type: double) - TableScan [TS_0] - alias:part - Statistics:Num rows: 26 Data size: 6006 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 3 + File Output Operator [FS_9] + Select Operator [SEL_7] (rows=26 width=239) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + PTF Operator [PTF_6] (rows=26 width=499) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col2"}] + Select Operator [SEL_5] (rows=26 width=499) + Output:["_col1","_col2","_col5","_col7"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:_col2 + PTF Operator [PTF_3] (rows=26 width=499) + Function definitions:[{},{"Partition table definition":{"name:":"noop","order by:":"_col1","partition by:":"_col2"}}] + Select Operator [SEL_2] (rows=26 width=499) + Output:["_col1","_col2","_col5","_col7"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_1] + PartitionCols:p_mfgr + TableScan [TS_0] (rows=26 width=231) + default@part,part,Tbl:COMPLETE,Col:COMPLETE,Output:["p_mfgr","p_name","p_retailprice","p_size"] PREHOOK: query: explain select p_mfgr, p_name, p_size, @@ -6831,46 +4473,29 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 3 - File Output Operator [FS_9] - compressed:true - Statistics:Num rows: 26 Data size: 6214 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_7] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - Statistics:Num rows: 26 Data size: 6214 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_6] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col2"}] - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_5] - | outputColumnNames:["_col1","_col2","_col5"] - | Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_4] - key expressions:_col2 (type: string), _col1 (type: string) - Map-reduce partition columns:_col2 (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col5 (type: int) - PTF Operator [PTF_3] - Function definitions:[{"Input definition":{"type:":"TABLE"}},{"Partition table definition":{"name:":"noop","order by:":"_col1","partition by:":"_col2"}}] - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_2] - | outputColumnNames:["_col1","_col2","_col5"] - | Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_1] - key expressions:p_mfgr (type: string), p_name (type: string) - Map-reduce partition columns:p_mfgr (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:p_size (type: int) - TableScan [TS_0] - alias:part - Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 3 + File Output Operator [FS_9] + Select Operator [SEL_7] (rows=26 width=239) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + PTF Operator [PTF_6] (rows=26 width=491) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col2"}] + Select Operator [SEL_5] (rows=26 width=491) + Output:["_col1","_col2","_col5"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:_col2 + PTF Operator [PTF_3] (rows=26 width=491) + Function definitions:[{},{"Partition table definition":{"name:":"noop","order by:":"_col1","partition by:":"_col2"}}] + Select Operator [SEL_2] (rows=26 width=491) + Output:["_col1","_col2","_col5"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_1] + PartitionCols:p_mfgr + TableScan [TS_0] (rows=26 width=223) + default@part,part,Tbl:COMPLETE,Col:COMPLETE,Output:["p_mfgr","p_name","p_size"] PREHOOK: query: explain select p_mfgr, p_name, p_size, @@ -6902,59 +4527,36 @@ Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 4 - File Output Operator [FS_14] - compressed:true - Statistics:Num rows: 26 Data size: 6214 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_12] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] - Statistics:Num rows: 26 Data size: 6214 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_11] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col0"}] - Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_8] - | keys:KEY._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: int) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_7] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: int) - Map-reduce partition columns:_col0 (type: string) - sort order:+++ - Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_6] - | keys:KEY._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: int) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_5] - key expressions:_col2 (type: string), _col1 (type: string), _col5 (type: int) - Map-reduce partition columns:rand() (type: double) - sort order:+++ - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_4] - outputColumnNames:["_col1","_col2","_col5"] - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_3] - Function definitions:[{"Input definition":{"type:":"TABLE"}},{"Partition table definition":{"name:":"noop","order by:":"_col1","partition by:":"_col2"}}] - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_2] - | outputColumnNames:["_col1","_col2","_col5"] - | Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_1] - key expressions:p_mfgr (type: string), p_name (type: string) - Map-reduce partition columns:p_mfgr (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:p_size (type: int) - TableScan [TS_0] - alias:part - Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 4 + File Output Operator [FS_14] + Select Operator [SEL_12] (rows=26 width=239) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6"] + PTF Operator [PTF_11] (rows=26 width=223) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col0"}] + Group By Operator [GBY_8] (rows=26 width=223) + Output:["_col0","_col1","_col2"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_7] + PartitionCols:_col0 + Group By Operator [GBY_6] (rows=26 width=223) + Output:["_col0","_col1","_col2"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_5] + PartitionCols:rand() + Select Operator [SEL_4] (rows=26 width=491) + Output:["_col1","_col2","_col5"] + PTF Operator [PTF_3] (rows=26 width=491) + Function definitions:[{},{"Partition table definition":{"name:":"noop","order by:":"_col1","partition by:":"_col2"}}] + Select Operator [SEL_2] (rows=26 width=491) + Output:["_col1","_col2","_col5"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_1] + PartitionCols:p_mfgr + TableScan [TS_0] (rows=26 width=223) + default@part,part,Tbl:COMPLETE,Col:COMPLETE,Output:["p_mfgr","p_name","p_size"] PREHOOK: query: explain select abc.* @@ -6976,51 +4578,31 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (BROADCAST_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_11] - compressed:true - Statistics:Num rows: 29 Data size: 17951 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Map Join Operator [MAPJOIN_16] - | condition map:[{"":"Inner Join 0 to 1"}] - | HybridGraceHashJoin:true - | keys:{"Reducer 2":"_col0 (type: int)","Map 3":"p_partkey (type: int)"} - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] - | Statistics:Num rows: 29 Data size: 17951 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 3 [BROADCAST_EDGE] - | Reduce Output Operator [RS_8] - | key expressions:p_partkey (type: int) - | Map-reduce partition columns:p_partkey (type: int) - | sort order:+ - | Statistics:Num rows: 26 Data size: 104 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_15] - | predicate:p_partkey is not null (type: boolean) - | Statistics:Num rows: 26 Data size: 104 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_1] - | alias:p1 - | Statistics:Num rows: 26 Data size: 104 Basic stats: COMPLETE Column stats: COMPLETE - |<-Filter Operator [FIL_14] - predicate:_col0 is not null (type: boolean) - Statistics:Num rows: 26 Data size: 23062 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_4] - Function definitions:[{"Input definition":{"type:":"TABLE"}},{"Partition table definition":{"name:":"noop","order by:":"_col1","partition by:":"_col2"}}] - Statistics:Num rows: 26 Data size: 23062 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_3] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] - | Statistics:Num rows: 26 Data size: 23062 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_2] - key expressions:p_mfgr (type: string), p_name (type: string) - Map-reduce partition columns:p_mfgr (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 16094 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:p_partkey (type: int), p_brand (type: string), p_type (type: string), p_size (type: int), p_container (type: string), p_retailprice (type: double), p_comment (type: string) - TableScan [TS_0] - alias:part - Statistics:Num rows: 26 Data size: 16094 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_11] + Map Join Operator [MAPJOIN_16] (rows=29 width=619) + HybridGraceHashJoin:true,Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"],keys:{"FIL_14":"_col0","RS_8":"p_partkey"} + <-Map 3 [BROADCAST_EDGE] + BROADCAST [RS_8] + PartitionCols:p_partkey + Filter Operator [FIL_15] (rows=26 width=4) + predicate:p_partkey is not null + TableScan [TS_1] (rows=26 width=4) + default@part,p1,Tbl:COMPLETE,Col:COMPLETE,Output:["p_partkey"] + <-Filter Operator [FIL_14] (rows=26 width=887) + predicate:_col0 is not null + PTF Operator [PTF_4] (rows=26 width=887) + Function definitions:[{},{"Partition table definition":{"name:":"noop","order by:":"_col1","partition by:":"_col2"}}] + Select Operator [SEL_3] (rows=26 width=887) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_2] + PartitionCols:p_mfgr + TableScan [TS_0] (rows=26 width=619) + default@part,part,Tbl:COMPLETE,Col:COMPLETE,Output:["p_brand","p_comment","p_container","p_mfgr","p_name","p_partkey","p_retailprice","p_size","p_type"] PREHOOK: query: explain select p_mfgr, p_name, p_size, @@ -7043,47 +4625,31 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 3 - File Output Operator [FS_10] - compressed:true - Statistics:Num rows: 26 Data size: 5902 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_8] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 26 Data size: 5902 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_7] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col1, _col5(DESC)","partition by:":"_col2"}] - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_6] - | outputColumnNames:["_col1","_col2","_col5"] - | Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_5] - key expressions:_col2 (type: string), _col1 (type: string), _col5 (type: int) - Map-reduce partition columns:_col2 (type: string) - sort order:++- - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_4] - Function definitions:[{"Input definition":{"type:":"TABLE"}},{"Partition table definition":{"name:":"noopwithmap","order by:":"_col1, _col5(DESC)","partition by:":"_col2"}}] - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_3] - | outputColumnNames:["_col1","_col2","_col5"] - | Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_2] - key expressions:p_mfgr (type: string), p_name (type: string), p_size (type: int) - Map-reduce partition columns:p_mfgr (type: string) - sort order:++- - Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_1] - Function definitions:[{"Input definition":{"type:":"TABLE"}},{"Partition table definition":{"name:":"noopwithmap","order by:":"p_name, p_size(DESC)","partition by:":"p_mfgr"}}] - Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_0] - alias:part - Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 3 + File Output Operator [FS_10] + Select Operator [SEL_8] (rows=26 width=227) + Output:["_col0","_col1","_col2","_col3"] + PTF Operator [PTF_7] (rows=26 width=491) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col1, _col5(DESC)","partition by:":"_col2"}] + Select Operator [SEL_6] (rows=26 width=491) + Output:["_col1","_col2","_col5"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_5] + PartitionCols:_col2 + PTF Operator [PTF_4] (rows=26 width=491) + Function definitions:[{},{"Partition table definition":{"name:":"noopwithmap","order by:":"_col1, _col5(DESC)","partition by:":"_col2"}}] + Select Operator [SEL_3] (rows=26 width=491) + Output:["_col1","_col2","_col5"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_2] + PartitionCols:p_mfgr + PTF Operator [PTF_1] (rows=26 width=223) + Function definitions:[{},{"Partition table definition":{"name:":"noopwithmap","order by:":"p_name, p_size(DESC)","partition by:":"p_mfgr"}}] + TableScan [TS_0] (rows=26 width=223) + default@part,part,Tbl:COMPLETE,Col:COMPLETE,Output:["p_name","p_mfgr","p_size"] PREHOOK: query: explain select p_mfgr, p_name, p_size, @@ -7110,49 +4676,31 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 3 - File Output Operator [FS_10] - compressed:true - Statistics:Num rows: 26 Data size: 6214 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_8] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 26 Data size: 6214 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_7] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col2"}] - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_6] - | outputColumnNames:["_col1","_col2","_col5","_col7"] - | Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_5] - key expressions:_col2 (type: string), _col1 (type: string) - Map-reduce partition columns:_col2 (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col5 (type: int), _col7 (type: double) - PTF Operator [PTF_4] - Function definitions:[{"Input definition":{"type:":"TABLE"}},{"Partition table definition":{"name:":"noopwithmap","order by:":"_col1","partition by:":"_col2"}}] - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_3] - | outputColumnNames:["_col1","_col2","_col5","_col7"] - | Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_2] - key expressions:p_mfgr (type: string), p_name (type: string) - Map-reduce partition columns:p_mfgr (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 6006 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:p_size (type: int), p_retailprice (type: double) - PTF Operator [PTF_1] - Function definitions:[{"Input definition":{"type:":"TABLE"}},{"Partition table definition":{"name:":"noopwithmap","order by:":"p_name","partition by:":"p_mfgr"}}] - Statistics:Num rows: 26 Data size: 6006 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_0] - alias:part - Statistics:Num rows: 26 Data size: 6006 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 3 + File Output Operator [FS_10] + Select Operator [SEL_8] (rows=26 width=239) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + PTF Operator [PTF_7] (rows=26 width=499) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col2"}] + Select Operator [SEL_6] (rows=26 width=499) + Output:["_col1","_col2","_col5","_col7"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_5] + PartitionCols:_col2 + PTF Operator [PTF_4] (rows=26 width=499) + Function definitions:[{},{"Partition table definition":{"name:":"noopwithmap","order by:":"_col1","partition by:":"_col2"}}] + Select Operator [SEL_3] (rows=26 width=499) + Output:["_col1","_col2","_col5","_col7"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_2] + PartitionCols:p_mfgr + PTF Operator [PTF_1] (rows=26 width=231) + Function definitions:[{},{"Partition table definition":{"name:":"noopwithmap","order by:":"p_name","partition by:":"p_mfgr"}}] + TableScan [TS_0] (rows=26 width=231) + default@part,part,Tbl:COMPLETE,Col:COMPLETE,Output:["p_name","p_mfgr","p_size","p_retailprice"] PREHOOK: query: explain select p_mfgr, p_name, p_size, @@ -7179,46 +4727,29 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 3 - File Output Operator [FS_9] - compressed:true - Statistics:Num rows: 26 Data size: 6214 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_7] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 26 Data size: 6214 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_6] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col2"}] - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_5] - | outputColumnNames:["_col1","_col2","_col5","_col7"] - | Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_4] - key expressions:_col2 (type: string), _col1 (type: string) - Map-reduce partition columns:_col2 (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col5 (type: int), _col7 (type: double) - PTF Operator [PTF_3] - Function definitions:[{"Input definition":{"type:":"TABLE"}},{"Partition table definition":{"name:":"noop","order by:":"_col1","partition by:":"_col2"}}] - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_2] - | outputColumnNames:["_col1","_col2","_col5","_col7"] - | Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_1] - key expressions:p_mfgr (type: string), p_name (type: string) - Map-reduce partition columns:p_mfgr (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 6006 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:p_size (type: int), p_retailprice (type: double) - TableScan [TS_0] - alias:part - Statistics:Num rows: 26 Data size: 6006 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 3 + File Output Operator [FS_9] + Select Operator [SEL_7] (rows=26 width=239) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + PTF Operator [PTF_6] (rows=26 width=499) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col2"}] + Select Operator [SEL_5] (rows=26 width=499) + Output:["_col1","_col2","_col5","_col7"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:_col2 + PTF Operator [PTF_3] (rows=26 width=499) + Function definitions:[{},{"Partition table definition":{"name:":"noop","order by:":"_col1","partition by:":"_col2"}}] + Select Operator [SEL_2] (rows=26 width=499) + Output:["_col1","_col2","_col5","_col7"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_1] + PartitionCols:p_mfgr + TableScan [TS_0] (rows=26 width=231) + default@part,part,Tbl:COMPLETE,Col:COMPLETE,Output:["p_mfgr","p_name","p_retailprice","p_size"] PREHOOK: query: explain select p_mfgr, p_name, p_size, @@ -7248,62 +4779,38 @@ Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 4 - File Output Operator [FS_13] - compressed:true - Statistics:Num rows: 26 Data size: 6214 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_11] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 26 Data size: 6214 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_10] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col2"}] - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_9] - | outputColumnNames:["_col1","_col2","_col5","_col7"] - | Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_8] - key expressions:_col2 (type: string), _col1 (type: string) - Map-reduce partition columns:_col2 (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col5 (type: int), _col7 (type: double) - PTF Operator [PTF_7] - Function definitions:[{"Input definition":{"type:":"PTFCOMPONENT"}},{"Partition table definition":{"name:":"noopwithmap","order by:":"_col2(DESC), _col1","partition by:":"_col2"}},{"Partition table definition":{"name:":"noop","order by:":"_col2(DESC), _col1","partition by:":"_col2"}}] - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_6] - | outputColumnNames:["_col1","_col2","_col5","_col7"] - | Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_5] - key expressions:_col2 (type: string), _col1 (type: string) - Map-reduce partition columns:_col2 (type: string) - sort order:-+ - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col5 (type: int), _col7 (type: double) - PTF Operator [PTF_4] - Function definitions:[{"Input definition":{"type:":"PTFCOMPONENT"}},{"Partition table definition":{"name:":"noopwithmap","order by:":"_col2(DESC), _col1","partition by:":"_col2"}},{"Partition table definition":{"name:":"noop","order by:":"_col2(DESC), _col1","partition by:":"_col2"}}] - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_3] - Function definitions:[{"Input definition":{"type:":"TABLE"}},{"Partition table definition":{"name:":"noop","order by:":"_col2(DESC), _col1","partition by:":"_col2"}}] - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_2] - | outputColumnNames:["_col1","_col2","_col5","_col7"] - | Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_1] - key expressions:p_mfgr (type: string), p_name (type: string) - Map-reduce partition columns:p_mfgr (type: string) - sort order:-+ - Statistics:Num rows: 26 Data size: 6006 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:p_size (type: int), p_retailprice (type: double) - TableScan [TS_0] - alias:part - Statistics:Num rows: 26 Data size: 6006 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 4 + File Output Operator [FS_13] + Select Operator [SEL_11] (rows=26 width=239) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + PTF Operator [PTF_10] (rows=26 width=499) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col2"}] + Select Operator [SEL_9] (rows=26 width=499) + Output:["_col1","_col2","_col5","_col7"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_8] + PartitionCols:_col2 + PTF Operator [PTF_7] (rows=26 width=499) + Function definitions:[{},{"Partition table definition":{"name:":"noopwithmap","order by:":"_col2(DESC), _col1","partition by:":"_col2"}},{"Partition table definition":{"name:":"noop","order by:":"_col2(DESC), _col1","partition by:":"_col2"}}] + Select Operator [SEL_6] (rows=26 width=499) + Output:["_col1","_col2","_col5","_col7"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_5] + PartitionCols:_col2 + PTF Operator [PTF_4] (rows=26 width=499) + Function definitions:[{},{"Partition table definition":{"name:":"noopwithmap","order by:":"_col2(DESC), _col1","partition by:":"_col2"}},{"Partition table definition":{"name:":"noop","order by:":"_col2(DESC), _col1","partition by:":"_col2"}}] + PTF Operator [PTF_3] (rows=26 width=499) + Function definitions:[{},{"Partition table definition":{"name:":"noop","order by:":"_col2(DESC), _col1","partition by:":"_col2"}}] + Select Operator [SEL_2] (rows=26 width=499) + Output:["_col1","_col2","_col5","_col7"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_1] + PartitionCols:p_mfgr + TableScan [TS_0] (rows=26 width=231) + default@part,part,Tbl:COMPLETE,Col:COMPLETE,Output:["p_mfgr","p_name","p_retailprice","p_size"] PREHOOK: query: explain select p_mfgr, p_name, @@ -7338,46 +4845,29 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 3 - File Output Operator [FS_10] - compressed:true - Statistics:Num rows: 26 Data size: 6110 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_7] - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 26 Data size: 6110 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_6] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col2"}] - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_5] - | outputColumnNames:["_col1","_col2","_col5","_col7"] - | Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_4] - key expressions:_col2 (type: string), _col1 (type: string) - Map-reduce partition columns:_col2 (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col5 (type: int), _col7 (type: double) - PTF Operator [PTF_3] - Function definitions:[{"Input definition":{"type:":"TABLE"}},{"Partition table definition":{"name:":"noop","order by:":"_col1","partition by:":"_col2"}}] - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_2] - | outputColumnNames:["_col1","_col2","_col5","_col7"] - | Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_1] - key expressions:p_mfgr (type: string), p_name (type: string) - Map-reduce partition columns:p_mfgr (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 6006 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:p_size (type: int), p_retailprice (type: double) - TableScan [TS_0] - alias:part - Statistics:Num rows: 26 Data size: 6006 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 3 + File Output Operator [FS_10] + Select Operator [SEL_7] (rows=26 width=235) + Output:["_col0","_col1","_col2","_col3"] + PTF Operator [PTF_6] (rows=26 width=499) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col2"}] + Select Operator [SEL_5] (rows=26 width=499) + Output:["_col1","_col2","_col5","_col7"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:_col2 + PTF Operator [PTF_3] (rows=26 width=499) + Function definitions:[{},{"Partition table definition":{"name:":"noop","order by:":"_col1","partition by:":"_col2"}}] + Select Operator [SEL_2] (rows=26 width=499) + Output:["_col1","_col2","_col5","_col7"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_1] + PartitionCols:p_mfgr + TableScan [TS_0] (rows=26 width=231) + default@part,part,Tbl:COMPLETE,Col:COMPLETE,Output:["p_mfgr","p_name","p_retailprice","p_size"] PREHOOK: query: explain select abc.p_mfgr, abc.p_name, @@ -7410,67 +4900,40 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 4 (BROADCAST_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 3 - File Output Operator [FS_15] - compressed:true - Statistics:Num rows: 29 Data size: 7511 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_13] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] - Statistics:Num rows: 29 Data size: 7511 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_12] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col2"}] - Statistics:Num rows: 29 Data size: 22243 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_11] - | outputColumnNames:["_col1","_col2","_col5","_col7"] - | Statistics:Num rows: 29 Data size: 22243 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - key expressions:_col2 (type: string), _col1 (type: string) - Map-reduce partition columns:_col2 (type: string) - sort order:++ - Statistics:Num rows: 29 Data size: 6699 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col5 (type: int), _col7 (type: double) - Map Join Operator [MAPJOIN_20] - | condition map:[{"":"Inner Join 0 to 1"}] - | HybridGraceHashJoin:true - | keys:{"Reducer 2":"_col0 (type: int)","Map 4":"p_partkey (type: int)"} - | outputColumnNames:["_col1","_col2","_col5","_col7"] - | Statistics:Num rows: 29 Data size: 6699 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 4 [BROADCAST_EDGE] - | Reduce Output Operator [RS_8] - | key expressions:p_partkey (type: int) - | Map-reduce partition columns:p_partkey (type: int) - | sort order:+ - | Statistics:Num rows: 26 Data size: 104 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_19] - | predicate:p_partkey is not null (type: boolean) - | Statistics:Num rows: 26 Data size: 104 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_1] - | alias:p1 - | Statistics:Num rows: 26 Data size: 104 Basic stats: COMPLETE Column stats: COMPLETE - |<-Filter Operator [FIL_18] - predicate:_col0 is not null (type: boolean) - Statistics:Num rows: 26 Data size: 13078 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_4] - Function definitions:[{"Input definition":{"type:":"TABLE"}},{"Partition table definition":{"name:":"noop","order by:":"_col1","partition by:":"_col2"}}] - Statistics:Num rows: 26 Data size: 13078 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_3] - | outputColumnNames:["_col0","_col1","_col2","_col5","_col7"] - | Statistics:Num rows: 26 Data size: 13078 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_2] - key expressions:p_mfgr (type: string), p_name (type: string) - Map-reduce partition columns:p_mfgr (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 6110 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:p_partkey (type: int), p_size (type: int), p_retailprice (type: double) - TableScan [TS_0] - alias:part - Statistics:Num rows: 26 Data size: 6110 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 3 + File Output Operator [FS_15] + Select Operator [SEL_13] (rows=29 width=259) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7","_col8"] + PTF Operator [PTF_12] (rows=29 width=767) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col2"}] + Select Operator [SEL_11] (rows=29 width=767) + Output:["_col1","_col2","_col5","_col7"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_10] + PartitionCols:_col2 + Map Join Operator [MAPJOIN_20] (rows=29 width=231) + HybridGraceHashJoin:true,Output:["_col1","_col2","_col5","_col7"],keys:{"FIL_18":"_col0","RS_8":"p_partkey"} + <-Map 4 [BROADCAST_EDGE] + BROADCAST [RS_8] + PartitionCols:p_partkey + Filter Operator [FIL_19] (rows=26 width=4) + predicate:p_partkey is not null + TableScan [TS_1] (rows=26 width=4) + default@part,p1,Tbl:COMPLETE,Col:COMPLETE,Output:["p_partkey"] + <-Filter Operator [FIL_18] (rows=26 width=503) + predicate:_col0 is not null + PTF Operator [PTF_4] (rows=26 width=503) + Function definitions:[{},{"Partition table definition":{"name:":"noop","order by:":"_col1","partition by:":"_col2"}}] + Select Operator [SEL_3] (rows=26 width=503) + Output:["_col0","_col1","_col2","_col5","_col7"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_2] + PartitionCols:p_mfgr + TableScan [TS_0] (rows=26 width=235) + default@part,part,Tbl:COMPLETE,Col:COMPLETE,Output:["p_mfgr","p_name","p_partkey","p_retailprice","p_size"] PREHOOK: query: explain create view IF NOT EXISTS mfgr_price_view as select p_mfgr, p_brand, @@ -7487,9 +4950,8 @@ POSTHOOK: type: CREATEVIEW Plan not optimized by CBO. Stage-0 - Create View Operator: - name:default.mfgr_price_view - original text:select p_mfgr, p_brand, + Create View Operator: + name:default.mfgr_price_view,original text:select p_mfgr, p_brand, sum(p_retailprice) as s from part group by p_mfgr, p_brand @@ -7579,94 +5041,62 @@ Reducer 4 <- Reducer 2 (SIMPLE_EDGE) Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Stage-4 - Stats-Aggr Operator - Stage-0 - Move Operator - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.part_4"} - Stage-3 - Dependency Collection{} - Stage-2 - Reducer 3 - File Output Operator [FS_9] - compressed:true - Statistics:Num rows: 26 Data size: 6214 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.part_4"} - Select Operator [SEL_7] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 26 Data size: 6214 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_6] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col2"}] - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_5] - | outputColumnNames:["_col1","_col2","_col5","_col7"] - | Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_4] - key expressions:_col2 (type: string), _col1 (type: string) - Map-reduce partition columns:_col2 (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col5 (type: int), _col7 (type: double) - PTF Operator [PTF_3] - Function definitions:[{"Input definition":{"type:":"TABLE"}},{"Partition table definition":{"name:":"noop","order by:":"_col1","partition by:":"_col2"}}] - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_2] - | outputColumnNames:["_col1","_col2","_col5","_col7"] - | Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_1] - key expressions:p_mfgr (type: string), p_name (type: string) - Map-reduce partition columns:p_mfgr (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 6006 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:p_size (type: int), p_retailprice (type: double) - TableScan [TS_0] - alias:part - Statistics:Num rows: 26 Data size: 6006 Basic stats: COMPLETE Column stats: COMPLETE - Reducer 5 - File Output Operator [FS_20] - compressed:true - Statistics:Num rows: 26 Data size: 6422 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.part_5"} - Select Operator [SEL_17] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - Statistics:Num rows: 26 Data size: 6422 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_16] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col3, _col2","partition by:":"_col3"}] - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_15] - | outputColumnNames:["_col0","_col2","_col3","_col6"] - | Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_14] - key expressions:_col2 (type: string), _col1 (type: string) - Map-reduce partition columns:_col2 (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:sum_window_0 (type: bigint), _col5 (type: int) - Select Operator [SEL_13] - outputColumnNames:["_col1","_col2","_col5","sum_window_0"] - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_12] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col5","partition by:":"_col2"}] - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_11] - | outputColumnNames:["_col1","_col2","_col5"] - | Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - key expressions:_col2 (type: string), _col5 (type: int) - Map-reduce partition columns:_col2 (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 12974 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: string) - Please refer to the previous PTF Operator [PTF_3] + Stats-Aggr Operator + Stage-0 + Move Operator + table:{"name:":"default.part_4"} + Stage-3 + Dependency Collection{} + Stage-2 + Reducer 3 + File Output Operator [FS_9] + table:{"name:":"default.part_4"} + Select Operator [SEL_7] (rows=26 width=239) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + PTF Operator [PTF_6] (rows=26 width=499) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col2"}] + Select Operator [SEL_5] (rows=26 width=499) + Output:["_col1","_col2","_col5","_col7"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:_col2 + PTF Operator [PTF_3] (rows=26 width=499) + Function definitions:[{},{"Partition table definition":{"name:":"noop","order by:":"_col1","partition by:":"_col2"}}] + Select Operator [SEL_2] (rows=26 width=499) + Output:["_col1","_col2","_col5","_col7"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_1] + PartitionCols:p_mfgr + TableScan [TS_0] (rows=26 width=231) + default@part,part,Tbl:COMPLETE,Col:COMPLETE,Output:["p_mfgr","p_name","p_retailprice","p_size"] + Reducer 5 + File Output Operator [FS_20] + table:{"name:":"default.part_5"} + Select Operator [SEL_17] (rows=26 width=247) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] + PTF Operator [PTF_16] (rows=26 width=499) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col3, _col2","partition by:":"_col3"}] + Select Operator [SEL_15] (rows=26 width=499) + Output:["_col0","_col2","_col3","_col6"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_14] + PartitionCols:_col2 + Select Operator [SEL_13] (rows=26 width=491) + Output:["_col1","_col2","_col5","sum_window_0"] + PTF Operator [PTF_12] (rows=26 width=491) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col5","partition by:":"_col2"}] + Select Operator [SEL_11] (rows=26 width=491) + Output:["_col1","_col2","_col5"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_10] + PartitionCols:_col2 + Please refer to the previous PTF Operator [PTF_3] Stage-5 - Stats-Aggr Operator - Stage-1 - Move Operator - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.part_5"} - Please refer to the previous Stage-3 + Stats-Aggr Operator + Stage-1 + Move Operator + table:{"name:":"default.part_5"} + Please refer to the previous Stage-3 PREHOOK: query: explain select p_mfgr, p_name, @@ -7710,62 +5140,38 @@ Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 4 - File Output Operator [FS_13] - compressed:true - Statistics:Num rows: 26 Data size: 6214 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_11] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 26 Data size: 6214 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_10] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col2, _col1","partition by:":"_col2, _col1"}] - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_9] - | outputColumnNames:["_col1","_col2","_col5"] - | Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_8] - key expressions:_col2 (type: string), _col1 (type: string) - Map-reduce partition columns:_col2 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col5 (type: int) - PTF Operator [PTF_7] - Function definitions:[{"Input definition":{"type:":"PTFCOMPONENT"}},{"Partition table definition":{"name:":"noopwithmap","order by:":"_col2, _col1","partition by:":"_col2, _col1"}},{"Partition table definition":{"name:":"noop","order by:":"_col2, _col1","partition by:":"_col2, _col1"}}] - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_6] - | outputColumnNames:["_col1","_col2","_col5"] - | Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_5] - key expressions:_col2 (type: string), _col1 (type: string) - Map-reduce partition columns:_col2 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col5 (type: int) - PTF Operator [PTF_4] - Function definitions:[{"Input definition":{"type:":"PTFCOMPONENT"}},{"Partition table definition":{"name:":"noopwithmap","order by:":"_col2, _col1","partition by:":"_col2, _col1"}},{"Partition table definition":{"name:":"noop","order by:":"_col2, _col1","partition by:":"_col2, _col1"}}] - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_3] - Function definitions:[{"Input definition":{"type:":"TABLE"}},{"Partition table definition":{"name:":"noop","order by:":"_col2","partition by:":"_col2"}},{"Partition table definition":{"name:":"noop","order by:":"_col2","partition by:":"_col2"}}] - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_2] - | outputColumnNames:["_col1","_col2","_col5"] - | Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_1] - key expressions:p_mfgr (type: string) - Map-reduce partition columns:p_mfgr (type: string) - sort order:+ - Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:p_name (type: string), p_size (type: int) - TableScan [TS_0] - alias:part - Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 4 + File Output Operator [FS_13] + Select Operator [SEL_11] (rows=26 width=239) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + PTF Operator [PTF_10] (rows=26 width=491) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col2, _col1","partition by:":"_col2, _col1"}] + Select Operator [SEL_9] (rows=26 width=491) + Output:["_col1","_col2","_col5"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_8] + PartitionCols:_col2, _col1 + PTF Operator [PTF_7] (rows=26 width=491) + Function definitions:[{},{"Partition table definition":{"name:":"noopwithmap","order by:":"_col2, _col1","partition by:":"_col2, _col1"}},{"Partition table definition":{"name:":"noop","order by:":"_col2, _col1","partition by:":"_col2, _col1"}}] + Select Operator [SEL_6] (rows=26 width=491) + Output:["_col1","_col2","_col5"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_5] + PartitionCols:_col2, _col1 + PTF Operator [PTF_4] (rows=26 width=491) + Function definitions:[{},{"Partition table definition":{"name:":"noopwithmap","order by:":"_col2, _col1","partition by:":"_col2, _col1"}},{"Partition table definition":{"name:":"noop","order by:":"_col2, _col1","partition by:":"_col2, _col1"}}] + PTF Operator [PTF_3] (rows=26 width=491) + Function definitions:[{},{"Partition table definition":{"name:":"noop","order by:":"_col2","partition by:":"_col2"}},{"Partition table definition":{"name:":"noop","order by:":"_col2","partition by:":"_col2"}}] + Select Operator [SEL_2] (rows=26 width=491) + Output:["_col1","_col2","_col5"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_1] + PartitionCols:p_mfgr + TableScan [TS_0] (rows=26 width=223) + default@part,part,Tbl:COMPLETE,Col:COMPLETE,Output:["p_mfgr","p_name","p_size"] PREHOOK: query: explain select p_mfgr, p_name, @@ -7810,72 +5216,43 @@ Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 5 - File Output Operator [FS_15] - compressed:true - Statistics:Num rows: 26 Data size: 6214 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_13] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 26 Data size: 6214 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_12] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col2"}] - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_11] - | outputColumnNames:["_col1","_col2","_col5"] - | Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - key expressions:_col2 (type: string), _col1 (type: string) - Map-reduce partition columns:_col2 (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col5 (type: int) - PTF Operator [PTF_9] - Function definitions:[{"Input definition":{"type:":"PTFCOMPONENT"}},{"Partition table definition":{"name:":"noop","order by:":"_col2","partition by:":"_col2"}}] - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_8] - | outputColumnNames:["_col1","_col2","_col5"] - | Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_7] - key expressions:_col2 (type: string) - Map-reduce partition columns:_col2 (type: string) - sort order:+ - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: string), _col5 (type: int) - PTF Operator [PTF_6] - Function definitions:[{"Input definition":{"type:":"PTFCOMPONENT"}},{"Partition table definition":{"name:":"noop","order by:":"_col2, _col1","partition by:":"_col2, _col1"}}] - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_5] - | outputColumnNames:["_col1","_col2","_col5"] - | Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_4] - key expressions:_col2 (type: string), _col1 (type: string) - Map-reduce partition columns:_col2 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col5 (type: int) - PTF Operator [PTF_3] - Function definitions:[{"Input definition":{"type:":"TABLE"}},{"Partition table definition":{"name:":"noop","order by:":"_col2","partition by:":"_col2"}},{"Partition table definition":{"name:":"noop","order by:":"_col2","partition by:":"_col2"}}] - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_2] - | outputColumnNames:["_col1","_col2","_col5"] - | Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_1] - key expressions:p_mfgr (type: string) - Map-reduce partition columns:p_mfgr (type: string) - sort order:+ - Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:p_name (type: string), p_size (type: int) - TableScan [TS_0] - alias:part - Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 5 + File Output Operator [FS_15] + Select Operator [SEL_13] (rows=26 width=239) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + PTF Operator [PTF_12] (rows=26 width=491) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col2"}] + Select Operator [SEL_11] (rows=26 width=491) + Output:["_col1","_col2","_col5"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_10] + PartitionCols:_col2 + PTF Operator [PTF_9] (rows=26 width=491) + Function definitions:[{},{"Partition table definition":{"name:":"noop","order by:":"_col2","partition by:":"_col2"}}] + Select Operator [SEL_8] (rows=26 width=491) + Output:["_col1","_col2","_col5"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_7] + PartitionCols:_col2 + PTF Operator [PTF_6] (rows=26 width=491) + Function definitions:[{},{"Partition table definition":{"name:":"noop","order by:":"_col2, _col1","partition by:":"_col2, _col1"}}] + Select Operator [SEL_5] (rows=26 width=491) + Output:["_col1","_col2","_col5"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:_col2, _col1 + PTF Operator [PTF_3] (rows=26 width=491) + Function definitions:[{},{"Partition table definition":{"name:":"noop","order by:":"_col2","partition by:":"_col2"}},{"Partition table definition":{"name:":"noop","order by:":"_col2","partition by:":"_col2"}}] + Select Operator [SEL_2] (rows=26 width=491) + Output:["_col1","_col2","_col5"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_1] + PartitionCols:p_mfgr + TableScan [TS_0] (rows=26 width=223) + default@part,part,Tbl:COMPLETE,Col:COMPLETE,Output:["p_mfgr","p_name","p_size"] PREHOOK: query: explain select p_mfgr, p_name, @@ -7915,59 +5292,36 @@ Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 4 - File Output Operator [FS_12] - compressed:true - Statistics:Num rows: 26 Data size: 6214 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_10] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 26 Data size: 6214 Basic stats: COMPLETE Column stats: COMPLETE - PTF Operator [PTF_9] - Function definitions:[{"Input definition":{"type:":"WINDOWING"}},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col2"}] - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_8] - | outputColumnNames:["_col1","_col2","_col5"] - | Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_7] - key expressions:_col2 (type: string), _col1 (type: string) - Map-reduce partition columns:_col2 (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col5 (type: int) - PTF Operator [PTF_6] - Function definitions:[{"Input definition":{"type:":"PTFCOMPONENT"}},{"Partition table definition":{"name:":"noop","order by:":"_col2","partition by:":"_col2"}},{"Partition table definition":{"name:":"noop","order by:":"_col2","partition by:":"_col2"}}] - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_5] - | outputColumnNames:["_col1","_col2","_col5"] - | Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_4] - key expressions:_col2 (type: string) - Map-reduce partition columns:_col2 (type: string) - sort order:+ - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: string), _col5 (type: int) - PTF Operator [PTF_3] - Function definitions:[{"Input definition":{"type:":"TABLE"}},{"Partition table definition":{"name:":"noop","order by:":"_col2, _col1","partition by:":"_col2, _col1"}},{"Partition table definition":{"name:":"noop","order by:":"_col2, _col1","partition by:":"_col2, _col1"}}] - Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_2] - | outputColumnNames:["_col1","_col2","_col5"] - | Statistics:Num rows: 26 Data size: 12766 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_1] - key expressions:p_mfgr (type: string), p_name (type: string) - Map-reduce partition columns:p_mfgr (type: string), p_name (type: string) - sort order:++ - Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:p_size (type: int) - TableScan [TS_0] - alias:part - Statistics:Num rows: 26 Data size: 5798 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 4 + File Output Operator [FS_12] + Select Operator [SEL_10] (rows=26 width=239) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + PTF Operator [PTF_9] (rows=26 width=491) + Function definitions:[{},{"name:":"windowingtablefunction","order by:":"_col1","partition by:":"_col2"}] + Select Operator [SEL_8] (rows=26 width=491) + Output:["_col1","_col2","_col5"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_7] + PartitionCols:_col2 + PTF Operator [PTF_6] (rows=26 width=491) + Function definitions:[{},{"Partition table definition":{"name:":"noop","order by:":"_col2","partition by:":"_col2"}},{"Partition table definition":{"name:":"noop","order by:":"_col2","partition by:":"_col2"}}] + Select Operator [SEL_5] (rows=26 width=491) + Output:["_col1","_col2","_col5"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:_col2 + PTF Operator [PTF_3] (rows=26 width=491) + Function definitions:[{},{"Partition table definition":{"name:":"noop","order by:":"_col2, _col1","partition by:":"_col2, _col1"}},{"Partition table definition":{"name:":"noop","order by:":"_col2, _col1","partition by:":"_col2, _col1"}}] + Select Operator [SEL_2] (rows=26 width=491) + Output:["_col1","_col2","_col5"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_1] + PartitionCols:p_mfgr, p_name + TableScan [TS_0] (rows=26 width=223) + default@part,part,Tbl:COMPLETE,Col:COMPLETE,Output:["p_mfgr","p_name","p_size"] PREHOOK: query: explain select distinct src.* from src PREHOOK: type: QUERY @@ -7980,40 +5334,25 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 3 - File Output Operator [FS_7] - compressed:true - Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_5] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_4] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_3] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_2] - key expressions:key (type: string), value (type: string) - Map-reduce partition columns:rand() (type: double) - sort order:++ - Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_1] - outputColumnNames:["key","value"] - Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_0] - alias:src - Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 3 + File Output Operator [FS_7] + Group By Operator [GBY_5] (rows=500 width=178) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:_col0, _col1 + Group By Operator [GBY_3] (rows=500 width=178) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_2] + PartitionCols:rand() + Select Operator [SEL_1] (rows=500 width=178) + Output:["key","value"] + TableScan [TS_0] (rows=500 width=178) + default@src,src,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] PREHOOK: query: explain select explode(array('a', 'b')) PREHOOK: type: QUERY @@ -8022,23 +5361,17 @@ POSTHOOK: type: QUERY Plan not optimized by CBO due to missing feature [Others]. Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Map 1 - File Output Operator [FS_3] - compressed:true - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - UDTF Operator [UDTF_2] - function name:explode - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: COMPLETE - Select Operator [SEL_1] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: COMPLETE - TableScan [TS_0] - alias:_dummy_table - Statistics:Num rows: 1 Data size: 1 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Map 1 + File Output Operator [FS_3] + UDTF Operator [UDTF_2] (rows=1 width=0) + function name:explode + Select Operator [SEL_1] (rows=1 width=0) + Output:["_col0"] + TableScan [TS_0] (rows=1 width=1) + _dummy_database@_dummy_table,_dummy_table,Tbl:COMPLETE,Col:COMPLETE PREHOOK: query: CREATE TABLE T1(key STRING, val STRING) STORED AS TEXTFILE PREHOOK: type: CREATETABLE @@ -8126,57 +5459,38 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) Stage-3 - Stats-Aggr Operator - Stage-0 - Move Operator - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.dest_j1"} - Stage-2 - Dependency Collection{} - Stage-1 - Reducer 2 - File Output Operator [FS_11] - compressed:true - Statistics:Num rows: 1219 Data size: 115805 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.dest_j1"} - Select Operator [SEL_9] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1219 Data size: 115805 Basic stats: COMPLETE Column stats: COMPLETE - Merge Join Operator [MERGEJOIN_16] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col0","_col2"] - | Statistics:Num rows: 1219 Data size: 216982 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_6] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE - | Select Operator [SEL_2] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_14] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:src1 - | Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_7] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: string) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_15] - predicate:key is not null (type: boolean) - Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_3] - alias:src1 - Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE + Stats-Aggr Operator + Stage-0 + Move Operator + table:{"name:":"default.dest_j1"} + Stage-2 + Dependency Collection{} + Stage-1 + Reducer 2 + File Output Operator [FS_11] + table:{"name:":"default.dest_j1"} + Select Operator [SEL_9] (rows=1219 width=95) + Output:["_col0","_col1"] + Merge Join Operator [MERGEJOIN_16] (rows=1219 width=178) + Output:["_col0","_col2"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_6] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=500 width=87) + Output:["_col0"] + Filter Operator [FIL_14] (rows=500 width=87) + predicate:key is not null + TableScan [TS_0] (rows=500 width=87) + default@src,src1,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_7] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=500 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_15] (rows=500 width=178) + predicate:key is not null + TableScan [TS_3] (rows=500 width=178) + default@src,src1,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] PREHOOK: query: FROM src src1 JOIN src src2 ON (src1.key = src2.key) INSERT OVERWRITE TABLE dest_j1 select src1.key, src2.value @@ -8208,68 +5522,40 @@ Vertex dependency in root stage Map 1 <- Map 2 (BROADCAST_EDGE), Map 3 (BROADCAST_EDGE), Map 4 (BROADCAST_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Map 1 - File Output Operator [FS_14] - compressed:true - Statistics:Num rows: 3 Data size: 99 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_13] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - Statistics:Num rows: 3 Data size: 99 Basic stats: COMPLETE Column stats: NONE - Map Join Operator [MAPJOIN_31] - | condition map:[{"":"Inner Join 0 to 1"},{"":"Inner Join 1 to 2"},{"":"Inner Join 2 to 3"}] - | HybridGraceHashJoin:true - | keys:{"Map 1":"key (type: string)","Map 2":"key (type: string)","Map 3":"key (type: string)","Map 4":"key (type: string)"} - | outputColumnNames:["_col0","_col1","_col5","_col6","_col10","_col11","_col15","_col16"] - | Statistics:Num rows: 3 Data size: 99 Basic stats: COMPLETE Column stats: NONE - |<-Map 2 [BROADCAST_EDGE] - | Reduce Output Operator [RS_7] - | key expressions:key (type: string) - | Map-reduce partition columns:key (type: string) - | sort order:+ - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - | value expressions:val (type: string) - | Filter Operator [FIL_28] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_1] - | alias:b - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - |<-Map 3 [BROADCAST_EDGE] - | Reduce Output Operator [RS_9] - | key expressions:key (type: string) - | Map-reduce partition columns:key (type: string) - | sort order:+ - | Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: NONE - | value expressions:val (type: string) - | Filter Operator [FIL_29] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_2] - | alias:c - | Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: NONE - |<-Map 4 [BROADCAST_EDGE] - | Reduce Output Operator [RS_11] - | key expressions:key (type: string) - | Map-reduce partition columns:key (type: string) - | sort order:+ - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - | value expressions:val (type: string) - | Filter Operator [FIL_30] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_3] - | alias:d - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - |<-Filter Operator [FIL_27] - predicate:key is not null (type: boolean) - Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_0] - alias:a - Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Map 1 + File Output Operator [FS_14] + Select Operator [SEL_13] (rows=3 width=33) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] + Map Join Operator [MAPJOIN_31] (rows=3 width=33) + HybridGraceHashJoin:true,Output:["_col0","_col1","_col5","_col6","_col10","_col11","_col15","_col16"],keys:{"FIL_27":"key","RS_7":"key","RS_9":"key","RS_11":"key"} + <-Map 2 [BROADCAST_EDGE] + BROADCAST [RS_7] + PartitionCols:key + Filter Operator [FIL_28] (rows=1 width=30) + predicate:key is not null + TableScan [TS_1] (rows=1 width=30) + default@t2,b,Tbl:COMPLETE,Col:NONE,Output:["key","val"] + <-Map 3 [BROADCAST_EDGE] + BROADCAST [RS_9] + PartitionCols:key + Filter Operator [FIL_29] (rows=1 width=20) + predicate:key is not null + TableScan [TS_2] (rows=1 width=20) + default@t3,c,Tbl:COMPLETE,Col:NONE,Output:["key","val"] + <-Map 4 [BROADCAST_EDGE] + BROADCAST [RS_11] + PartitionCols:key + Filter Operator [FIL_30] (rows=1 width=30) + predicate:key is not null + TableScan [TS_3] (rows=1 width=30) + default@t4,d,Tbl:COMPLETE,Col:NONE,Output:["key","val"] + <-Filter Operator [FIL_27] (rows=1 width=30) + predicate:key is not null + TableScan [TS_0] (rows=1 width=30) + default@t1,a,Tbl:COMPLETE,Col:NONE,Output:["key","val"] PREHOOK: query: explain select /*+ STREAMTABLE(a,c) */ * @@ -8289,68 +5575,40 @@ Vertex dependency in root stage Map 1 <- Map 2 (BROADCAST_EDGE), Map 3 (BROADCAST_EDGE), Map 4 (BROADCAST_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Map 1 - File Output Operator [FS_14] - compressed:true - Statistics:Num rows: 3 Data size: 99 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_13] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] - Statistics:Num rows: 3 Data size: 99 Basic stats: COMPLETE Column stats: NONE - Map Join Operator [MAPJOIN_31] - | condition map:[{"":"Inner Join 0 to 1"},{"":"Inner Join 1 to 2"},{"":"Inner Join 2 to 3"}] - | HybridGraceHashJoin:true - | keys:{"Map 1":"key (type: string)","Map 2":"key (type: string)","Map 3":"key (type: string)","Map 4":"key (type: string)"} - | outputColumnNames:["_col0","_col1","_col5","_col6","_col10","_col11","_col15","_col16"] - | Statistics:Num rows: 3 Data size: 99 Basic stats: COMPLETE Column stats: NONE - |<-Map 2 [BROADCAST_EDGE] - | Reduce Output Operator [RS_7] - | key expressions:key (type: string) - | Map-reduce partition columns:key (type: string) - | sort order:+ - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - | value expressions:val (type: string) - | Filter Operator [FIL_28] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_1] - | alias:b - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - |<-Map 3 [BROADCAST_EDGE] - | Reduce Output Operator [RS_9] - | key expressions:key (type: string) - | Map-reduce partition columns:key (type: string) - | sort order:+ - | Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: NONE - | value expressions:val (type: string) - | Filter Operator [FIL_29] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_2] - | alias:c - | Statistics:Num rows: 1 Data size: 20 Basic stats: COMPLETE Column stats: NONE - |<-Map 4 [BROADCAST_EDGE] - | Reduce Output Operator [RS_11] - | key expressions:key (type: string) - | Map-reduce partition columns:key (type: string) - | sort order:+ - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - | value expressions:val (type: string) - | Filter Operator [FIL_30] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_3] - | alias:d - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - |<-Filter Operator [FIL_27] - predicate:key is not null (type: boolean) - Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_0] - alias:a - Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Map 1 + File Output Operator [FS_14] + Select Operator [SEL_13] (rows=3 width=33) + Output:["_col0","_col1","_col2","_col3","_col4","_col5","_col6","_col7"] + Map Join Operator [MAPJOIN_31] (rows=3 width=33) + HybridGraceHashJoin:true,Output:["_col0","_col1","_col5","_col6","_col10","_col11","_col15","_col16"],keys:{"FIL_27":"key","RS_7":"key","RS_9":"key","RS_11":"key"} + <-Map 2 [BROADCAST_EDGE] + BROADCAST [RS_7] + PartitionCols:key + Filter Operator [FIL_28] (rows=1 width=30) + predicate:key is not null + TableScan [TS_1] (rows=1 width=30) + default@t2,b,Tbl:COMPLETE,Col:NONE,Output:["key","val"] + <-Map 3 [BROADCAST_EDGE] + BROADCAST [RS_9] + PartitionCols:key + Filter Operator [FIL_29] (rows=1 width=20) + predicate:key is not null + TableScan [TS_2] (rows=1 width=20) + default@t3,c,Tbl:COMPLETE,Col:NONE,Output:["key","val"] + <-Map 4 [BROADCAST_EDGE] + BROADCAST [RS_11] + PartitionCols:key + Filter Operator [FIL_30] (rows=1 width=30) + predicate:key is not null + TableScan [TS_3] (rows=1 width=30) + default@t4,d,Tbl:COMPLETE,Col:NONE,Output:["key","val"] + <-Filter Operator [FIL_27] (rows=1 width=30) + predicate:key is not null + TableScan [TS_0] (rows=1 width=30) + default@t1,a,Tbl:COMPLETE,Col:NONE,Output:["key","val"] PREHOOK: query: explain FROM T1 a JOIN src c ON c.key+1=a.key select /*+ STREAMTABLE(a) */ sum(hash(a.key)), sum(hash(a.val)), sum(hash(c.key)) PREHOOK: type: QUERY @@ -8364,58 +5622,33 @@ Reducer 3 <- Map 2 (SIMPLE_EDGE) Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 4 - File Output Operator [FS_13] - compressed:true - Statistics:Num rows: 1 Data size: 24 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_11] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 24 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - sort order: - Statistics:Num rows: 1 Data size: 24 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: bigint), _col1 (type: bigint), _col2 (type: bigint) - Group By Operator [GBY_9] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 24 Basic stats: COMPLETE Column stats: NONE - |<-Map 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_8] - Map-reduce partition columns:rand() (type: double) - sort order: - Statistics:Num rows: 550 Data size: 47850 Basic stats: COMPLETE Column stats: NONE - value expressions:hash(_col0) (type: int), hash(_col1) (type: int), hash(_col5) (type: int) - Map Join Operator [MAPJOIN_18] - | condition map:[{"":"Inner Join 0 to 1"}] - | HybridGraceHashJoin:true - | keys:{"Map 1":"UDFToDouble(key) (type: double)","Map 2":"(key + 1) (type: double)"} - | outputColumnNames:["_col0","_col1","_col5"] - | Statistics:Num rows: 550 Data size: 47850 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [BROADCAST_EDGE] - | Reduce Output Operator [RS_3] - | key expressions:UDFToDouble(key) (type: double) - | Map-reduce partition columns:UDFToDouble(key) (type: double) - | sort order:+ - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - | value expressions:key (type: string), val (type: string) - | Filter Operator [FIL_16] - | predicate:UDFToDouble(key) is not null (type: boolean) - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:a - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - |<-Filter Operator [FIL_17] - predicate:(key + 1) is not null (type: boolean) - Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_1] - alias:c - Statistics:Num rows: 500 Data size: 43500 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 4 + File Output Operator [FS_13] + Group By Operator [GBY_11] (rows=1 width=24) + Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_10] + Group By Operator [GBY_9] (rows=1 width=24) + Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] + <-Map 2 [SIMPLE_EDGE] + SHUFFLE [RS_8] + PartitionCols:rand() + Map Join Operator [MAPJOIN_18] (rows=550 width=87) + HybridGraceHashJoin:true,Output:["_col0","_col1","_col5"],keys:{"RS_3":"UDFToDouble(key)","FIL_17":"(key + 1)"} + <-Map 1 [BROADCAST_EDGE] + BROADCAST [RS_3] + PartitionCols:UDFToDouble(key) + Filter Operator [FIL_16] (rows=1 width=30) + predicate:UDFToDouble(key) is not null + TableScan [TS_0] (rows=1 width=30) + default@t1,a,Tbl:COMPLETE,Col:NONE,Output:["key","val"] + <-Filter Operator [FIL_17] (rows=500 width=87) + predicate:(key + 1) is not null + TableScan [TS_1] (rows=500 width=87) + default@src,c,Tbl:COMPLETE,Col:COMPLETE,Output:["key"] PREHOOK: query: FROM T1 a JOIN src c ON c.key+1=a.key select /*+ STREAMTABLE(a) */ sum(hash(a.key)), sum(hash(a.val)), sum(hash(c.key)) PREHOOK: type: QUERY @@ -8448,51 +5681,31 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_10] - compressed:true - Statistics:Num rows: 1219 Data size: 433964 Basic stats: COMPLETE Column stats: COMPLETE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Merge Join Operator [MERGEJOIN_15] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1219 Data size: 433964 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_6] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - | value expressions:_col1 (type: string) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - | Filter Operator [FIL_13] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - | TableScan [TS_0] - | alias:src - | Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_7] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col1 (type: string) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator [FIL_14] - predicate:key is not null (type: boolean) - Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_3] - alias:src - Statistics:Num rows: 500 Data size: 89000 Basic stats: COMPLETE Column stats: COMPLETE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_10] + Merge Join Operator [MERGEJOIN_15] (rows=1219 width=356) + Output:["_col0","_col1","_col2","_col3"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_6] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=500 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_13] (rows=500 width=178) + predicate:key is not null + TableScan [TS_0] (rows=500 width=178) + default@src,src,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_7] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=500 width=178) + Output:["_col0","_col1"] + Filter Operator [FIL_14] (rows=500 width=178) + predicate:key is not null + TableScan [TS_3] (rows=500 width=178) + default@src,src,Tbl:COMPLETE,Col:COMPLETE,Output:["key","value"] PREHOOK: query: explain select /*+ mapjoin(k)*/ sum(hash(k.key)), sum(hash(v.val)) from T1 k join T1 v on k.key=v.val PREHOOK: type: QUERY @@ -8506,57 +5719,33 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 3 - File Output Operator [FS_13] - compressed:true - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_11] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - sort order: - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: bigint), _col1 (type: bigint) - Group By Operator [GBY_9] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_8] - Map-reduce partition columns:rand() (type: double) - sort order: - Statistics:Num rows: 1 Data size: 33 Basic stats: COMPLETE Column stats: NONE - value expressions:hash(_col0) (type: int), hash(_col6) (type: int) - Map Join Operator [MAPJOIN_18] - | condition map:[{"":"Inner Join 0 to 1"}] - | HybridGraceHashJoin:true - | keys:{"Map 1":"key (type: string)","Map 4":"val (type: string)"} - | outputColumnNames:["_col0","_col6"] - | Statistics:Num rows: 1 Data size: 33 Basic stats: COMPLETE Column stats: NONE - |<-Map 4 [BROADCAST_EDGE] - | Reduce Output Operator [RS_5] - | key expressions:val (type: string) - | Map-reduce partition columns:val (type: string) - | sort order:+ - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_17] - | predicate:val is not null (type: boolean) - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_1] - | alias:v - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - |<-Filter Operator [FIL_16] - predicate:key is not null (type: boolean) - Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_0] - alias:k - Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 3 + File Output Operator [FS_13] + Group By Operator [GBY_11] (rows=1 width=16) + Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_10] + Group By Operator [GBY_9] (rows=1 width=16) + Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_8] + PartitionCols:rand() + Map Join Operator [MAPJOIN_18] (rows=1 width=33) + HybridGraceHashJoin:true,Output:["_col0","_col6"],keys:{"FIL_16":"key","RS_5":"val"} + <-Map 4 [BROADCAST_EDGE] + BROADCAST [RS_5] + PartitionCols:val + Filter Operator [FIL_17] (rows=1 width=30) + predicate:val is not null + TableScan [TS_1] (rows=1 width=30) + default@t1,v,Tbl:COMPLETE,Col:NONE,Output:["val"] + <-Filter Operator [FIL_16] (rows=1 width=30) + predicate:key is not null + TableScan [TS_0] (rows=1 width=30) + default@t1,k,Tbl:COMPLETE,Col:NONE,Output:["key"] PREHOOK: query: explain select sum(hash(k.key)), sum(hash(v.val)) from T1 k join T1 v on k.key=v.key PREHOOK: type: QUERY @@ -8570,67 +5759,39 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 3 - File Output Operator [FS_16] - compressed:true - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_14] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_13] - sort order: - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: bigint), _col1 (type: bigint) - Group By Operator [GBY_12] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_11] - Map-reduce partition columns:rand() (type: double) - sort order: - Statistics:Num rows: 1 Data size: 33 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col1 (type: int) - Select Operator [SEL_9] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 33 Basic stats: COMPLETE Column stats: NONE - Map Join Operator [MAPJOIN_21] - | condition map:[{"":"Inner Join 0 to 1"}] - | HybridGraceHashJoin:true - | keys:{"Map 1":"_col0 (type: string)","Map 4":"_col0 (type: string)"} - | outputColumnNames:["_col0","_col2"] - | Statistics:Num rows: 1 Data size: 33 Basic stats: COMPLETE Column stats: NONE - |<-Map 4 [BROADCAST_EDGE] - | Reduce Output Operator [RS_7] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_5] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_20] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_3] - | alias:k - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - |<-Select Operator [SEL_2] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_19] - predicate:key is not null (type: boolean) - Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_0] - alias:k - Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 3 + File Output Operator [FS_16] + Group By Operator [GBY_14] (rows=1 width=16) + Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_13] + Group By Operator [GBY_12] (rows=1 width=16) + Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_11] + PartitionCols:rand() + Select Operator [SEL_9] (rows=1 width=33) + Output:["_col0","_col1"] + Map Join Operator [MAPJOIN_21] (rows=1 width=33) + HybridGraceHashJoin:true,Output:["_col0","_col2"],keys:{"SEL_2":"_col0","RS_7":"_col0"} + <-Map 4 [BROADCAST_EDGE] + BROADCAST [RS_7] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=1 width=30) + Output:["_col0","_col1"] + Filter Operator [FIL_20] (rows=1 width=30) + predicate:key is not null + TableScan [TS_3] (rows=1 width=30) + default@t1,k,Tbl:COMPLETE,Col:NONE,Output:["key","val"] + <-Select Operator [SEL_2] (rows=1 width=30) + Output:["_col0"] + Filter Operator [FIL_19] (rows=1 width=30) + predicate:key is not null + TableScan [TS_0] (rows=1 width=30) + default@t1,k,Tbl:COMPLETE,Col:NONE,Output:["key"] PREHOOK: query: explain select count(1) from T1 a join T1 b on a.key = b.key PREHOOK: type: QUERY @@ -8644,61 +5805,37 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 3 - File Output Operator [FS_16] - compressed:true - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_14] - | aggregations:["count(VALUE._col0)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_13] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: bigint) - Group By Operator [GBY_12] - | aggregations:["count(1)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_11] - Map-reduce partition columns:rand() (type: double) - sort order: - Statistics:Num rows: 1 Data size: 33 Basic stats: COMPLETE Column stats: NONE - Map Join Operator [MAPJOIN_21] - | condition map:[{"":"Inner Join 0 to 1"}] - | HybridGraceHashJoin:true - | keys:{"Map 1":"_col0 (type: string)","Map 4":"_col0 (type: string)"} - | Statistics:Num rows: 1 Data size: 33 Basic stats: COMPLETE Column stats: NONE - |<-Map 4 [BROADCAST_EDGE] - | Reduce Output Operator [RS_7] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_5] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_20] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_3] - | alias:a - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - |<-Select Operator [SEL_2] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_19] - predicate:key is not null (type: boolean) - Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_0] - alias:a - Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 3 + File Output Operator [FS_16] + Group By Operator [GBY_14] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_13] + Group By Operator [GBY_12] (rows=1 width=8) + Output:["_col0"],aggregations:["count(1)"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_11] + PartitionCols:rand() + Map Join Operator [MAPJOIN_21] (rows=1 width=33) + HybridGraceHashJoin:true,keys:{"SEL_2":"_col0","RS_7":"_col0"} + <-Map 4 [BROADCAST_EDGE] + BROADCAST [RS_7] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=1 width=30) + Output:["_col0"] + Filter Operator [FIL_20] (rows=1 width=30) + predicate:key is not null + TableScan [TS_3] (rows=1 width=30) + default@t1,a,Tbl:COMPLETE,Col:NONE,Output:["key"] + <-Select Operator [SEL_2] (rows=1 width=30) + Output:["_col0"] + Filter Operator [FIL_19] (rows=1 width=30) + predicate:key is not null + TableScan [TS_0] (rows=1 width=30) + default@t1,a,Tbl:COMPLETE,Col:NONE,Output:["key"] PREHOOK: query: explain FROM T1 a LEFT OUTER JOIN T2 c ON c.key+1=a.key select sum(hash(a.key)), sum(hash(a.val)), sum(hash(c.key)) PREHOOK: type: QUERY @@ -8712,61 +5849,35 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 3 - File Output Operator [FS_14] - compressed:true - Statistics:Num rows: 1 Data size: 24 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_12] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 24 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_11] - sort order: - Statistics:Num rows: 1 Data size: 24 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: bigint), _col1 (type: bigint), _col2 (type: bigint) - Group By Operator [GBY_10] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 24 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_9] - Map-reduce partition columns:rand() (type: double) - sort order: - Statistics:Num rows: 1 Data size: 33 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: int), _col1 (type: int), _col2 (type: int) - Select Operator [SEL_7] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 33 Basic stats: COMPLETE Column stats: NONE - Map Join Operator [MAPJOIN_17] - | condition map:[{"":"Left Outer Join0 to 1"}] - | HybridGraceHashJoin:true - | keys:{"Map 1":"UDFToDouble(_col0) (type: double)","Map 4":"(UDFToDouble(_col0) + UDFToDouble(1)) (type: double)"} - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 33 Basic stats: COMPLETE Column stats: NONE - |<-Map 4 [BROADCAST_EDGE] - | Reduce Output Operator [RS_5] - | key expressions:(UDFToDouble(_col0) + UDFToDouble(1)) (type: double) - | Map-reduce partition columns:(UDFToDouble(_col0) + UDFToDouble(1)) (type: double) - | sort order:+ - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: string) - | Select Operator [SEL_3] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_2] - | alias:c - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - |<-Select Operator [SEL_1] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_0] - alias:a - Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 3 + File Output Operator [FS_14] + Group By Operator [GBY_12] (rows=1 width=24) + Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_11] + Group By Operator [GBY_10] (rows=1 width=24) + Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:rand() + Select Operator [SEL_7] (rows=1 width=33) + Output:["_col0","_col1","_col2"] + Map Join Operator [MAPJOIN_17] (rows=1 width=33) + HybridGraceHashJoin:true,Output:["_col0","_col1","_col2"],keys:{"SEL_1":"UDFToDouble(_col0)","RS_5":"(UDFToDouble(_col0) + UDFToDouble(1))"} + <-Map 4 [BROADCAST_EDGE] + BROADCAST [RS_5] + PartitionCols:(UDFToDouble(_col0) + UDFToDouble(1)) + Select Operator [SEL_3] (rows=1 width=30) + Output:["_col0"] + TableScan [TS_2] (rows=1 width=30) + default@t2,c,Tbl:COMPLETE,Col:NONE,Output:["key"] + <-Select Operator [SEL_1] (rows=1 width=30) + Output:["_col0","_col1"] + TableScan [TS_0] (rows=1 width=30) + default@t1,a,Tbl:COMPLETE,Col:NONE,Output:["key","val"] PREHOOK: query: explain FROM T1 a RIGHT OUTER JOIN T2 c ON c.key+1=a.key select /*+ STREAMTABLE(a) */ sum(hash(a.key)), sum(hash(a.val)), sum(hash(c.key)) PREHOOK: type: QUERY @@ -8780,52 +5891,29 @@ Reducer 3 <- Map 2 (SIMPLE_EDGE) Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 4 - File Output Operator [FS_11] - compressed:true - Statistics:Num rows: 1 Data size: 24 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_9] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 24 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_8] - sort order: - Statistics:Num rows: 1 Data size: 24 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: bigint), _col1 (type: bigint), _col2 (type: bigint) - Group By Operator [GBY_7] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 24 Basic stats: COMPLETE Column stats: NONE - |<-Map 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_6] - Map-reduce partition columns:rand() (type: double) - sort order: - Statistics:Num rows: 1 Data size: 33 Basic stats: COMPLETE Column stats: NONE - value expressions:hash(_col0) (type: int), hash(_col1) (type: int), hash(_col5) (type: int) - Map Join Operator [MAPJOIN_14] - | condition map:[{"":"Right Outer Join0 to 1"}] - | HybridGraceHashJoin:true - | keys:{"Map 1":"UDFToDouble(key) (type: double)","Map 2":"(key + 1) (type: double)"} - | outputColumnNames:["_col0","_col1","_col5"] - | Statistics:Num rows: 1 Data size: 33 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [BROADCAST_EDGE] - | Reduce Output Operator [RS_2] - | key expressions:UDFToDouble(key) (type: double) - | Map-reduce partition columns:UDFToDouble(key) (type: double) - | sort order:+ - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - | value expressions:key (type: string), val (type: string) - | TableScan [TS_0] - | alias:a - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - |<-TableScan [TS_1] - alias:c - Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 4 + File Output Operator [FS_11] + Group By Operator [GBY_9] (rows=1 width=24) + Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_8] + Group By Operator [GBY_7] (rows=1 width=24) + Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] + <-Map 2 [SIMPLE_EDGE] + SHUFFLE [RS_6] + PartitionCols:rand() + Map Join Operator [MAPJOIN_14] (rows=1 width=33) + HybridGraceHashJoin:true,Output:["_col0","_col1","_col5"],keys:{"RS_2":"UDFToDouble(key)","TS_1":"(key + 1)"} + <-Map 1 [BROADCAST_EDGE] + BROADCAST [RS_2] + PartitionCols:UDFToDouble(key) + TableScan [TS_0] (rows=1 width=30) + default@t1,a,Tbl:COMPLETE,Col:NONE,Output:["key","val"] + <-TableScan [TS_1] (rows=1 width=30) + default@t2,c,Tbl:COMPLETE,Col:NONE,Output:["key"] PREHOOK: query: explain FROM T1 a FULL OUTER JOIN T2 c ON c.key+1=a.key select /*+ STREAMTABLE(a) */ sum(hash(a.key)), sum(hash(a.val)), sum(hash(c.key)) PREHOOK: type: QUERY @@ -8839,58 +5927,32 @@ Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 4 - File Output Operator [FS_11] - compressed:true - Statistics:Num rows: 1 Data size: 24 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_9] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 24 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_8] - sort order: - Statistics:Num rows: 1 Data size: 24 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: bigint), _col1 (type: bigint), _col2 (type: bigint) - Group By Operator [GBY_7] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 24 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_6] - Map-reduce partition columns:rand() (type: double) - sort order: - Statistics:Num rows: 1 Data size: 33 Basic stats: COMPLETE Column stats: NONE - value expressions:hash(_col0) (type: int), hash(_col1) (type: int), hash(_col5) (type: int) - Merge Join Operator [MERGEJOIN_12] - | condition map:[{"":"Outer Join 0 to 1"}] - | keys:{"0":"UDFToDouble(key) (type: double)","1":"(key + 1) (type: double)"} - | outputColumnNames:["_col0","_col1","_col5"] - | Statistics:Num rows: 1 Data size: 33 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_2] - | key expressions:UDFToDouble(key) (type: double) - | Map-reduce partition columns:UDFToDouble(key) (type: double) - | sort order:+ - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - | value expressions:key (type: string), val (type: string) - | TableScan [TS_0] - | alias:a - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - |<-Map 5 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - key expressions:(key + 1) (type: double) - Map-reduce partition columns:(key + 1) (type: double) - sort order:+ - Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - value expressions:key (type: string) - TableScan [TS_1] - alias:c - Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 4 + File Output Operator [FS_11] + Group By Operator [GBY_9] (rows=1 width=24) + Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_8] + Group By Operator [GBY_7] (rows=1 width=24) + Output:["_col0","_col1","_col2"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)","sum(VALUE._col2)"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_6] + PartitionCols:rand() + Merge Join Operator [MERGEJOIN_12] (rows=1 width=33) + Output:["_col0","_col1","_col5"],keys:{"0":"UDFToDouble(key)","1":"(key + 1)"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_2] + PartitionCols:UDFToDouble(key) + TableScan [TS_0] (rows=1 width=30) + default@t1,a,Tbl:COMPLETE,Col:NONE,Output:["key","val"] + <-Map 5 [SIMPLE_EDGE] + SHUFFLE [RS_3] + PartitionCols:(key + 1) + TableScan [TS_1] (rows=1 width=30) + default@t2,c,Tbl:COMPLETE,Col:NONE,Output:["key"] PREHOOK: query: explain select /*+ mapjoin(v)*/ sum(hash(k.key)), sum(hash(v.val)) from T1 k left outer join T1 v on k.key+1=v.key PREHOOK: type: QUERY @@ -8904,50 +5966,27 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 3 - File Output Operator [FS_11] - compressed:true - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_9] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_8] - sort order: - Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: bigint), _col1 (type: bigint) - Group By Operator [GBY_7] - | aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 16 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_6] - Map-reduce partition columns:rand() (type: double) - sort order: - Statistics:Num rows: 1 Data size: 33 Basic stats: COMPLETE Column stats: NONE - value expressions:hash(_col0) (type: int), hash(_col6) (type: int) - Map Join Operator [MAPJOIN_14] - | condition map:[{"":"Left Outer Join0 to 1"}] - | HybridGraceHashJoin:true - | keys:{"Map 1":"(key + 1) (type: double)","Map 4":"UDFToDouble(key) (type: double)"} - | outputColumnNames:["_col0","_col6"] - | Statistics:Num rows: 1 Data size: 33 Basic stats: COMPLETE Column stats: NONE - |<-Map 4 [BROADCAST_EDGE] - | Reduce Output Operator [RS_3] - | key expressions:UDFToDouble(key) (type: double) - | Map-reduce partition columns:UDFToDouble(key) (type: double) - | sort order:+ - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - | value expressions:val (type: string) - | TableScan [TS_1] - | alias:v - | Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE - |<-TableScan [TS_0] - alias:k - Statistics:Num rows: 1 Data size: 30 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 3 + File Output Operator [FS_11] + Group By Operator [GBY_9] (rows=1 width=16) + Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_8] + Group By Operator [GBY_7] (rows=1 width=16) + Output:["_col0","_col1"],aggregations:["sum(VALUE._col0)","sum(VALUE._col1)"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_6] + PartitionCols:rand() + Map Join Operator [MAPJOIN_14] (rows=1 width=33) + HybridGraceHashJoin:true,Output:["_col0","_col6"],keys:{"TS_0":"(key + 1)","RS_3":"UDFToDouble(key)"} + <-Map 4 [BROADCAST_EDGE] + BROADCAST [RS_3] + PartitionCols:UDFToDouble(key) + TableScan [TS_1] (rows=1 width=30) + default@t1,v,Tbl:COMPLETE,Col:NONE,Output:["key","val"] + <-TableScan [TS_0] (rows=1 width=30) + default@t1,k,Tbl:COMPLETE,Col:NONE,Output:["key"] diff --git a/ql/src/test/results/clientpositive/tez/explainuser_2.q.out b/ql/src/test/results/clientpositive/tez/explainuser_2.q.out index eb7d564..788e50f 100644 --- a/ql/src/test/results/clientpositive/tez/explainuser_2.q.out +++ b/ql/src/test/results/clientpositive/tez/explainuser_2.q.out @@ -185,81 +185,47 @@ Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE) Reducer 3 <- Map 5 (SIMPLE_EDGE), Reducer 2 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 3 - File Output Operator [FS_16] - compressed:false - Statistics:Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_15] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_26] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col3 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col0","_col3","_col6"] - | Statistics:Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE - |<-Map 5 [SIMPLE_EDGE] - | Reduce Output Operator [RS_13] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_24] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:y - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_12] - key expressions:_col3 (type: string) - Map-reduce partition columns:_col3 (type: string) - sort order:+ - Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: string) - Merge Join Operator [MERGEJOIN_25] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: string)","1":"_col1 (type: string)"} - | outputColumnNames:["_col0","_col3"] - | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_9] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_2] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_22] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:z - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Map 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_10] - key expressions:_col1 (type: string) - Map-reduce partition columns:_col1 (type: string) - sort order:+ - Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: string) - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_23] - predicate:(key is not null and value is not null) (type: boolean) - Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:x - Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 3 + File Output Operator [FS_16] + Select Operator [SEL_15] (rows=605 width=10) + Output:["_col0","_col1","_col2"] + Merge Join Operator [MERGEJOIN_26] (rows=605 width=10) + Output:["_col0","_col3","_col6"],keys:{"0":"_col3","1":"_col0"} + <-Map 5 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_24] (rows=500 width=10) + predicate:key is not null + TableScan [TS_6] (rows=500 width=10) + default@src,y,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_25] (rows=550 width=10) + Output:["_col0","_col3"],keys:{"0":"_col0","1":"_col1"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_9] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=500 width=10) + Output:["_col0"] + Filter Operator [FIL_22] (rows=500 width=10) + predicate:value is not null + TableScan [TS_0] (rows=500 width=10) + default@srcpart,z,Tbl:COMPLETE,Col:NONE,Output:["value"] + <-Map 4 [SIMPLE_EDGE] + SHUFFLE [RS_10] + PartitionCols:_col1 + Select Operator [SEL_5] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_23] (rows=25 width=7) + predicate:(key is not null and value is not null) + TableScan [TS_3] (rows=25 width=7) + default@src1,x,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: EXPLAIN select @@ -331,252 +297,134 @@ Reducer 8 <- Map 12 (SIMPLE_EDGE), Map 7 (SIMPLE_EDGE) Reducer 9 <- Map 13 (SIMPLE_EDGE), Reducer 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 5 - File Output Operator [FS_55] - compressed:false - Statistics:Num rows: 100 Data size: 1000 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_54] - Number of rows:100 - Statistics:Num rows: 100 Data size: 1000 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_53] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 805 Data size: 8553 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_52] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string) - sort order:+++ - Statistics:Num rows: 805 Data size: 8553 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: bigint), _col4 (type: bigint), _col5 (type: bigint) - Select Operator [SEL_51] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 805 Data size: 8553 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_50] - | aggregations:["count(VALUE._col0)","count(VALUE._col1)","count(VALUE._col2)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 805 Data size: 8553 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_49] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: string) - sort order:+++ - Statistics:Num rows: 1610 Data size: 17107 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: bigint), _col4 (type: bigint), _col5 (type: bigint) - Group By Operator [GBY_48] - aggregations:["count(_col13)","count(_col21)","count(_col3)"] - keys:_col2 (type: string), _col12 (type: string), _col20 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 1610 Data size: 17107 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_47] - outputColumnNames:["_col2","_col12","_col20","_col13","_col21","_col3"] - Statistics:Num rows: 1610 Data size: 17107 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_97] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: string), _col3 (type: string)","1":"_col15 (type: string), _col17 (type: string)"} - | outputColumnNames:["_col2","_col3","_col12","_col13","_col20","_col21"] - | Statistics:Num rows: 1610 Data size: 17107 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_45] - | key expressions:_col15 (type: string), _col17 (type: string) - | Map-reduce partition columns:_col15 (type: string), _col17 (type: string) - | sort order:++ - | Statistics:Num rows: 1464 Data size: 15552 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col6 (type: string), _col7 (type: string), _col14 (type: string) - | Select Operator [SEL_40] - | outputColumnNames:["_col14","_col15","_col17","_col6","_col7"] - | Statistics:Num rows: 1464 Data size: 15552 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_96] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col4 (type: string), _col6 (type: string)","1":"_col2 (type: string), _col4 (type: string)"} - | | outputColumnNames:["_col2","_col3","_col14","_col15","_col17"] - | | Statistics:Num rows: 1464 Data size: 15552 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 10 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_37] - | | key expressions:_col4 (type: string), _col6 (type: string) - | | Map-reduce partition columns:_col4 (type: string), _col6 (type: string) - | | sort order:++ - | | Statistics:Num rows: 1331 Data size: 14139 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col2 (type: string), _col3 (type: string) - | | Merge Join Operator [MERGEJOIN_94] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col3 (type: string)","1":"_col1 (type: string)"} - | | | outputColumnNames:["_col2","_col3","_col4","_col6"] - | | | Statistics:Num rows: 1331 Data size: 14139 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 14 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_35] - | | | key expressions:_col1 (type: string) - | | | Map-reduce partition columns:_col1 (type: string) - | | | sort order:+ - | | | Statistics:Num rows: 12 Data size: 91 Basic stats: COMPLETE Column stats: NONE - | | | Select Operator [SEL_17] - | | | outputColumnNames:["_col1"] - | | | Statistics:Num rows: 12 Data size: 91 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_88] - | | | predicate:((key = 'src1key') and value is not null) (type: boolean) - | | | Statistics:Num rows: 12 Data size: 91 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_15] - | | | alias:src1 - | | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 9 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_34] - | | key expressions:_col3 (type: string) - | | Map-reduce partition columns:_col3 (type: string) - | | sort order:+ - | | Statistics:Num rows: 1210 Data size: 12854 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col2 (type: string), _col4 (type: string), _col6 (type: string) - | | Merge Join Operator [MERGEJOIN_93] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col2 (type: string)","1":"_col0 (type: string)"} - | | | outputColumnNames:["_col2","_col3","_col4","_col6"] - | | | Statistics:Num rows: 1210 Data size: 12854 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 13 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_32] - | | | key expressions:_col0 (type: string) - | | | Map-reduce partition columns:_col0 (type: string) - | | | sort order:+ - | | | Statistics:Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE - | | | Select Operator [SEL_14] - | | | outputColumnNames:["_col0"] - | | | Statistics:Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_87] - | | | predicate:((value = 'd1value') and key is not null) (type: boolean) - | | | Statistics:Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_12] - | | | alias:d1 - | | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 8 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_31] - | | key expressions:_col2 (type: string) - | | Map-reduce partition columns:_col2 (type: string) - | | sort order:+ - | | Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col3 (type: string), _col4 (type: string), _col6 (type: string) - | | Merge Join Operator [MERGEJOIN_92] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"_col1 (type: string)","1":"_col3 (type: string)"} - | | | outputColumnNames:["_col2","_col3","_col4","_col6"] - | | | Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 12 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_29] - | | | key expressions:_col3 (type: string) - | | | Map-reduce partition columns:_col3 (type: string) - | | | sort order:+ - | | | Statistics:Num rows: 42 Data size: 1455 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col4 (type: string) - | | | Select Operator [SEL_11] - | | | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | | | Statistics:Num rows: 42 Data size: 1455 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_86] - | | | predicate:(((((k3 is not null and (v3 = 'ssv3')) and k2 is not null) and k1 is not null) and v1 is not null) and v2 is not null) (type: boolean) - | | | Statistics:Num rows: 42 Data size: 1455 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_9] - | | | alias:ss - | | | Statistics:Num rows: 85 Data size: 2945 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 7 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_28] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 1000 Data size: 10624 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_8] - | | outputColumnNames:["_col1"] - | | Statistics:Num rows: 1000 Data size: 10624 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_85] - | | predicate:((key = 'srcpartkey') and value is not null) (type: boolean) - | | Statistics:Num rows: 1000 Data size: 10624 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_6] - | | alias:srcpart - | | Statistics:Num rows: 2000 Data size: 21248 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 16 [SIMPLE_EDGE] - | Reduce Output Operator [RS_38] - | key expressions:_col2 (type: string), _col4 (type: string) - | Map-reduce partition columns:_col2 (type: string), _col4 (type: string) - | sort order:++ - | Statistics:Num rows: 275 Data size: 2921 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: string), _col5 (type: string) - | Merge Join Operator [MERGEJOIN_95] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | | outputColumnNames:["_col2","_col3","_col4","_col5"] - | | Statistics:Num rows: 275 Data size: 2921 Basic stats: COMPLETE Column stats: NONE - | |<-Map 15 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_24] - | | key expressions:_col0 (type: string) - | | Map-reduce partition columns:_col0 (type: string) - | | sort order:+ - | | Statistics:Num rows: 42 Data size: 1455 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string) - | | Select Operator [SEL_20] - | | outputColumnNames:["_col0","_col2","_col3","_col4","_col5"] - | | Statistics:Num rows: 42 Data size: 1455 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_89] - | | predicate:((((((v1 = 'srv1') and k3 is not null) and k2 is not null) and v3 is not null) and v2 is not null) and k1 is not null) (type: boolean) - | | Statistics:Num rows: 42 Data size: 1455 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_18] - | | alias:sr - | | Statistics:Num rows: 85 Data size: 2945 Basic stats: COMPLETE Column stats: NONE - | |<-Map 17 [SIMPLE_EDGE] - | Reduce Output Operator [RS_25] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_23] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_90] - | predicate:((value) IN ('2000Q1', '2000Q2', '2000Q3') and key is not null) (type: boolean) - | Statistics:Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_21] - | alias:d1 - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [SIMPLE_EDGE] - Reduce Output Operator [RS_44] - key expressions:_col1 (type: string), _col3 (type: string) - Map-reduce partition columns:_col1 (type: string), _col3 (type: string) - sort order:++ - Statistics:Num rows: 275 Data size: 2921 Basic stats: COMPLETE Column stats: NONE - value expressions:_col2 (type: string) - Merge Join Operator [MERGEJOIN_91] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col1","_col2","_col3"] - | Statistics:Num rows: 275 Data size: 2921 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_41] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 170 Data size: 5890 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string), _col2 (type: string), _col3 (type: string) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 170 Data size: 5890 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_83] - | predicate:((v3 is not null and v2 is not null) and k1 is not null) (type: boolean) - | Statistics:Num rows: 170 Data size: 5890 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:cs - | Statistics:Num rows: 170 Data size: 5890 Basic stats: COMPLETE Column stats: NONE - |<-Map 6 [SIMPLE_EDGE] - Reduce Output Operator [RS_42] - key expressions:_col0 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:+ - Statistics:Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_84] - predicate:((value) IN ('2000Q1', '2000Q2', '2000Q3') and key is not null) (type: boolean) - Statistics:Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:d1 - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 5 + File Output Operator [FS_55] + Limit [LIM_54] (rows=100 width=10) + Number of rows:100 + Select Operator [SEL_53] (rows=805 width=10) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_52] + Select Operator [SEL_51] (rows=805 width=10) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Group By Operator [GBY_50] (rows=805 width=10) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["count(VALUE._col0)","count(VALUE._col1)","count(VALUE._col2)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_49] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_48] (rows=1610 width=10) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["count(_col13)","count(_col21)","count(_col3)"],keys:_col2, _col12, _col20 + Select Operator [SEL_47] (rows=1610 width=10) + Output:["_col2","_col12","_col20","_col13","_col21","_col3"] + Merge Join Operator [MERGEJOIN_97] (rows=1610 width=10) + Output:["_col2","_col3","_col12","_col13","_col20","_col21"],keys:{"0":"_col1, _col3","1":"_col15, _col17"} + <-Reducer 11 [SIMPLE_EDGE] + SHUFFLE [RS_45] + PartitionCols:_col15, _col17 + Select Operator [SEL_40] (rows=1464 width=10) + Output:["_col14","_col15","_col17","_col6","_col7"] + Merge Join Operator [MERGEJOIN_96] (rows=1464 width=10) + Output:["_col2","_col3","_col14","_col15","_col17"],keys:{"0":"_col4, _col6","1":"_col2, _col4"} + <-Reducer 10 [SIMPLE_EDGE] + SHUFFLE [RS_37] + PartitionCols:_col4, _col6 + Merge Join Operator [MERGEJOIN_94] (rows=1331 width=10) + Output:["_col2","_col3","_col4","_col6"],keys:{"0":"_col3","1":"_col1"} + <-Map 14 [SIMPLE_EDGE] + SHUFFLE [RS_35] + PartitionCols:_col1 + Select Operator [SEL_17] (rows=12 width=7) + Output:["_col1"] + Filter Operator [FIL_88] (rows=12 width=7) + predicate:((key = 'src1key') and value is not null) + TableScan [TS_15] (rows=25 width=7) + default@src1,src1,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Reducer 9 [SIMPLE_EDGE] + SHUFFLE [RS_34] + PartitionCols:_col3 + Merge Join Operator [MERGEJOIN_93] (rows=1210 width=10) + Output:["_col2","_col3","_col4","_col6"],keys:{"0":"_col2","1":"_col0"} + <-Map 13 [SIMPLE_EDGE] + SHUFFLE [RS_32] + PartitionCols:_col0 + Select Operator [SEL_14] (rows=250 width=10) + Output:["_col0"] + Filter Operator [FIL_87] (rows=250 width=10) + predicate:((value = 'd1value') and key is not null) + TableScan [TS_12] (rows=500 width=10) + default@src,d1,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Reducer 8 [SIMPLE_EDGE] + SHUFFLE [RS_31] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_92] (rows=1100 width=10) + Output:["_col2","_col3","_col4","_col6"],keys:{"0":"_col1","1":"_col3"} + <-Map 12 [SIMPLE_EDGE] + SHUFFLE [RS_29] + PartitionCols:_col3 + Select Operator [SEL_11] (rows=42 width=34) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_86] (rows=42 width=34) + predicate:(((((k3 is not null and (v3 = 'ssv3')) and k2 is not null) and k1 is not null) and v1 is not null) and v2 is not null) + TableScan [TS_9] (rows=85 width=34) + default@ss,ss,Tbl:COMPLETE,Col:NONE,Output:["k1","v1","k2","v2","k3","v3"] + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_28] + PartitionCols:_col1 + Select Operator [SEL_8] (rows=1000 width=10) + Output:["_col1"] + Filter Operator [FIL_85] (rows=1000 width=10) + predicate:((key = 'srcpartkey') and value is not null) + TableScan [TS_6] (rows=2000 width=10) + default@srcpart,srcpart,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Reducer 16 [SIMPLE_EDGE] + SHUFFLE [RS_38] + PartitionCols:_col2, _col4 + Merge Join Operator [MERGEJOIN_95] (rows=275 width=10) + Output:["_col2","_col3","_col4","_col5"],keys:{"0":"_col0","1":"_col0"} + <-Map 15 [SIMPLE_EDGE] + SHUFFLE [RS_24] + PartitionCols:_col0 + Select Operator [SEL_20] (rows=42 width=34) + Output:["_col0","_col2","_col3","_col4","_col5"] + Filter Operator [FIL_89] (rows=42 width=34) + predicate:((((((v1 = 'srv1') and k3 is not null) and k2 is not null) and v3 is not null) and v2 is not null) and k1 is not null) + TableScan [TS_18] (rows=85 width=34) + default@sr,sr,Tbl:COMPLETE,Col:NONE,Output:["k1","v1","k2","v2","k3","v3"] + <-Map 17 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col0 + Select Operator [SEL_23] (rows=250 width=10) + Output:["_col0"] + Filter Operator [FIL_90] (rows=250 width=10) + predicate:((value) IN ('2000Q1', '2000Q2', '2000Q3') and key is not null) + TableScan [TS_21] (rows=500 width=10) + default@src,d1,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Reducer 2 [SIMPLE_EDGE] + SHUFFLE [RS_44] + PartitionCols:_col1, _col3 + Merge Join Operator [MERGEJOIN_91] (rows=275 width=10) + Output:["_col1","_col2","_col3"],keys:{"0":"_col0","1":"_col0"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_41] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=170 width=34) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_83] (rows=170 width=34) + predicate:((v3 is not null and v2 is not null) and k1 is not null) + TableScan [TS_0] (rows=170 width=34) + default@cs,cs,Tbl:COMPLETE,Col:NONE,Output:["k1","v2","k3","v3"] + <-Map 6 [SIMPLE_EDGE] + SHUFFLE [RS_42] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=250 width=10) + Output:["_col0"] + Filter Operator [FIL_84] (rows=250 width=10) + predicate:((value) IN ('2000Q1', '2000Q2', '2000Q3') and key is not null) + TableScan [TS_3] (rows=500 width=10) + default@src,d1,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: explain SELECT x.key, z.value, y.value @@ -612,245 +460,138 @@ Reducer 5 <- Map 10 (SIMPLE_EDGE), Reducer 4 (SIMPLE_EDGE), Union 6 (CONTAINS) Reducer 7 <- Union 6 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 7 - File Output Operator [FS_59] - compressed:false - Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_57] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - |<-Union 6 [SIMPLE_EDGE] - |<-Reducer 15 [CONTAINS] - | Reduce Output Operator [RS_56] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_55] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_51] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_85] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col2 (type: string)","1":"_col0 (type: string)"} - | | outputColumnNames:["_col1","_col2"] - | | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - | |<-Map 18 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_49] - | | key expressions:_col0 (type: string) - | | Map-reduce partition columns:_col0 (type: string) - | | sort order:+ - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_44] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_81] - | | predicate:key is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_42] - | | alias:y - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 14 [SIMPLE_EDGE] - | Reduce Output Operator [RS_48] - | key expressions:_col2 (type: string) - | Map-reduce partition columns:_col2 (type: string) - | sort order:+ - | Statistics:Num rows: 288 Data size: 3020 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Merge Join Operator [MERGEJOIN_84] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: string)","1":"_col1 (type: string)"} - | | outputColumnNames:["_col1","_col2"] - | | Statistics:Num rows: 288 Data size: 3020 Basic stats: COMPLETE Column stats: NONE - | |<-Map 17 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_46] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: string) - | | Select Operator [SEL_41] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_80] - | | predicate:(key is not null and value is not null) (type: boolean) - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_39] - | | alias:x - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 13 [SIMPLE_EDGE] - | Reduce Output Operator [RS_45] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_38] - | outputColumnNames:["_col1"] - | Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_37] - | | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - | |<-Union 12 [SIMPLE_EDGE] - | |<-Map 11 [CONTAINS] - | | Reduce Output Operator [RS_36] - | | key expressions:_col0 (type: string), _col1 (type: string) - | | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | | sort order:++ - | | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | | Group By Operator [GBY_35] - | | keys:_col0 (type: string), _col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_28] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_78] - | | predicate:value is not null (type: boolean) - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_26] - | | alias:x - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | |<-Map 16 [CONTAINS] - | Reduce Output Operator [RS_36] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_35] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_31] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_79] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_29] - | alias:y - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [CONTAINS] - Reduce Output Operator [RS_56] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_55] - keys:_col0 (type: string), _col1 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_25] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_83] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col1","_col2"] - | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_23] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_18] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_77] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_16] - | alias:y - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_22] - key expressions:_col2 (type: string) - Map-reduce partition columns:_col2 (type: string) - sort order:+ - Statistics:Num rows: 288 Data size: 3020 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string) - Merge Join Operator [MERGEJOIN_82] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: string)","1":"_col1 (type: string)"} - | outputColumnNames:["_col1","_col2"] - | Statistics:Num rows: 288 Data size: 3020 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_20] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: string) - | Select Operator [SEL_15] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_76] - | predicate:(key is not null and value is not null) (type: boolean) - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_13] - | alias:x - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_19] - key expressions:_col1 (type: string) - Map-reduce partition columns:_col1 (type: string) - sort order:+ - Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_12] - outputColumnNames:["_col1"] - Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_11] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - |<-Union 2 [SIMPLE_EDGE] - |<-Map 1 [CONTAINS] - | Reduce Output Operator [RS_10] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_9] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_74] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:x - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - |<-Map 8 [CONTAINS] - Reduce Output Operator [RS_10] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_9] - keys:_col0 (type: string), _col1 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_75] - predicate:value is not null (type: boolean) - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:y - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 7 + File Output Operator [FS_59] + Group By Operator [GBY_57] (rows=550 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 6 [SIMPLE_EDGE] + <-Reducer 15 [CONTAINS] + Reduce Output Operator [RS_56] + PartitionCols:_col0, _col1 + Group By Operator [GBY_55] (rows=1100 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_51] (rows=550 width=10) + Output:["_col0","_col1"] + Merge Join Operator [MERGEJOIN_85] (rows=550 width=10) + Output:["_col1","_col2"],keys:{"0":"_col2","1":"_col0"} + <-Map 18 [SIMPLE_EDGE] + SHUFFLE [RS_49] + PartitionCols:_col0 + Select Operator [SEL_44] (rows=500 width=10) + Output:["_col0"] + Filter Operator [FIL_81] (rows=500 width=10) + predicate:key is not null + TableScan [TS_42] (rows=500 width=10) + default@src,y,Tbl:COMPLETE,Col:NONE,Output:["key"] + <-Reducer 14 [SIMPLE_EDGE] + SHUFFLE [RS_48] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_84] (rows=288 width=10) + Output:["_col1","_col2"],keys:{"0":"_col1","1":"_col1"} + <-Map 17 [SIMPLE_EDGE] + SHUFFLE [RS_46] + PartitionCols:_col1 + Select Operator [SEL_41] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_80] (rows=25 width=7) + predicate:(key is not null and value is not null) + TableScan [TS_39] (rows=25 width=7) + default@src1,x,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Reducer 13 [SIMPLE_EDGE] + SHUFFLE [RS_45] + PartitionCols:_col1 + Select Operator [SEL_38] (rows=262 width=10) + Output:["_col1"] + Group By Operator [GBY_37] (rows=262 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 12 [SIMPLE_EDGE] + <-Map 11 [CONTAINS] + Reduce Output Operator [RS_36] + PartitionCols:_col0, _col1 + Group By Operator [GBY_35] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_28] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_78] (rows=25 width=7) + predicate:value is not null + TableScan [TS_26] (rows=25 width=7) + Output:["key","value"] + <-Map 16 [CONTAINS] + Reduce Output Operator [RS_36] + PartitionCols:_col0, _col1 + Group By Operator [GBY_35] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_31] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_79] (rows=500 width=10) + predicate:value is not null + TableScan [TS_29] (rows=500 width=10) + Output:["key","value"] + <-Reducer 5 [CONTAINS] + Reduce Output Operator [RS_56] + PartitionCols:_col0, _col1 + Group By Operator [GBY_55] (rows=1100 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_25] (rows=550 width=10) + Output:["_col0","_col1"] + Merge Join Operator [MERGEJOIN_83] (rows=550 width=10) + Output:["_col1","_col2"],keys:{"0":"_col2","1":"_col0"} + <-Map 10 [SIMPLE_EDGE] + SHUFFLE [RS_23] + PartitionCols:_col0 + Select Operator [SEL_18] (rows=500 width=10) + Output:["_col0"] + Filter Operator [FIL_77] (rows=500 width=10) + predicate:key is not null + TableScan [TS_16] (rows=500 width=10) + default@src,y,Tbl:COMPLETE,Col:NONE,Output:["key"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_22] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_82] (rows=288 width=10) + Output:["_col1","_col2"],keys:{"0":"_col1","1":"_col1"} + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_20] + PartitionCols:_col1 + Select Operator [SEL_15] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_76] (rows=25 width=7) + predicate:(key is not null and value is not null) + TableScan [TS_13] (rows=25 width=7) + default@src1,x,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col1 + Select Operator [SEL_12] (rows=262 width=10) + Output:["_col1"] + Group By Operator [GBY_11] (rows=262 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 2 [SIMPLE_EDGE] + <-Map 1 [CONTAINS] + Reduce Output Operator [RS_10] + PartitionCols:_col0, _col1 + Group By Operator [GBY_9] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_2] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_74] (rows=25 width=7) + predicate:value is not null + TableScan [TS_0] (rows=25 width=7) + Output:["key","value"] + <-Map 8 [CONTAINS] + Reduce Output Operator [RS_10] + PartitionCols:_col0, _col1 + Group By Operator [GBY_9] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_5] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_75] (rows=500 width=10) + predicate:value is not null + TableScan [TS_3] (rows=500 width=10) + Output:["key","value"] PREHOOK: query: explain SELECT x.key, y.value @@ -906,475 +647,265 @@ Reducer 7 <- Union 6 (SIMPLE_EDGE), Union 8 (CONTAINS) Reducer 9 <- Union 8 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 9 - File Output Operator [FS_122] - compressed:false - Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_120] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - |<-Union 8 [SIMPLE_EDGE] - |<-Reducer 32 [CONTAINS] - | Reduce Output Operator [RS_119] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_118] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_114] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_170] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col2 (type: string)","1":"_col0 (type: string)"} - | | outputColumnNames:["_col2","_col5"] - | | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - | |<-Map 37 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_112] - | | key expressions:_col0 (type: string) - | | Map-reduce partition columns:_col0 (type: string) - | | sort order:+ - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: string) - | | Select Operator [SEL_107] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_164] - | | predicate:key is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_105] - | | alias:y - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 31 [SIMPLE_EDGE] - | Reduce Output Operator [RS_111] - | key expressions:_col2 (type: string) - | Map-reduce partition columns:_col2 (type: string) - | sort order:+ - | Statistics:Num rows: 484 Data size: 5131 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_169] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: string)","1":"_col1 (type: string)"} - | | outputColumnNames:["_col2"] - | | Statistics:Num rows: 484 Data size: 5131 Basic stats: COMPLETE Column stats: NONE - | |<-Map 36 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_109] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: string) - | | Select Operator [SEL_104] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_163] - | | predicate:(key is not null and value is not null) (type: boolean) - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_102] - | | alias:x - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 30 [SIMPLE_EDGE] - | Reduce Output Operator [RS_108] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 440 Data size: 4665 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_101] - | outputColumnNames:["_col1"] - | Statistics:Num rows: 440 Data size: 4665 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_100] - | | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 440 Data size: 4665 Basic stats: COMPLETE Column stats: NONE - | |<-Union 29 [SIMPLE_EDGE] - | |<-Map 35 [CONTAINS] - | | Reduce Output Operator [RS_99] - | | key expressions:_col0 (type: string), _col1 (type: string) - | | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | | sort order:++ - | | Statistics:Num rows: 881 Data size: 9341 Basic stats: COMPLETE Column stats: NONE - | | Group By Operator [GBY_98] - | | keys:_col0 (type: string), _col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 881 Data size: 9341 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_94] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_162] - | | predicate:value is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_92] - | | alias:y - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 28 [CONTAINS] - | Reduce Output Operator [RS_99] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 881 Data size: 9341 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_98] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 881 Data size: 9341 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_90] - | | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 381 Data size: 4029 Basic stats: COMPLETE Column stats: NONE - | |<-Union 27 [SIMPLE_EDGE] - | |<-Map 34 [CONTAINS] - | | Reduce Output Operator [RS_89] - | | key expressions:_col0 (type: string), _col1 (type: string) - | | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | | sort order:++ - | | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | | Group By Operator [GBY_88] - | | keys:_col0 (type: string), _col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_84] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_161] - | | predicate:value is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_82] - | | alias:y - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 26 [CONTAINS] - | Reduce Output Operator [RS_89] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_88] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_80] - | | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - | |<-Union 25 [SIMPLE_EDGE] - | |<-Map 24 [CONTAINS] - | | Reduce Output Operator [RS_79] - | | key expressions:_col0 (type: string), _col1 (type: string) - | | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | | sort order:++ - | | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | | Group By Operator [GBY_78] - | | keys:_col0 (type: string), _col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_71] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_159] - | | predicate:value is not null (type: boolean) - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_69] - | | alias:x - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | |<-Map 33 [CONTAINS] - | Reduce Output Operator [RS_79] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_78] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_74] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_160] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_72] - | alias:y - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 7 [CONTAINS] - Reduce Output Operator [RS_119] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_118] - keys:_col0 (type: string), _col1 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_67] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - |<-Union 6 [SIMPLE_EDGE] - |<-Reducer 19 [CONTAINS] - | Reduce Output Operator [RS_66] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_65] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_61] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_168] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col2 (type: string)","1":"_col0 (type: string)"} - | | outputColumnNames:["_col2","_col5"] - | | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - | |<-Map 23 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_59] - | | key expressions:_col0 (type: string) - | | Map-reduce partition columns:_col0 (type: string) - | | sort order:+ - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: string) - | | Select Operator [SEL_54] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_158] - | | predicate:key is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_52] - | | alias:y - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 18 [SIMPLE_EDGE] - | Reduce Output Operator [RS_58] - | key expressions:_col2 (type: string) - | Map-reduce partition columns:_col2 (type: string) - | sort order:+ - | Statistics:Num rows: 419 Data size: 4431 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_167] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: string)","1":"_col1 (type: string)"} - | | outputColumnNames:["_col2"] - | | Statistics:Num rows: 419 Data size: 4431 Basic stats: COMPLETE Column stats: NONE - | |<-Map 22 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_56] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: string) - | | Select Operator [SEL_51] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_157] - | | predicate:(key is not null and value is not null) (type: boolean) - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_49] - | | alias:x - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 17 [SIMPLE_EDGE] - | Reduce Output Operator [RS_55] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 381 Data size: 4029 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_48] - | outputColumnNames:["_col1"] - | Statistics:Num rows: 381 Data size: 4029 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_47] - | | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 381 Data size: 4029 Basic stats: COMPLETE Column stats: NONE - | |<-Union 16 [SIMPLE_EDGE] - | |<-Map 21 [CONTAINS] - | | Reduce Output Operator [RS_46] - | | key expressions:_col0 (type: string), _col1 (type: string) - | | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | | sort order:++ - | | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | | Group By Operator [GBY_45] - | | keys:_col0 (type: string), _col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_41] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_156] - | | predicate:value is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_39] - | | alias:y - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 15 [CONTAINS] - | Reduce Output Operator [RS_46] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_45] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_37] - | | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - | |<-Union 14 [SIMPLE_EDGE] - | |<-Map 13 [CONTAINS] - | | Reduce Output Operator [RS_36] - | | key expressions:_col0 (type: string), _col1 (type: string) - | | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | | sort order:++ - | | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | | Group By Operator [GBY_35] - | | keys:_col0 (type: string), _col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_28] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_154] - | | predicate:value is not null (type: boolean) - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_26] - | | alias:x - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | |<-Map 20 [CONTAINS] - | Reduce Output Operator [RS_36] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_35] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_31] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_155] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_29] - | alias:y - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [CONTAINS] - Reduce Output Operator [RS_66] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_65] - keys:_col0 (type: string), _col1 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_25] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_166] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col2","_col5"] - | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - |<-Map 12 [SIMPLE_EDGE] - | Reduce Output Operator [RS_23] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_18] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_153] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_16] - | alias:y - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_22] - key expressions:_col2 (type: string) - Map-reduce partition columns:_col2 (type: string) - sort order:+ - Statistics:Num rows: 288 Data size: 3020 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_165] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: string)","1":"_col1 (type: string)"} - | outputColumnNames:["_col2"] - | Statistics:Num rows: 288 Data size: 3020 Basic stats: COMPLETE Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_20] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: string) - | Select Operator [SEL_15] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_152] - | predicate:(key is not null and value is not null) (type: boolean) - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_13] - | alias:x - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_19] - key expressions:_col1 (type: string) - Map-reduce partition columns:_col1 (type: string) - sort order:+ - Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_12] - outputColumnNames:["_col1"] - Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_11] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - |<-Union 2 [SIMPLE_EDGE] - |<-Map 1 [CONTAINS] - | Reduce Output Operator [RS_10] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_9] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_150] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:x - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [CONTAINS] - Reduce Output Operator [RS_10] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_9] - keys:_col0 (type: string), _col1 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_151] - predicate:value is not null (type: boolean) - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:y - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 9 + File Output Operator [FS_122] + Group By Operator [GBY_120] (rows=550 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 8 [SIMPLE_EDGE] + <-Reducer 32 [CONTAINS] + Reduce Output Operator [RS_119] + PartitionCols:_col0, _col1 + Group By Operator [GBY_118] (rows=1100 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_114] (rows=550 width=10) + Output:["_col0","_col1"] + Merge Join Operator [MERGEJOIN_170] (rows=550 width=10) + Output:["_col2","_col5"],keys:{"0":"_col2","1":"_col0"} + <-Map 37 [SIMPLE_EDGE] + SHUFFLE [RS_112] + PartitionCols:_col0 + Select Operator [SEL_107] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_164] (rows=500 width=10) + predicate:key is not null + TableScan [TS_105] (rows=500 width=10) + default@src,y,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Reducer 31 [SIMPLE_EDGE] + SHUFFLE [RS_111] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_169] (rows=484 width=10) + Output:["_col2"],keys:{"0":"_col1","1":"_col1"} + <-Map 36 [SIMPLE_EDGE] + SHUFFLE [RS_109] + PartitionCols:_col1 + Select Operator [SEL_104] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_163] (rows=25 width=7) + predicate:(key is not null and value is not null) + TableScan [TS_102] (rows=25 width=7) + default@src1,x,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Reducer 30 [SIMPLE_EDGE] + SHUFFLE [RS_108] + PartitionCols:_col1 + Select Operator [SEL_101] (rows=440 width=10) + Output:["_col1"] + Group By Operator [GBY_100] (rows=440 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 29 [SIMPLE_EDGE] + <-Map 35 [CONTAINS] + Reduce Output Operator [RS_99] + PartitionCols:_col0, _col1 + Group By Operator [GBY_98] (rows=881 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_94] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_162] (rows=500 width=10) + predicate:value is not null + TableScan [TS_92] (rows=500 width=10) + Output:["key","value"] + <-Reducer 28 [CONTAINS] + Reduce Output Operator [RS_99] + PartitionCols:_col0, _col1 + Group By Operator [GBY_98] (rows=881 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Group By Operator [GBY_90] (rows=381 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 27 [SIMPLE_EDGE] + <-Map 34 [CONTAINS] + Reduce Output Operator [RS_89] + PartitionCols:_col0, _col1 + Group By Operator [GBY_88] (rows=762 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_84] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_161] (rows=500 width=10) + predicate:value is not null + TableScan [TS_82] (rows=500 width=10) + Output:["key","value"] + <-Reducer 26 [CONTAINS] + Reduce Output Operator [RS_89] + PartitionCols:_col0, _col1 + Group By Operator [GBY_88] (rows=762 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Group By Operator [GBY_80] (rows=262 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 25 [SIMPLE_EDGE] + <-Map 24 [CONTAINS] + Reduce Output Operator [RS_79] + PartitionCols:_col0, _col1 + Group By Operator [GBY_78] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_71] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_159] (rows=25 width=7) + predicate:value is not null + TableScan [TS_69] (rows=25 width=7) + Output:["key","value"] + <-Map 33 [CONTAINS] + Reduce Output Operator [RS_79] + PartitionCols:_col0, _col1 + Group By Operator [GBY_78] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_74] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_160] (rows=500 width=10) + predicate:value is not null + TableScan [TS_72] (rows=500 width=10) + Output:["key","value"] + <-Reducer 7 [CONTAINS] + Reduce Output Operator [RS_119] + PartitionCols:_col0, _col1 + Group By Operator [GBY_118] (rows=1100 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Group By Operator [GBY_67] (rows=550 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 6 [SIMPLE_EDGE] + <-Reducer 19 [CONTAINS] + Reduce Output Operator [RS_66] + PartitionCols:_col0, _col1 + Group By Operator [GBY_65] (rows=1100 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_61] (rows=550 width=10) + Output:["_col0","_col1"] + Merge Join Operator [MERGEJOIN_168] (rows=550 width=10) + Output:["_col2","_col5"],keys:{"0":"_col2","1":"_col0"} + <-Map 23 [SIMPLE_EDGE] + SHUFFLE [RS_59] + PartitionCols:_col0 + Select Operator [SEL_54] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_158] (rows=500 width=10) + predicate:key is not null + TableScan [TS_52] (rows=500 width=10) + default@src,y,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Reducer 18 [SIMPLE_EDGE] + SHUFFLE [RS_58] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_167] (rows=419 width=10) + Output:["_col2"],keys:{"0":"_col1","1":"_col1"} + <-Map 22 [SIMPLE_EDGE] + SHUFFLE [RS_56] + PartitionCols:_col1 + Select Operator [SEL_51] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_157] (rows=25 width=7) + predicate:(key is not null and value is not null) + TableScan [TS_49] (rows=25 width=7) + default@src1,x,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Reducer 17 [SIMPLE_EDGE] + SHUFFLE [RS_55] + PartitionCols:_col1 + Select Operator [SEL_48] (rows=381 width=10) + Output:["_col1"] + Group By Operator [GBY_47] (rows=381 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 16 [SIMPLE_EDGE] + <-Map 21 [CONTAINS] + Reduce Output Operator [RS_46] + PartitionCols:_col0, _col1 + Group By Operator [GBY_45] (rows=762 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_41] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_156] (rows=500 width=10) + predicate:value is not null + TableScan [TS_39] (rows=500 width=10) + Output:["key","value"] + <-Reducer 15 [CONTAINS] + Reduce Output Operator [RS_46] + PartitionCols:_col0, _col1 + Group By Operator [GBY_45] (rows=762 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Group By Operator [GBY_37] (rows=262 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 14 [SIMPLE_EDGE] + <-Map 13 [CONTAINS] + Reduce Output Operator [RS_36] + PartitionCols:_col0, _col1 + Group By Operator [GBY_35] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_28] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_154] (rows=25 width=7) + predicate:value is not null + TableScan [TS_26] (rows=25 width=7) + Output:["key","value"] + <-Map 20 [CONTAINS] + Reduce Output Operator [RS_36] + PartitionCols:_col0, _col1 + Group By Operator [GBY_35] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_31] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_155] (rows=500 width=10) + predicate:value is not null + TableScan [TS_29] (rows=500 width=10) + Output:["key","value"] + <-Reducer 5 [CONTAINS] + Reduce Output Operator [RS_66] + PartitionCols:_col0, _col1 + Group By Operator [GBY_65] (rows=1100 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_25] (rows=550 width=10) + Output:["_col0","_col1"] + Merge Join Operator [MERGEJOIN_166] (rows=550 width=10) + Output:["_col2","_col5"],keys:{"0":"_col2","1":"_col0"} + <-Map 12 [SIMPLE_EDGE] + SHUFFLE [RS_23] + PartitionCols:_col0 + Select Operator [SEL_18] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_153] (rows=500 width=10) + predicate:key is not null + TableScan [TS_16] (rows=500 width=10) + default@src,y,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_22] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_165] (rows=288 width=10) + Output:["_col2"],keys:{"0":"_col1","1":"_col1"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_20] + PartitionCols:_col1 + Select Operator [SEL_15] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_152] (rows=25 width=7) + predicate:(key is not null and value is not null) + TableScan [TS_13] (rows=25 width=7) + default@src1,x,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col1 + Select Operator [SEL_12] (rows=262 width=10) + Output:["_col1"] + Group By Operator [GBY_11] (rows=262 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 2 [SIMPLE_EDGE] + <-Map 1 [CONTAINS] + Reduce Output Operator [RS_10] + PartitionCols:_col0, _col1 + Group By Operator [GBY_9] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_2] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_150] (rows=25 width=7) + predicate:value is not null + TableScan [TS_0] (rows=25 width=7) + Output:["key","value"] + <-Map 10 [CONTAINS] + Reduce Output Operator [RS_10] + PartitionCols:_col0, _col1 + Group By Operator [GBY_9] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_5] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_151] (rows=500 width=10) + predicate:value is not null + TableScan [TS_3] (rows=500 width=10) + Output:["key","value"] PREHOOK: query: EXPLAIN SELECT x.key, z.value, y.value @@ -1392,70 +923,41 @@ Vertex dependency in root stage Map 1 <- Map 2 (BROADCAST_EDGE), Map 3 (BROADCAST_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Map 1 - File Output Operator [FS_16] - compressed:false - Statistics:Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_15] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE - Map Join Operator [MAPJOIN_26] - | condition map:[{"":"Inner Join 0 to 1"}] - | HybridGraceHashJoin:true - | keys:{"Map 1":"_col3 (type: string)","Map 3":"_col0 (type: string)"} - | outputColumnNames:["_col0","_col3","_col6"] - | Statistics:Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE - |<-Map 3 [BROADCAST_EDGE] - | Reduce Output Operator [RS_13] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_8] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_24] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:y - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Map Join Operator [MAPJOIN_25] - | condition map:[{"":"Inner Join 0 to 1"}] - | HybridGraceHashJoin:true - | keys:{"Map 1":"_col0 (type: string)","Map 2":"_col1 (type: string)"} - | outputColumnNames:["_col0","_col3"] - | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - |<-Map 2 [BROADCAST_EDGE] - | Reduce Output Operator [RS_10] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: string) - | Select Operator [SEL_5] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_23] - | predicate:(key is not null and value is not null) (type: boolean) - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_3] - | alias:x - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - |<-Select Operator [SEL_2] - outputColumnNames:["_col0"] - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_22] - predicate:value is not null (type: boolean) - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_0] - alias:z - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Map 1 + File Output Operator [FS_16] + Select Operator [SEL_15] (rows=605 width=10) + Output:["_col0","_col1","_col2"] + Map Join Operator [MAPJOIN_26] (rows=605 width=10) + HybridGraceHashJoin:true,Output:["_col0","_col3","_col6"],keys:{"MAPJOIN_25":"_col3","RS_13":"_col0"} + <-Map 3 [BROADCAST_EDGE] + BROADCAST [RS_13] + PartitionCols:_col0 + Select Operator [SEL_8] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_24] (rows=500 width=10) + predicate:key is not null + TableScan [TS_6] (rows=500 width=10) + default@src,y,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map Join Operator [MAPJOIN_25] (rows=550 width=10) + HybridGraceHashJoin:true,Output:["_col0","_col3"],keys:{"SEL_2":"_col0","RS_10":"_col1"} + <-Map 2 [BROADCAST_EDGE] + BROADCAST [RS_10] + PartitionCols:_col1 + Select Operator [SEL_5] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_23] (rows=25 width=7) + predicate:(key is not null and value is not null) + TableScan [TS_3] (rows=25 width=7) + default@src1,x,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Select Operator [SEL_2] (rows=500 width=10) + Output:["_col0"] + Filter Operator [FIL_22] (rows=500 width=10) + predicate:value is not null + TableScan [TS_0] (rows=500 width=10) + default@srcpart,z,Tbl:COMPLETE,Col:NONE,Output:["value"] PREHOOK: query: EXPLAIN select @@ -1523,212 +1025,113 @@ Reducer 4 <- Map 3 (SIMPLE_EDGE) Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:100 - Stage-1 - Reducer 5 - File Output Operator [FS_55] - compressed:false - Statistics:Num rows: 100 Data size: 1000 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_54] - Number of rows:100 - Statistics:Num rows: 100 Data size: 1000 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_53] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 805 Data size: 8553 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_52] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string) - sort order:+++ - Statistics:Num rows: 805 Data size: 8553 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: bigint), _col4 (type: bigint), _col5 (type: bigint) - Select Operator [SEL_51] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 805 Data size: 8553 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_50] - | aggregations:["count(VALUE._col0)","count(VALUE._col1)","count(VALUE._col2)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: string), KEY._col2 (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - | Statistics:Num rows: 805 Data size: 8553 Basic stats: COMPLETE Column stats: NONE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_49] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string), _col2 (type: string) - sort order:+++ - Statistics:Num rows: 1610 Data size: 17107 Basic stats: COMPLETE Column stats: NONE - value expressions:_col3 (type: bigint), _col4 (type: bigint), _col5 (type: bigint) - Group By Operator [GBY_48] - aggregations:["count(_col13)","count(_col21)","count(_col3)"] - keys:_col2 (type: string), _col12 (type: string), _col20 (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3","_col4","_col5"] - Statistics:Num rows: 1610 Data size: 17107 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_47] - outputColumnNames:["_col2","_col12","_col20","_col13","_col21","_col3"] - Statistics:Num rows: 1610 Data size: 17107 Basic stats: COMPLETE Column stats: NONE - Map Join Operator [MAPJOIN_97] - | condition map:[{"":"Inner Join 0 to 1"}] - | HybridGraceHashJoin:true - | keys:{"Map 1":"_col1 (type: string), _col3 (type: string)","Map 3":"_col15 (type: string), _col17 (type: string)"} - | outputColumnNames:["_col2","_col3","_col12","_col13","_col20","_col21"] - | Statistics:Num rows: 1610 Data size: 17107 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [BROADCAST_EDGE] - | Reduce Output Operator [RS_44] - | key expressions:_col1 (type: string), _col3 (type: string) - | Map-reduce partition columns:_col1 (type: string), _col3 (type: string) - | sort order:++ - | Statistics:Num rows: 275 Data size: 2921 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col2 (type: string) - | Map Join Operator [MAPJOIN_91] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | HybridGraceHashJoin:true - | | keys:{"Map 1":"_col0 (type: string)","Map 2":"_col0 (type: string)"} - | | outputColumnNames:["_col1","_col2","_col3"] - | | Statistics:Num rows: 275 Data size: 2921 Basic stats: COMPLETE Column stats: NONE - | |<-Map 2 [BROADCAST_EDGE] - | | Reduce Output Operator [RS_42] - | | key expressions:_col0 (type: string) - | | Map-reduce partition columns:_col0 (type: string) - | | sort order:+ - | | Statistics:Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_5] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_84] - | | predicate:((value) IN ('2000Q1', '2000Q2', '2000Q3') and key is not null) (type: boolean) - | | Statistics:Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_3] - | | alias:d1 - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 170 Data size: 5890 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_83] - | predicate:((v3 is not null and v2 is not null) and k1 is not null) (type: boolean) - | Statistics:Num rows: 170 Data size: 5890 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:cs - | Statistics:Num rows: 170 Data size: 5890 Basic stats: COMPLETE Column stats: NONE - |<-Select Operator [SEL_40] - outputColumnNames:["_col14","_col15","_col17","_col6","_col7"] - Statistics:Num rows: 1464 Data size: 15552 Basic stats: COMPLETE Column stats: NONE - Map Join Operator [MAPJOIN_96] - | condition map:[{"":"Inner Join 0 to 1"}] - | HybridGraceHashJoin:true - | keys:{"Map 3":"_col4 (type: string), _col6 (type: string)","Map 10":"_col2 (type: string), _col4 (type: string)"} - | outputColumnNames:["_col2","_col3","_col14","_col15","_col17"] - | Statistics:Num rows: 1464 Data size: 15552 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [BROADCAST_EDGE] - | Reduce Output Operator [RS_38] - | key expressions:_col2 (type: string), _col4 (type: string) - | Map-reduce partition columns:_col2 (type: string), _col4 (type: string) - | sort order:++ - | Statistics:Num rows: 275 Data size: 2921 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col3 (type: string), _col5 (type: string) - | Map Join Operator [MAPJOIN_95] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | HybridGraceHashJoin:true - | | keys:{"Map 9":"_col0 (type: string)","Map 10":"_col0 (type: string)"} - | | outputColumnNames:["_col2","_col3","_col4","_col5"] - | | Statistics:Num rows: 275 Data size: 2921 Basic stats: COMPLETE Column stats: NONE - | |<-Map 9 [BROADCAST_EDGE] - | | Reduce Output Operator [RS_24] - | | key expressions:_col0 (type: string) - | | Map-reduce partition columns:_col0 (type: string) - | | sort order:+ - | | Statistics:Num rows: 42 Data size: 1455 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col2 (type: string), _col3 (type: string), _col4 (type: string), _col5 (type: string) - | | Select Operator [SEL_20] - | | outputColumnNames:["_col0","_col2","_col3","_col4","_col5"] - | | Statistics:Num rows: 42 Data size: 1455 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_89] - | | predicate:((((((v1 = 'srv1') and k3 is not null) and k2 is not null) and v3 is not null) and v2 is not null) and k1 is not null) (type: boolean) - | | Statistics:Num rows: 42 Data size: 1455 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_18] - | | alias:sr - | | Statistics:Num rows: 85 Data size: 2945 Basic stats: COMPLETE Column stats: NONE - | |<-Select Operator [SEL_23] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_90] - | predicate:((value) IN ('2000Q1', '2000Q2', '2000Q3') and key is not null) (type: boolean) - | Statistics:Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_21] - | alias:d1 - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Map Join Operator [MAPJOIN_94] - | condition map:[{"":"Inner Join 0 to 1"}] - | HybridGraceHashJoin:true - | keys:{"Map 3":"_col3 (type: string)","Map 8":"_col1 (type: string)"} - | outputColumnNames:["_col2","_col3","_col4","_col6"] - | Statistics:Num rows: 1331 Data size: 14139 Basic stats: COMPLETE Column stats: NONE - |<-Map 8 [BROADCAST_EDGE] - | Reduce Output Operator [RS_35] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 12 Data size: 91 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_17] - | outputColumnNames:["_col1"] - | Statistics:Num rows: 12 Data size: 91 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_88] - | predicate:((key = 'src1key') and value is not null) (type: boolean) - | Statistics:Num rows: 12 Data size: 91 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_15] - | alias:src1 - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - |<-Map Join Operator [MAPJOIN_93] - | condition map:[{"":"Inner Join 0 to 1"}] - | HybridGraceHashJoin:true - | keys:{"Map 3":"_col2 (type: string)","Map 7":"_col0 (type: string)"} - | outputColumnNames:["_col2","_col3","_col4","_col6"] - | Statistics:Num rows: 1210 Data size: 12854 Basic stats: COMPLETE Column stats: NONE - |<-Map 7 [BROADCAST_EDGE] - | Reduce Output Operator [RS_32] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_14] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_87] - | predicate:((value = 'd1value') and key is not null) (type: boolean) - | Statistics:Num rows: 250 Data size: 2656 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_12] - | alias:d1 - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Map Join Operator [MAPJOIN_92] - | condition map:[{"":"Inner Join 0 to 1"}] - | HybridGraceHashJoin:true - | keys:{"Map 3":"_col1 (type: string)","Map 6":"_col3 (type: string)"} - | outputColumnNames:["_col2","_col3","_col4","_col6"] - | Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - |<-Map 6 [BROADCAST_EDGE] - | Reduce Output Operator [RS_29] - | key expressions:_col3 (type: string) - | Map-reduce partition columns:_col3 (type: string) - | sort order:+ - | Statistics:Num rows: 42 Data size: 1455 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string), _col4 (type: string) - | Select Operator [SEL_11] - | outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - | Statistics:Num rows: 42 Data size: 1455 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_86] - | predicate:(((((k3 is not null and (v3 = 'ssv3')) and k2 is not null) and k1 is not null) and v1 is not null) and v2 is not null) (type: boolean) - | Statistics:Num rows: 42 Data size: 1455 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_9] - | alias:ss - | Statistics:Num rows: 85 Data size: 2945 Basic stats: COMPLETE Column stats: NONE - |<-Select Operator [SEL_8] - outputColumnNames:["_col1"] - Statistics:Num rows: 1000 Data size: 10624 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_85] - predicate:((key = 'srcpartkey') and value is not null) (type: boolean) - Statistics:Num rows: 1000 Data size: 10624 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_6] - alias:srcpart - Statistics:Num rows: 2000 Data size: 21248 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:100 + Stage-1 + Reducer 5 + File Output Operator [FS_55] + Limit [LIM_54] (rows=100 width=10) + Number of rows:100 + Select Operator [SEL_53] (rows=805 width=10) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_52] + Select Operator [SEL_51] (rows=805 width=10) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"] + Group By Operator [GBY_50] (rows=805 width=10) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["count(VALUE._col0)","count(VALUE._col1)","count(VALUE._col2)"],keys:KEY._col0, KEY._col1, KEY._col2 + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_49] + PartitionCols:_col0, _col1, _col2 + Group By Operator [GBY_48] (rows=1610 width=10) + Output:["_col0","_col1","_col2","_col3","_col4","_col5"],aggregations:["count(_col13)","count(_col21)","count(_col3)"],keys:_col2, _col12, _col20 + Select Operator [SEL_47] (rows=1610 width=10) + Output:["_col2","_col12","_col20","_col13","_col21","_col3"] + Map Join Operator [MAPJOIN_97] (rows=1610 width=10) + HybridGraceHashJoin:true,Output:["_col2","_col3","_col12","_col13","_col20","_col21"],keys:{"RS_44":"_col1, _col3","SEL_40":"_col15, _col17"} + <-Map 1 [BROADCAST_EDGE] + BROADCAST [RS_44] + PartitionCols:_col1, _col3 + Map Join Operator [MAPJOIN_91] (rows=275 width=10) + HybridGraceHashJoin:true,Output:["_col1","_col2","_col3"],keys:{"SEL_2":"_col0","RS_42":"_col0"} + <-Map 2 [BROADCAST_EDGE] + BROADCAST [RS_42] + PartitionCols:_col0 + Select Operator [SEL_5] (rows=250 width=10) + Output:["_col0"] + Filter Operator [FIL_84] (rows=250 width=10) + predicate:((value) IN ('2000Q1', '2000Q2', '2000Q3') and key is not null) + TableScan [TS_3] (rows=500 width=10) + default@src,d1,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Select Operator [SEL_2] (rows=170 width=34) + Output:["_col0","_col1","_col2","_col3"] + Filter Operator [FIL_83] (rows=170 width=34) + predicate:((v3 is not null and v2 is not null) and k1 is not null) + TableScan [TS_0] (rows=170 width=34) + default@cs,cs,Tbl:COMPLETE,Col:NONE,Output:["k1","v2","k3","v3"] + <-Select Operator [SEL_40] (rows=1464 width=10) + Output:["_col14","_col15","_col17","_col6","_col7"] + Map Join Operator [MAPJOIN_96] (rows=1464 width=10) + HybridGraceHashJoin:true,Output:["_col2","_col3","_col14","_col15","_col17"],keys:{"MAPJOIN_94":"_col4, _col6","RS_38":"_col2, _col4"} + <-Map 10 [BROADCAST_EDGE] + BROADCAST [RS_38] + PartitionCols:_col2, _col4 + Map Join Operator [MAPJOIN_95] (rows=275 width=10) + HybridGraceHashJoin:true,Output:["_col2","_col3","_col4","_col5"],keys:{"RS_24":"_col0","SEL_23":"_col0"} + <-Map 9 [BROADCAST_EDGE] + BROADCAST [RS_24] + PartitionCols:_col0 + Select Operator [SEL_20] (rows=42 width=34) + Output:["_col0","_col2","_col3","_col4","_col5"] + Filter Operator [FIL_89] (rows=42 width=34) + predicate:((((((v1 = 'srv1') and k3 is not null) and k2 is not null) and v3 is not null) and v2 is not null) and k1 is not null) + TableScan [TS_18] (rows=85 width=34) + default@sr,sr,Tbl:COMPLETE,Col:NONE,Output:["k1","v1","k2","v2","k3","v3"] + <-Select Operator [SEL_23] (rows=250 width=10) + Output:["_col0"] + Filter Operator [FIL_90] (rows=250 width=10) + predicate:((value) IN ('2000Q1', '2000Q2', '2000Q3') and key is not null) + TableScan [TS_21] (rows=500 width=10) + default@src,d1,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map Join Operator [MAPJOIN_94] (rows=1331 width=10) + HybridGraceHashJoin:true,Output:["_col2","_col3","_col4","_col6"],keys:{"MAPJOIN_93":"_col3","RS_35":"_col1"} + <-Map 8 [BROADCAST_EDGE] + BROADCAST [RS_35] + PartitionCols:_col1 + Select Operator [SEL_17] (rows=12 width=7) + Output:["_col1"] + Filter Operator [FIL_88] (rows=12 width=7) + predicate:((key = 'src1key') and value is not null) + TableScan [TS_15] (rows=25 width=7) + default@src1,src1,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map Join Operator [MAPJOIN_93] (rows=1210 width=10) + HybridGraceHashJoin:true,Output:["_col2","_col3","_col4","_col6"],keys:{"MAPJOIN_92":"_col2","RS_32":"_col0"} + <-Map 7 [BROADCAST_EDGE] + BROADCAST [RS_32] + PartitionCols:_col0 + Select Operator [SEL_14] (rows=250 width=10) + Output:["_col0"] + Filter Operator [FIL_87] (rows=250 width=10) + predicate:((value = 'd1value') and key is not null) + TableScan [TS_12] (rows=500 width=10) + default@src,d1,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map Join Operator [MAPJOIN_92] (rows=1100 width=10) + HybridGraceHashJoin:true,Output:["_col2","_col3","_col4","_col6"],keys:{"SEL_8":"_col1","RS_29":"_col3"} + <-Map 6 [BROADCAST_EDGE] + BROADCAST [RS_29] + PartitionCols:_col3 + Select Operator [SEL_11] (rows=42 width=34) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_86] (rows=42 width=34) + predicate:(((((k3 is not null and (v3 = 'ssv3')) and k2 is not null) and k1 is not null) and v1 is not null) and v2 is not null) + TableScan [TS_9] (rows=85 width=34) + default@ss,ss,Tbl:COMPLETE,Col:NONE,Output:["k1","v1","k2","v2","k3","v3"] + <-Select Operator [SEL_8] (rows=1000 width=10) + Output:["_col1"] + Filter Operator [FIL_85] (rows=1000 width=10) + predicate:((key = 'srcpartkey') and value is not null) + TableScan [TS_6] (rows=2000 width=10) + default@srcpart,srcpart,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: explain SELECT x.key, z.value, y.value @@ -1760,223 +1163,126 @@ Reducer 3 <- Map 7 (BROADCAST_EDGE), Map 8 (BROADCAST_EDGE), Union 2 (SIMPLE_EDG Reducer 5 <- Union 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 5 - File Output Operator [FS_59] - compressed:false - Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_57] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - |<-Union 4 [SIMPLE_EDGE] - |<-Reducer 11 [CONTAINS] - | Reduce Output Operator [RS_56] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_55] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_51] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - | Map Join Operator [MAPJOIN_85] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | HybridGraceHashJoin:true - | | keys:{"Reducer 11":"_col2 (type: string)","Map 14":"_col0 (type: string)"} - | | outputColumnNames:["_col1","_col2"] - | | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - | |<-Map 14 [BROADCAST_EDGE] - | | Reduce Output Operator [RS_49] - | | key expressions:_col0 (type: string) - | | Map-reduce partition columns:_col0 (type: string) - | | sort order:+ - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_44] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_81] - | | predicate:key is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_42] - | | alias:y - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Map Join Operator [MAPJOIN_84] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | HybridGraceHashJoin:true - | | keys:{"Reducer 11":"_col1 (type: string)","Map 13":"_col1 (type: string)"} - | | outputColumnNames:["_col1","_col2"] - | | Statistics:Num rows: 288 Data size: 3020 Basic stats: COMPLETE Column stats: NONE - | |<-Map 13 [BROADCAST_EDGE] - | | Reduce Output Operator [RS_46] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: string) - | | Select Operator [SEL_41] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_80] - | | predicate:(key is not null and value is not null) (type: boolean) - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_39] - | | alias:x - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | |<-Select Operator [SEL_38] - | outputColumnNames:["_col1"] - | Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_37] - | | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - | |<-Union 10 [SIMPLE_EDGE] - | |<-Map 12 [CONTAINS] - | | Reduce Output Operator [RS_36] - | | key expressions:_col0 (type: string), _col1 (type: string) - | | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | | sort order:++ - | | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | | Group By Operator [GBY_35] - | | keys:_col0 (type: string), _col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_31] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_79] - | | predicate:value is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_29] - | | alias:y - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Map 9 [CONTAINS] - | Reduce Output Operator [RS_36] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_35] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_28] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_78] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_26] - | alias:x - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [CONTAINS] - Reduce Output Operator [RS_56] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_55] - keys:_col0 (type: string), _col1 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_25] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - Map Join Operator [MAPJOIN_83] - | condition map:[{"":"Inner Join 0 to 1"}] - | HybridGraceHashJoin:true - | keys:{"Reducer 3":"_col2 (type: string)","Map 8":"_col0 (type: string)"} - | outputColumnNames:["_col1","_col2"] - | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - |<-Map 8 [BROADCAST_EDGE] - | Reduce Output Operator [RS_23] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_18] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_77] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_16] - | alias:y - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Map Join Operator [MAPJOIN_82] - | condition map:[{"":"Inner Join 0 to 1"}] - | HybridGraceHashJoin:true - | keys:{"Reducer 3":"_col1 (type: string)","Map 7":"_col1 (type: string)"} - | outputColumnNames:["_col1","_col2"] - | Statistics:Num rows: 288 Data size: 3020 Basic stats: COMPLETE Column stats: NONE - |<-Map 7 [BROADCAST_EDGE] - | Reduce Output Operator [RS_20] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: string) - | Select Operator [SEL_15] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_76] - | predicate:(key is not null and value is not null) (type: boolean) - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_13] - | alias:x - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - |<-Select Operator [SEL_12] - outputColumnNames:["_col1"] - Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_11] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - |<-Union 2 [SIMPLE_EDGE] - |<-Map 1 [CONTAINS] - | Reduce Output Operator [RS_10] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_9] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_74] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:x - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - |<-Map 6 [CONTAINS] - Reduce Output Operator [RS_10] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_9] - keys:_col0 (type: string), _col1 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_75] - predicate:value is not null (type: boolean) - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:y - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 5 + File Output Operator [FS_59] + Group By Operator [GBY_57] (rows=550 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 4 [SIMPLE_EDGE] + <-Reducer 11 [CONTAINS] + Reduce Output Operator [RS_56] + PartitionCols:_col0, _col1 + Group By Operator [GBY_55] (rows=1100 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_51] (rows=550 width=10) + Output:["_col0","_col1"] + Map Join Operator [MAPJOIN_85] (rows=550 width=10) + HybridGraceHashJoin:true,Output:["_col1","_col2"],keys:{"MAPJOIN_84":"_col2","RS_49":"_col0"} + <-Map 14 [BROADCAST_EDGE] + BROADCAST [RS_49] + PartitionCols:_col0 + Select Operator [SEL_44] (rows=500 width=10) + Output:["_col0"] + Filter Operator [FIL_81] (rows=500 width=10) + predicate:key is not null + TableScan [TS_42] (rows=500 width=10) + default@src,y,Tbl:COMPLETE,Col:NONE,Output:["key"] + <-Map Join Operator [MAPJOIN_84] (rows=288 width=10) + HybridGraceHashJoin:true,Output:["_col1","_col2"],keys:{"SEL_38":"_col1","RS_46":"_col1"} + <-Map 13 [BROADCAST_EDGE] + BROADCAST [RS_46] + PartitionCols:_col1 + Select Operator [SEL_41] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_80] (rows=25 width=7) + predicate:(key is not null and value is not null) + TableScan [TS_39] (rows=25 width=7) + default@src1,x,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Select Operator [SEL_38] (rows=262 width=10) + Output:["_col1"] + Group By Operator [GBY_37] (rows=262 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 10 [SIMPLE_EDGE] + <-Map 12 [CONTAINS] + Reduce Output Operator [RS_36] + PartitionCols:_col0, _col1 + Group By Operator [GBY_35] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_31] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_79] (rows=500 width=10) + predicate:value is not null + TableScan [TS_29] (rows=500 width=10) + Output:["key","value"] + <-Map 9 [CONTAINS] + Reduce Output Operator [RS_36] + PartitionCols:_col0, _col1 + Group By Operator [GBY_35] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_28] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_78] (rows=25 width=7) + predicate:value is not null + TableScan [TS_26] (rows=25 width=7) + Output:["key","value"] + <-Reducer 3 [CONTAINS] + Reduce Output Operator [RS_56] + PartitionCols:_col0, _col1 + Group By Operator [GBY_55] (rows=1100 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_25] (rows=550 width=10) + Output:["_col0","_col1"] + Map Join Operator [MAPJOIN_83] (rows=550 width=10) + HybridGraceHashJoin:true,Output:["_col1","_col2"],keys:{"MAPJOIN_82":"_col2","RS_23":"_col0"} + <-Map 8 [BROADCAST_EDGE] + BROADCAST [RS_23] + PartitionCols:_col0 + Select Operator [SEL_18] (rows=500 width=10) + Output:["_col0"] + Filter Operator [FIL_77] (rows=500 width=10) + predicate:key is not null + TableScan [TS_16] (rows=500 width=10) + default@src,y,Tbl:COMPLETE,Col:NONE,Output:["key"] + <-Map Join Operator [MAPJOIN_82] (rows=288 width=10) + HybridGraceHashJoin:true,Output:["_col1","_col2"],keys:{"SEL_12":"_col1","RS_20":"_col1"} + <-Map 7 [BROADCAST_EDGE] + BROADCAST [RS_20] + PartitionCols:_col1 + Select Operator [SEL_15] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_76] (rows=25 width=7) + predicate:(key is not null and value is not null) + TableScan [TS_13] (rows=25 width=7) + default@src1,x,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Select Operator [SEL_12] (rows=262 width=10) + Output:["_col1"] + Group By Operator [GBY_11] (rows=262 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 2 [SIMPLE_EDGE] + <-Map 1 [CONTAINS] + Reduce Output Operator [RS_10] + PartitionCols:_col0, _col1 + Group By Operator [GBY_9] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_2] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_74] (rows=25 width=7) + predicate:value is not null + TableScan [TS_0] (rows=25 width=7) + Output:["key","value"] + <-Map 6 [CONTAINS] + Reduce Output Operator [RS_10] + PartitionCols:_col0, _col1 + Group By Operator [GBY_9] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_5] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_75] (rows=500 width=10) + predicate:value is not null + TableScan [TS_3] (rows=500 width=10) + Output:["key","value"] PREHOOK: query: explain SELECT x.key, y.value @@ -2026,445 +1332,247 @@ Reducer 5 <- Union 4 (SIMPLE_EDGE), Union 6 (CONTAINS) Reducer 7 <- Union 6 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 7 - File Output Operator [FS_122] - compressed:false - Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_120] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - |<-Union 6 [SIMPLE_EDGE] - |<-Reducer 26 [CONTAINS] - | Reduce Output Operator [RS_119] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_118] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_114] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - | Map Join Operator [MAPJOIN_170] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | HybridGraceHashJoin:true - | | keys:{"Reducer 26":"_col2 (type: string)","Map 31":"_col0 (type: string)"} - | | outputColumnNames:["_col2","_col5"] - | | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - | |<-Map 31 [BROADCAST_EDGE] - | | Reduce Output Operator [RS_112] - | | key expressions:_col0 (type: string) - | | Map-reduce partition columns:_col0 (type: string) - | | sort order:+ - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: string) - | | Select Operator [SEL_107] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_164] - | | predicate:key is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_105] - | | alias:y - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Map Join Operator [MAPJOIN_169] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | HybridGraceHashJoin:true - | | keys:{"Reducer 26":"_col1 (type: string)","Map 30":"_col1 (type: string)"} - | | outputColumnNames:["_col2"] - | | Statistics:Num rows: 484 Data size: 5131 Basic stats: COMPLETE Column stats: NONE - | |<-Map 30 [BROADCAST_EDGE] - | | Reduce Output Operator [RS_109] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: string) - | | Select Operator [SEL_104] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_163] - | | predicate:(key is not null and value is not null) (type: boolean) - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_102] - | | alias:x - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | |<-Select Operator [SEL_101] - | outputColumnNames:["_col1"] - | Statistics:Num rows: 440 Data size: 4665 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_100] - | | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 440 Data size: 4665 Basic stats: COMPLETE Column stats: NONE - | |<-Union 25 [SIMPLE_EDGE] - | |<-Map 29 [CONTAINS] - | | Reduce Output Operator [RS_99] - | | key expressions:_col0 (type: string), _col1 (type: string) - | | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | | sort order:++ - | | Statistics:Num rows: 881 Data size: 9341 Basic stats: COMPLETE Column stats: NONE - | | Group By Operator [GBY_98] - | | keys:_col0 (type: string), _col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 881 Data size: 9341 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_94] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_162] - | | predicate:value is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_92] - | | alias:y - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 24 [CONTAINS] - | Reduce Output Operator [RS_99] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 881 Data size: 9341 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_98] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 881 Data size: 9341 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_90] - | | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 381 Data size: 4029 Basic stats: COMPLETE Column stats: NONE - | |<-Union 23 [SIMPLE_EDGE] - | |<-Map 28 [CONTAINS] - | | Reduce Output Operator [RS_89] - | | key expressions:_col0 (type: string), _col1 (type: string) - | | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | | sort order:++ - | | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | | Group By Operator [GBY_88] - | | keys:_col0 (type: string), _col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_84] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_161] - | | predicate:value is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_82] - | | alias:y - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 22 [CONTAINS] - | Reduce Output Operator [RS_89] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_88] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_80] - | | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - | |<-Union 21 [SIMPLE_EDGE] - | |<-Map 20 [CONTAINS] - | | Reduce Output Operator [RS_79] - | | key expressions:_col0 (type: string), _col1 (type: string) - | | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | | sort order:++ - | | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | | Group By Operator [GBY_78] - | | keys:_col0 (type: string), _col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_71] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_159] - | | predicate:value is not null (type: boolean) - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_69] - | | alias:x - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | |<-Map 27 [CONTAINS] - | Reduce Output Operator [RS_79] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_78] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_74] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_160] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_72] - | alias:y - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 5 [CONTAINS] - Reduce Output Operator [RS_119] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_118] - keys:_col0 (type: string), _col1 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_67] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - |<-Union 4 [SIMPLE_EDGE] - |<-Reducer 15 [CONTAINS] - | Reduce Output Operator [RS_66] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_65] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_61] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - | Map Join Operator [MAPJOIN_168] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | HybridGraceHashJoin:true - | | keys:{"Reducer 15":"_col2 (type: string)","Map 19":"_col0 (type: string)"} - | | outputColumnNames:["_col2","_col5"] - | | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - | |<-Map 19 [BROADCAST_EDGE] - | | Reduce Output Operator [RS_59] - | | key expressions:_col0 (type: string) - | | Map-reduce partition columns:_col0 (type: string) - | | sort order:+ - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: string) - | | Select Operator [SEL_54] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_158] - | | predicate:key is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_52] - | | alias:y - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Map Join Operator [MAPJOIN_167] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | HybridGraceHashJoin:true - | | keys:{"Reducer 15":"_col1 (type: string)","Map 18":"_col1 (type: string)"} - | | outputColumnNames:["_col2"] - | | Statistics:Num rows: 419 Data size: 4431 Basic stats: COMPLETE Column stats: NONE - | |<-Map 18 [BROADCAST_EDGE] - | | Reduce Output Operator [RS_56] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: string) - | | Select Operator [SEL_51] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_157] - | | predicate:(key is not null and value is not null) (type: boolean) - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_49] - | | alias:x - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | |<-Select Operator [SEL_48] - | outputColumnNames:["_col1"] - | Statistics:Num rows: 381 Data size: 4029 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_47] - | | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 381 Data size: 4029 Basic stats: COMPLETE Column stats: NONE - | |<-Union 14 [SIMPLE_EDGE] - | |<-Map 17 [CONTAINS] - | | Reduce Output Operator [RS_46] - | | key expressions:_col0 (type: string), _col1 (type: string) - | | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | | sort order:++ - | | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | | Group By Operator [GBY_45] - | | keys:_col0 (type: string), _col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_41] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_156] - | | predicate:value is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_39] - | | alias:y - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 13 [CONTAINS] - | Reduce Output Operator [RS_46] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_45] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_37] - | | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - | |<-Union 12 [SIMPLE_EDGE] - | |<-Map 11 [CONTAINS] - | | Reduce Output Operator [RS_36] - | | key expressions:_col0 (type: string), _col1 (type: string) - | | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | | sort order:++ - | | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | | Group By Operator [GBY_35] - | | keys:_col0 (type: string), _col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_28] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_154] - | | predicate:value is not null (type: boolean) - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_26] - | | alias:x - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | |<-Map 16 [CONTAINS] - | Reduce Output Operator [RS_36] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_35] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_31] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_155] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_29] - | alias:y - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [CONTAINS] - Reduce Output Operator [RS_66] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_65] - keys:_col0 (type: string), _col1 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1100 Data size: 11686 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_25] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - Map Join Operator [MAPJOIN_166] - | condition map:[{"":"Inner Join 0 to 1"}] - | HybridGraceHashJoin:true - | keys:{"Reducer 3":"_col2 (type: string)","Map 10":"_col0 (type: string)"} - | outputColumnNames:["_col2","_col5"] - | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [BROADCAST_EDGE] - | Reduce Output Operator [RS_23] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_18] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_153] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_16] - | alias:y - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Map Join Operator [MAPJOIN_165] - | condition map:[{"":"Inner Join 0 to 1"}] - | HybridGraceHashJoin:true - | keys:{"Reducer 3":"_col1 (type: string)","Map 9":"_col1 (type: string)"} - | outputColumnNames:["_col2"] - | Statistics:Num rows: 288 Data size: 3020 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [BROADCAST_EDGE] - | Reduce Output Operator [RS_20] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: string) - | Select Operator [SEL_15] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_152] - | predicate:(key is not null and value is not null) (type: boolean) - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_13] - | alias:x - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - |<-Select Operator [SEL_12] - outputColumnNames:["_col1"] - Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_11] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - |<-Union 2 [SIMPLE_EDGE] - |<-Map 1 [CONTAINS] - | Reduce Output Operator [RS_10] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_9] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_150] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:x - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - |<-Map 8 [CONTAINS] - Reduce Output Operator [RS_10] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_9] - keys:_col0 (type: string), _col1 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_151] - predicate:value is not null (type: boolean) - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:y - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 7 + File Output Operator [FS_122] + Group By Operator [GBY_120] (rows=550 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 6 [SIMPLE_EDGE] + <-Reducer 26 [CONTAINS] + Reduce Output Operator [RS_119] + PartitionCols:_col0, _col1 + Group By Operator [GBY_118] (rows=1100 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_114] (rows=550 width=10) + Output:["_col0","_col1"] + Map Join Operator [MAPJOIN_170] (rows=550 width=10) + HybridGraceHashJoin:true,Output:["_col2","_col5"],keys:{"MAPJOIN_169":"_col2","RS_112":"_col0"} + <-Map 31 [BROADCAST_EDGE] + BROADCAST [RS_112] + PartitionCols:_col0 + Select Operator [SEL_107] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_164] (rows=500 width=10) + predicate:key is not null + TableScan [TS_105] (rows=500 width=10) + default@src,y,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map Join Operator [MAPJOIN_169] (rows=484 width=10) + HybridGraceHashJoin:true,Output:["_col2"],keys:{"SEL_101":"_col1","RS_109":"_col1"} + <-Map 30 [BROADCAST_EDGE] + BROADCAST [RS_109] + PartitionCols:_col1 + Select Operator [SEL_104] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_163] (rows=25 width=7) + predicate:(key is not null and value is not null) + TableScan [TS_102] (rows=25 width=7) + default@src1,x,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Select Operator [SEL_101] (rows=440 width=10) + Output:["_col1"] + Group By Operator [GBY_100] (rows=440 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 25 [SIMPLE_EDGE] + <-Map 29 [CONTAINS] + Reduce Output Operator [RS_99] + PartitionCols:_col0, _col1 + Group By Operator [GBY_98] (rows=881 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_94] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_162] (rows=500 width=10) + predicate:value is not null + TableScan [TS_92] (rows=500 width=10) + Output:["key","value"] + <-Reducer 24 [CONTAINS] + Reduce Output Operator [RS_99] + PartitionCols:_col0, _col1 + Group By Operator [GBY_98] (rows=881 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Group By Operator [GBY_90] (rows=381 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 23 [SIMPLE_EDGE] + <-Map 28 [CONTAINS] + Reduce Output Operator [RS_89] + PartitionCols:_col0, _col1 + Group By Operator [GBY_88] (rows=762 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_84] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_161] (rows=500 width=10) + predicate:value is not null + TableScan [TS_82] (rows=500 width=10) + Output:["key","value"] + <-Reducer 22 [CONTAINS] + Reduce Output Operator [RS_89] + PartitionCols:_col0, _col1 + Group By Operator [GBY_88] (rows=762 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Group By Operator [GBY_80] (rows=262 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 21 [SIMPLE_EDGE] + <-Map 20 [CONTAINS] + Reduce Output Operator [RS_79] + PartitionCols:_col0, _col1 + Group By Operator [GBY_78] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_71] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_159] (rows=25 width=7) + predicate:value is not null + TableScan [TS_69] (rows=25 width=7) + Output:["key","value"] + <-Map 27 [CONTAINS] + Reduce Output Operator [RS_79] + PartitionCols:_col0, _col1 + Group By Operator [GBY_78] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_74] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_160] (rows=500 width=10) + predicate:value is not null + TableScan [TS_72] (rows=500 width=10) + Output:["key","value"] + <-Reducer 5 [CONTAINS] + Reduce Output Operator [RS_119] + PartitionCols:_col0, _col1 + Group By Operator [GBY_118] (rows=1100 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Group By Operator [GBY_67] (rows=550 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 4 [SIMPLE_EDGE] + <-Reducer 15 [CONTAINS] + Reduce Output Operator [RS_66] + PartitionCols:_col0, _col1 + Group By Operator [GBY_65] (rows=1100 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_61] (rows=550 width=10) + Output:["_col0","_col1"] + Map Join Operator [MAPJOIN_168] (rows=550 width=10) + HybridGraceHashJoin:true,Output:["_col2","_col5"],keys:{"MAPJOIN_167":"_col2","RS_59":"_col0"} + <-Map 19 [BROADCAST_EDGE] + BROADCAST [RS_59] + PartitionCols:_col0 + Select Operator [SEL_54] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_158] (rows=500 width=10) + predicate:key is not null + TableScan [TS_52] (rows=500 width=10) + default@src,y,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map Join Operator [MAPJOIN_167] (rows=419 width=10) + HybridGraceHashJoin:true,Output:["_col2"],keys:{"SEL_48":"_col1","RS_56":"_col1"} + <-Map 18 [BROADCAST_EDGE] + BROADCAST [RS_56] + PartitionCols:_col1 + Select Operator [SEL_51] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_157] (rows=25 width=7) + predicate:(key is not null and value is not null) + TableScan [TS_49] (rows=25 width=7) + default@src1,x,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Select Operator [SEL_48] (rows=381 width=10) + Output:["_col1"] + Group By Operator [GBY_47] (rows=381 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 14 [SIMPLE_EDGE] + <-Map 17 [CONTAINS] + Reduce Output Operator [RS_46] + PartitionCols:_col0, _col1 + Group By Operator [GBY_45] (rows=762 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_41] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_156] (rows=500 width=10) + predicate:value is not null + TableScan [TS_39] (rows=500 width=10) + Output:["key","value"] + <-Reducer 13 [CONTAINS] + Reduce Output Operator [RS_46] + PartitionCols:_col0, _col1 + Group By Operator [GBY_45] (rows=762 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Group By Operator [GBY_37] (rows=262 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 12 [SIMPLE_EDGE] + <-Map 11 [CONTAINS] + Reduce Output Operator [RS_36] + PartitionCols:_col0, _col1 + Group By Operator [GBY_35] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_28] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_154] (rows=25 width=7) + predicate:value is not null + TableScan [TS_26] (rows=25 width=7) + Output:["key","value"] + <-Map 16 [CONTAINS] + Reduce Output Operator [RS_36] + PartitionCols:_col0, _col1 + Group By Operator [GBY_35] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_31] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_155] (rows=500 width=10) + predicate:value is not null + TableScan [TS_29] (rows=500 width=10) + Output:["key","value"] + <-Reducer 3 [CONTAINS] + Reduce Output Operator [RS_66] + PartitionCols:_col0, _col1 + Group By Operator [GBY_65] (rows=1100 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_25] (rows=550 width=10) + Output:["_col0","_col1"] + Map Join Operator [MAPJOIN_166] (rows=550 width=10) + HybridGraceHashJoin:true,Output:["_col2","_col5"],keys:{"MAPJOIN_165":"_col2","RS_23":"_col0"} + <-Map 10 [BROADCAST_EDGE] + BROADCAST [RS_23] + PartitionCols:_col0 + Select Operator [SEL_18] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_153] (rows=500 width=10) + predicate:key is not null + TableScan [TS_16] (rows=500 width=10) + default@src,y,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map Join Operator [MAPJOIN_165] (rows=288 width=10) + HybridGraceHashJoin:true,Output:["_col2"],keys:{"SEL_12":"_col1","RS_20":"_col1"} + <-Map 9 [BROADCAST_EDGE] + BROADCAST [RS_20] + PartitionCols:_col1 + Select Operator [SEL_15] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_152] (rows=25 width=7) + predicate:(key is not null and value is not null) + TableScan [TS_13] (rows=25 width=7) + default@src1,x,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Select Operator [SEL_12] (rows=262 width=10) + Output:["_col1"] + Group By Operator [GBY_11] (rows=262 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 2 [SIMPLE_EDGE] + <-Map 1 [CONTAINS] + Reduce Output Operator [RS_10] + PartitionCols:_col0, _col1 + Group By Operator [GBY_9] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_2] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_150] (rows=25 width=7) + predicate:value is not null + TableScan [TS_0] (rows=25 width=7) + Output:["key","value"] + <-Map 8 [CONTAINS] + Reduce Output Operator [RS_10] + PartitionCols:_col0, _col1 + Group By Operator [GBY_9] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_5] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_151] (rows=500 width=10) + predicate:value is not null + TableScan [TS_3] (rows=500 width=10) + Output:["key","value"] PREHOOK: query: CREATE TABLE srcbucket_mapjoin(key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE PREHOOK: type: CREATETABLE @@ -2607,38 +1715,26 @@ POSTHOOK: type: QUERY Plan optimized by CBO. Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Map 1 - File Output Operator [FS_10] - compressed:false - Statistics:Num rows: 266 Data size: 2822 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Merge Join Operator [MERGEJOIN_15] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 266 Data size: 2822 Basic stats: COMPLETE Column stats: NONE - | - |<-Select Operator [SEL_5] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_14] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_3] - | alias:s1 - | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - |<-Select Operator [SEL_2] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_13] - predicate:key is not null (type: boolean) - Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_0] - alias:s1 - Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Map 1 + File Output Operator [FS_10] + Merge Join Operator [MERGEJOIN_15] (rows=266 width=10) + Output:["_col0","_col1"],keys:{"0":"_col0","1":"_col0"} + + <-Select Operator [SEL_5] (rows=242 width=10) + Output:["_col0"] + Filter Operator [FIL_14] (rows=242 width=10) + predicate:key is not null + TableScan [TS_3] (rows=242 width=10) + default@tab,s1,Tbl:COMPLETE,Col:NONE,Output:["key"] + <-Select Operator [SEL_2] (rows=242 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_13] (rows=242 width=10) + predicate:key is not null + TableScan [TS_0] (rows=242 width=10) + default@tab,s1,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: explain select s1.key as key, s1.value as value from tab s1 join tab s3 on s1.key=s3.key join tab s2 on s1.value=s2.value @@ -2652,65 +1748,40 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_16] - compressed:false - Statistics:Num rows: 292 Data size: 3104 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Merge Join Operator [MERGEJOIN_27] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: string)","1":"_col1 (type: string)"} - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 292 Data size: 3104 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_12] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 266 Data size: 2822 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: int) - | Merge Join Operator [MERGEJOIN_25] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 266 Data size: 2822 Basic stats: COMPLETE Column stats: NONE - | | - | |<-Select Operator [SEL_5] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_23] - | | predicate:key is not null (type: boolean) - | | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_3] - | | alias:s1 - | | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | |<-Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_22] - | predicate:(key is not null and value is not null) (type: boolean) - | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:s1 - | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - |<-Map 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_13] - key expressions:_col1 (type: string) - Map-reduce partition columns:_col1 (type: string) - sort order:+ - Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_8] - outputColumnNames:["_col1"] - Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_24] - predicate:value is not null (type: boolean) - Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_6] - alias:s1 - Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_16] + Merge Join Operator [MERGEJOIN_27] (rows=292 width=10) + Output:["_col0","_col1"],keys:{"0":"_col1","1":"_col1"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_25] (rows=266 width=10) + Output:["_col0","_col1"],keys:{"0":"_col0","1":"_col0"} + + <-Select Operator [SEL_5] (rows=242 width=10) + Output:["_col0"] + Filter Operator [FIL_23] (rows=242 width=10) + predicate:key is not null + TableScan [TS_3] (rows=242 width=10) + default@tab,s1,Tbl:COMPLETE,Col:NONE,Output:["key"] + <-Select Operator [SEL_2] (rows=242 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_22] (rows=242 width=10) + predicate:(key is not null and value is not null) + TableScan [TS_0] (rows=242 width=10) + default@tab,s1,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map 4 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col1 + Select Operator [SEL_8] (rows=242 width=10) + Output:["_col1"] + Filter Operator [FIL_24] (rows=242 width=10) + predicate:value is not null + TableScan [TS_6] (rows=242 width=10) + default@tab,s1,Tbl:COMPLETE,Col:NONE,Output:["value"] PREHOOK: query: explain select s1.key as key, s1.value as value from tab s1 join tab2 s3 on s1.key=s3.key @@ -2721,38 +1792,26 @@ POSTHOOK: type: QUERY Plan optimized by CBO. Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Map 1 - File Output Operator [FS_10] - compressed:false - Statistics:Num rows: 266 Data size: 2822 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Merge Join Operator [MERGEJOIN_15] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 266 Data size: 2822 Basic stats: COMPLETE Column stats: NONE - | - |<-Select Operator [SEL_5] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_14] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_3] - | alias:s3 - | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - |<-Select Operator [SEL_2] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_13] - predicate:key is not null (type: boolean) - Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_0] - alias:s1 - Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Map 1 + File Output Operator [FS_10] + Merge Join Operator [MERGEJOIN_15] (rows=266 width=10) + Output:["_col0","_col1"],keys:{"0":"_col0","1":"_col0"} + + <-Select Operator [SEL_5] (rows=242 width=10) + Output:["_col0"] + Filter Operator [FIL_14] (rows=242 width=10) + predicate:key is not null + TableScan [TS_3] (rows=242 width=10) + default@tab2,s3,Tbl:COMPLETE,Col:NONE,Output:["key"] + <-Select Operator [SEL_2] (rows=242 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_13] (rows=242 width=10) + predicate:key is not null + TableScan [TS_0] (rows=242 width=10) + default@tab,s1,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: explain select s1.key as key, s1.value as value from tab s1 join tab2 s3 on s1.key=s3.key join tab2 s2 on s1.value=s2.value @@ -2766,65 +1825,40 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_16] - compressed:false - Statistics:Num rows: 292 Data size: 3104 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Merge Join Operator [MERGEJOIN_27] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: string)","1":"_col1 (type: string)"} - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 292 Data size: 3104 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_12] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 266 Data size: 2822 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: int) - | Merge Join Operator [MERGEJOIN_25] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 266 Data size: 2822 Basic stats: COMPLETE Column stats: NONE - | | - | |<-Select Operator [SEL_5] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_23] - | | predicate:key is not null (type: boolean) - | | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_3] - | | alias:s3 - | | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | |<-Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_22] - | predicate:(key is not null and value is not null) (type: boolean) - | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:s1 - | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - |<-Map 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_13] - key expressions:_col1 (type: string) - Map-reduce partition columns:_col1 (type: string) - sort order:+ - Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_8] - outputColumnNames:["_col1"] - Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_24] - predicate:value is not null (type: boolean) - Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_6] - alias:s3 - Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_16] + Merge Join Operator [MERGEJOIN_27] (rows=292 width=10) + Output:["_col0","_col1"],keys:{"0":"_col1","1":"_col1"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_25] (rows=266 width=10) + Output:["_col0","_col1"],keys:{"0":"_col0","1":"_col0"} + + <-Select Operator [SEL_5] (rows=242 width=10) + Output:["_col0"] + Filter Operator [FIL_23] (rows=242 width=10) + predicate:key is not null + TableScan [TS_3] (rows=242 width=10) + default@tab2,s3,Tbl:COMPLETE,Col:NONE,Output:["key"] + <-Select Operator [SEL_2] (rows=242 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_22] (rows=242 width=10) + predicate:(key is not null and value is not null) + TableScan [TS_0] (rows=242 width=10) + default@tab,s1,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map 4 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col1 + Select Operator [SEL_8] (rows=242 width=10) + Output:["_col1"] + Filter Operator [FIL_24] (rows=242 width=10) + predicate:value is not null + TableScan [TS_6] (rows=242 width=10) + default@tab2,s3,Tbl:COMPLETE,Col:NONE,Output:["value"] PREHOOK: query: explain select count(*) from (select s1.key as key, s1.value as value from tab s1 join tab s3 on s1.key=s3.key @@ -2847,92 +1881,56 @@ Reducer 3 <- Map 7 (SIMPLE_EDGE), Union 2 (SIMPLE_EDGE) Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 4 - File Output Operator [FS_26] - compressed:false - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_24] - | aggregations:["count(VALUE._col0)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_23] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: bigint) - Group By Operator [GBY_22] - aggregations:["count()"] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_39] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | Statistics:Num rows: 558 Data size: 5926 Basic stats: COMPLETE Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_17] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_36] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_15] - | alias:b - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Union 2 [SIMPLE_EDGE] - |<-Map 1 [CONTAINS] - | Reduce Output Operator [RS_18] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 508 Data size: 5388 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_37] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 266 Data size: 2822 Basic stats: COMPLETE Column stats: NONE - | | - | |<-Select Operator [SEL_5] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_34] - | | predicate:key is not null (type: boolean) - | | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_3] - | | alias:s1 - | | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | |<-Select Operator [SEL_2] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_33] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:s1 - | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - |<-Map 6 [CONTAINS] - Reduce Output Operator [RS_18] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 508 Data size: 5388 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_12] - outputColumnNames:["_col0"] - Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_35] - predicate:key is not null (type: boolean) - Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_10] - alias:s1 - Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 4 + File Output Operator [FS_26] + Group By Operator [GBY_24] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_23] + Group By Operator [GBY_22] (rows=1 width=8) + Output:["_col0"],aggregations:["count()"] + Merge Join Operator [MERGEJOIN_39] (rows=558 width=10) + keys:{"0":"_col0","1":"_col0"} + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col0 + Select Operator [SEL_17] (rows=500 width=10) + Output:["_col0"] + Filter Operator [FIL_36] (rows=500 width=10) + predicate:key is not null + TableScan [TS_15] (rows=500 width=10) + default@tab_part,b,Tbl:COMPLETE,Col:NONE,Output:["key"] + <-Union 2 [SIMPLE_EDGE] + <-Map 1 [CONTAINS] + Reduce Output Operator [RS_18] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_37] (rows=266 width=10) + Output:["_col0"],keys:{"0":"_col0","1":"_col0"} + + <-Select Operator [SEL_5] (rows=242 width=10) + Output:["_col0"] + Filter Operator [FIL_34] (rows=242 width=10) + predicate:key is not null + TableScan [TS_3] (rows=242 width=10) + default@tab,s1,Tbl:COMPLETE,Col:NONE,Output:["key"] + <-Select Operator [SEL_2] (rows=242 width=10) + Output:["_col0"] + Filter Operator [FIL_33] (rows=242 width=10) + predicate:key is not null + TableScan [TS_0] (rows=242 width=10) + Output:["key"] + <-Map 6 [CONTAINS] + Reduce Output Operator [RS_18] + PartitionCols:_col0 + Select Operator [SEL_12] (rows=242 width=10) + Output:["_col0"] + Filter Operator [FIL_35] (rows=242 width=10) + predicate:key is not null + TableScan [TS_10] (rows=242 width=10) + Output:["key"] PREHOOK: query: explain select count(*) from (select s1.key as key, s1.value as value from tab s1 join tab s3 on s1.key=s3.key join tab s2 on s1.value=s2.value @@ -2955,119 +1953,70 @@ Reducer 4 <- Map 9 (SIMPLE_EDGE), Union 3 (SIMPLE_EDGE) Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 5 - File Output Operator [FS_32] - compressed:false - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_30] - | aggregations:["count(VALUE._col0)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_29] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - value expressions:_col0 (type: bigint) - Group By Operator [GBY_28] - aggregations:["count()"] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_51] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | Statistics:Num rows: 587 Data size: 6237 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [SIMPLE_EDGE] - | Reduce Output Operator [RS_25] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_23] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_47] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_21] - | alias:b - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Union 3 [SIMPLE_EDGE] - |<-Map 8 [CONTAINS] - | Reduce Output Operator [RS_24] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 534 Data size: 5670 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_18] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_46] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_16] - | alias:s1 - | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [CONTAINS] - Reduce Output Operator [RS_24] - key expressions:_col0 (type: int) - Map-reduce partition columns:_col0 (type: int) - sort order:+ - Statistics:Num rows: 534 Data size: 5670 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_50] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: string)","1":"_col1 (type: string)"} - | outputColumnNames:["_col0"] - | Statistics:Num rows: 292 Data size: 3104 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_12] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 266 Data size: 2822 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: int) - | Merge Join Operator [MERGEJOIN_48] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: int)","1":"_col0 (type: int)"} - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 266 Data size: 2822 Basic stats: COMPLETE Column stats: NONE - | | - | |<-Select Operator [SEL_5] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_44] - | | predicate:key is not null (type: boolean) - | | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_3] - | | alias:s1 - | | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | |<-Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_43] - | predicate:(key is not null and value is not null) (type: boolean) - | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:s1 - | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - Reduce Output Operator [RS_13] - key expressions:_col1 (type: string) - Map-reduce partition columns:_col1 (type: string) - sort order:+ - Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_8] - outputColumnNames:["_col1"] - Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_45] - predicate:value is not null (type: boolean) - Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_6] - alias:s1 - Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 5 + File Output Operator [FS_32] + Group By Operator [GBY_30] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_29] + Group By Operator [GBY_28] (rows=1 width=8) + Output:["_col0"],aggregations:["count()"] + Merge Join Operator [MERGEJOIN_51] (rows=587 width=10) + keys:{"0":"_col0","1":"_col0"} + <-Map 9 [SIMPLE_EDGE] + SHUFFLE [RS_25] + PartitionCols:_col0 + Select Operator [SEL_23] (rows=500 width=10) + Output:["_col0"] + Filter Operator [FIL_47] (rows=500 width=10) + predicate:key is not null + TableScan [TS_21] (rows=500 width=10) + default@tab_part,b,Tbl:COMPLETE,Col:NONE,Output:["key"] + <-Union 3 [SIMPLE_EDGE] + <-Map 8 [CONTAINS] + Reduce Output Operator [RS_24] + PartitionCols:_col0 + Select Operator [SEL_18] (rows=242 width=10) + Output:["_col0"] + Filter Operator [FIL_46] (rows=242 width=10) + predicate:key is not null + TableScan [TS_16] (rows=242 width=10) + Output:["key"] + <-Reducer 2 [CONTAINS] + Reduce Output Operator [RS_24] + PartitionCols:_col0 + Merge Join Operator [MERGEJOIN_50] (rows=292 width=10) + Output:["_col0"],keys:{"0":"_col1","1":"_col1"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_12] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_48] (rows=266 width=10) + Output:["_col0","_col1"],keys:{"0":"_col0","1":"_col0"} + + <-Select Operator [SEL_5] (rows=242 width=10) + Output:["_col0"] + Filter Operator [FIL_44] (rows=242 width=10) + predicate:key is not null + TableScan [TS_3] (rows=242 width=10) + default@tab,s1,Tbl:COMPLETE,Col:NONE,Output:["key"] + <-Select Operator [SEL_2] (rows=242 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_43] (rows=242 width=10) + predicate:(key is not null and value is not null) + TableScan [TS_0] (rows=242 width=10) + default@tab,s1,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map 7 [SIMPLE_EDGE] + SHUFFLE [RS_13] + PartitionCols:_col1 + Select Operator [SEL_8] (rows=242 width=10) + Output:["_col1"] + Filter Operator [FIL_45] (rows=242 width=10) + predicate:value is not null + TableScan [TS_6] (rows=242 width=10) + default@tab,s1,Tbl:COMPLETE,Col:NONE,Output:["value"] PREHOOK: query: explain SELECT x.key, y.value @@ -3095,380 +2044,499 @@ SELECT x.key, y.value FROM src1 x JOIN src1 y ON (x.key = y.key) JOIN (select key, value from src1 union all select key, value from src union all select key, value from src union all select key, value from src)z ON (x.value = z.value) POSTHOOK: type: QUERY -Plan optimized by CBO. +STAGE DEPENDENCIES: + Stage-1 is a root stage + Stage-0 depends on stages: Stage-1 -Vertex dependency in root stage -Map 1 <- Map 6 (BROADCAST_EDGE), Union 2 (CONTAINS) -Map 12 <- Union 9 (CONTAINS) -Map 13 <- Union 9 (CONTAINS) -Map 16 <- Map 17 (BROADCAST_EDGE) -Map 18 <- Map 16 (BROADCAST_EDGE), Union 4 (CONTAINS) -Map 19 <- Map 16 (BROADCAST_EDGE), Union 4 (CONTAINS) -Map 20 <- Map 16 (BROADCAST_EDGE), Union 4 (CONTAINS) -Map 21 <- Map 16 (BROADCAST_EDGE), Union 4 (CONTAINS) -Map 5 <- Map 6 (BROADCAST_EDGE), Union 2 (CONTAINS) -Map 8 <- Union 9 (CONTAINS) -Reducer 10 <- Map 14 (SIMPLE_EDGE), Union 9 (SIMPLE_EDGE) -Reducer 11 <- Map 15 (SIMPLE_EDGE), Reducer 10 (SIMPLE_EDGE), Union 4 (CONTAINS) -Reducer 3 <- Map 7 (SIMPLE_EDGE), Union 2 (SIMPLE_EDGE), Union 4 (CONTAINS) +STAGE PLANS: + Stage: Stage-1 + Tez + Edges: + Map 1 <- Map 6 (BROADCAST_EDGE), Union 2 (CONTAINS) + Map 12 <- Union 9 (CONTAINS) + Map 13 <- Union 9 (CONTAINS) + Map 16 <- Map 17 (BROADCAST_EDGE) + Map 18 <- Map 16 (BROADCAST_EDGE), Union 4 (CONTAINS) + Map 19 <- Map 16 (BROADCAST_EDGE), Union 4 (CONTAINS) + Map 20 <- Map 16 (BROADCAST_EDGE), Union 4 (CONTAINS) + Map 21 <- Map 16 (BROADCAST_EDGE), Union 4 (CONTAINS) + Map 5 <- Map 6 (BROADCAST_EDGE), Union 2 (CONTAINS) + Map 8 <- Union 9 (CONTAINS) + Reducer 10 <- Map 14 (SIMPLE_EDGE), Union 9 (SIMPLE_EDGE) + Reducer 11 <- Map 15 (SIMPLE_EDGE), Reducer 10 (SIMPLE_EDGE), Union 4 (CONTAINS) + Reducer 3 <- Map 7 (SIMPLE_EDGE), Union 2 (SIMPLE_EDGE), Union 4 (CONTAINS) +#### A masked pattern was here #### + Vertices: + Map 1 + Map Operator Tree: + TableScan + alias: x + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: value is not null (type: boolean) + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + predicate: value is not null + Select Operator + expressions: value (type: string) + outputColumnNames: _col0 + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + Map Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 _col0 (type: string) + 1 _col1 (type: string) + outputColumnNames: _col1 + input vertices: + 1 Map 6 + Statistics: Num rows: 577 Data size: 6053 Basic stats: COMPLETE Column stats: NONE + HybridGraceHashJoin: true + Reduce Output Operator + key expressions: _col1 (type: string) + sort order: + + Map-reduce partition columns: _col1 (type: string) + Statistics: Num rows: 577 Data size: 6053 Basic stats: COMPLETE Column stats: NONE + Map 12 + Map Operator Tree: + TableScan + alias: y + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: value is not null (type: boolean) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + predicate: value is not null + Select Operator + expressions: value (type: string) + outputColumnNames: _col0 + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Reduce Output Operator + key expressions: _col0 (type: string) + sort order: + + Map-reduce partition columns: _col0 (type: string) + Statistics: Num rows: 1025 Data size: 10815 Basic stats: COMPLETE Column stats: NONE + Map 13 + Map Operator Tree: + TableScan + alias: y + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: value is not null (type: boolean) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + predicate: value is not null + Select Operator + expressions: value (type: string) + outputColumnNames: _col0 + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Reduce Output Operator + key expressions: _col0 (type: string) + sort order: + + Map-reduce partition columns: _col0 (type: string) + Statistics: Num rows: 1025 Data size: 10815 Basic stats: COMPLETE Column stats: NONE + Map 14 + Map Operator Tree: + TableScan + alias: y + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: (key is not null and value is not null) (type: boolean) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + predicate: (key is not null and value is not null) + Select Operator + expressions: key (type: string), value (type: string) + outputColumnNames: _col0, _col1 + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Reduce Output Operator + key expressions: _col1 (type: string) + sort order: + + Map-reduce partition columns: _col1 (type: string) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + value expressions: _col0 (type: string) + Map 15 + Map Operator Tree: + TableScan + alias: y + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: key is not null (type: boolean) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + predicate: key is not null + Select Operator + expressions: key (type: string), value (type: string) + outputColumnNames: _col0, _col1 + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Reduce Output Operator + key expressions: _col0 (type: string) + sort order: + + Map-reduce partition columns: _col0 (type: string) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + value expressions: _col1 (type: string) + Map 16 + Map Operator Tree: + TableScan + alias: x + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: (key is not null and value is not null) (type: boolean) + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + predicate: (key is not null and value is not null) + Select Operator + expressions: key (type: string), value (type: string) + outputColumnNames: _col0, _col1 + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + Map Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 _col0 (type: string) + 1 _col0 (type: string) + outputColumnNames: _col0, _col1, _col3 + input vertices: + 1 Map 17 + Statistics: Num rows: 27 Data size: 210 Basic stats: COMPLETE Column stats: NONE + HybridGraceHashJoin: true + Reduce Output Operator + key expressions: _col1 (type: string) + sort order: + + Map-reduce partition columns: _col1 (type: string) + Statistics: Num rows: 27 Data size: 210 Basic stats: COMPLETE Column stats: NONE + value expressions: _col0 (type: string), _col3 (type: string) + Reduce Output Operator + key expressions: _col1 (type: string) + sort order: + + Map-reduce partition columns: _col1 (type: string) + Statistics: Num rows: 27 Data size: 210 Basic stats: COMPLETE Column stats: NONE + value expressions: _col0 (type: string), _col3 (type: string) + Reduce Output Operator + key expressions: _col1 (type: string) + sort order: + + Map-reduce partition columns: _col1 (type: string) + Statistics: Num rows: 27 Data size: 210 Basic stats: COMPLETE Column stats: NONE + value expressions: _col0 (type: string), _col3 (type: string) + Reduce Output Operator + key expressions: _col1 (type: string) + sort order: + + Map-reduce partition columns: _col1 (type: string) + Statistics: Num rows: 27 Data size: 210 Basic stats: COMPLETE Column stats: NONE + value expressions: _col0 (type: string), _col3 (type: string) + Map 17 + Map Operator Tree: + TableScan + alias: x + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: key is not null (type: boolean) + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + predicate: key is not null + Select Operator + expressions: key (type: string), value (type: string) + outputColumnNames: _col0, _col1 + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + Reduce Output Operator + key expressions: _col0 (type: string) + sort order: + + Map-reduce partition columns: _col0 (type: string) + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + value expressions: _col1 (type: string) + Map 18 + Map Operator Tree: + TableScan + alias: x + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: value is not null (type: boolean) + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + predicate: value is not null + Select Operator + expressions: value (type: string) + outputColumnNames: _col0 + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + Map Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 _col1 (type: string) + 1 _col0 (type: string) + outputColumnNames: _col0, _col3 + input vertices: + 0 Map 16 + Statistics: Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE + HybridGraceHashJoin: true + Select Operator + expressions: _col0 (type: string), _col3 (type: string) + outputColumnNames: _col0, _col1 + Statistics: Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE + File Output Operator + compressed: false + Statistics: Num rows: 3550 Data size: 37482 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + Map 19 + Map Operator Tree: + TableScan + alias: y + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: value is not null (type: boolean) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + predicate: value is not null + Select Operator + expressions: value (type: string) + outputColumnNames: _col0 + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Map Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 _col1 (type: string) + 1 _col0 (type: string) + outputColumnNames: _col0, _col3 + input vertices: + 0 Map 16 + Statistics: Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE + HybridGraceHashJoin: true + Select Operator + expressions: _col0 (type: string), _col3 (type: string) + outputColumnNames: _col0, _col1 + Statistics: Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE + File Output Operator + compressed: false + Statistics: Num rows: 3550 Data size: 37482 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + Map 20 + Map Operator Tree: + TableScan + alias: y + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: value is not null (type: boolean) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + predicate: value is not null + Select Operator + expressions: value (type: string) + outputColumnNames: _col0 + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Map Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 _col1 (type: string) + 1 _col0 (type: string) + outputColumnNames: _col0, _col3 + input vertices: + 0 Map 16 + Statistics: Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE + HybridGraceHashJoin: true + Select Operator + expressions: _col0 (type: string), _col3 (type: string) + outputColumnNames: _col0, _col1 + Statistics: Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE + File Output Operator + compressed: false + Statistics: Num rows: 3550 Data size: 37482 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + Map 21 + Map Operator Tree: + TableScan + alias: y + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: value is not null (type: boolean) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + predicate: value is not null + Select Operator + expressions: value (type: string) + outputColumnNames: _col0 + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Map Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 _col1 (type: string) + 1 _col0 (type: string) + outputColumnNames: _col0, _col3 + input vertices: + 0 Map 16 + Statistics: Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE + HybridGraceHashJoin: true + Select Operator + expressions: _col0 (type: string), _col3 (type: string) + outputColumnNames: _col0, _col1 + Statistics: Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE + File Output Operator + compressed: false + Statistics: Num rows: 3550 Data size: 37482 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + Map 5 + Map Operator Tree: + TableScan + alias: y + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: value is not null (type: boolean) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + predicate: value is not null + Select Operator + expressions: value (type: string) + outputColumnNames: _col0 + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Map Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 _col0 (type: string) + 1 _col1 (type: string) + outputColumnNames: _col1 + input vertices: + 1 Map 6 + Statistics: Num rows: 577 Data size: 6053 Basic stats: COMPLETE Column stats: NONE + HybridGraceHashJoin: true + Reduce Output Operator + key expressions: _col1 (type: string) + sort order: + + Map-reduce partition columns: _col1 (type: string) + Statistics: Num rows: 577 Data size: 6053 Basic stats: COMPLETE Column stats: NONE + Map 6 + Map Operator Tree: + TableScan + alias: x + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: (key is not null and value is not null) (type: boolean) + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + predicate: (key is not null and value is not null) + Select Operator + expressions: key (type: string), value (type: string) + outputColumnNames: _col0, _col1 + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + Reduce Output Operator + key expressions: _col1 (type: string) + sort order: + + Map-reduce partition columns: _col1 (type: string) + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + value expressions: _col0 (type: string) + Reduce Output Operator + key expressions: _col1 (type: string) + sort order: + + Map-reduce partition columns: _col1 (type: string) + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + value expressions: _col0 (type: string) + Map 7 + Map Operator Tree: + TableScan + alias: y + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: key is not null (type: boolean) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + predicate: key is not null + Select Operator + expressions: key (type: string), value (type: string) + outputColumnNames: _col0, _col1 + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Reduce Output Operator + key expressions: _col0 (type: string) + sort order: + + Map-reduce partition columns: _col0 (type: string) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + value expressions: _col1 (type: string) + Map 8 + Map Operator Tree: + TableScan + alias: x + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: value is not null (type: boolean) + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + predicate: value is not null + Select Operator + expressions: value (type: string) + outputColumnNames: _col0 + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + Reduce Output Operator + key expressions: _col0 (type: string) + sort order: + + Map-reduce partition columns: _col0 (type: string) + Statistics: Num rows: 1025 Data size: 10815 Basic stats: COMPLETE Column stats: NONE + Reducer 10 + Reduce Operator Tree: + Merge Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 _col0 (type: string) + 1 _col1 (type: string) + outputColumnNames: _col1 + Statistics: Num rows: 1127 Data size: 11896 Basic stats: COMPLETE Column stats: NONE + Reduce Output Operator + key expressions: _col1 (type: string) + sort order: + + Map-reduce partition columns: _col1 (type: string) + Statistics: Num rows: 1127 Data size: 11896 Basic stats: COMPLETE Column stats: NONE + Reducer 11 + Reduce Operator Tree: + Merge Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 _col1 (type: string) + 1 _col0 (type: string) + outputColumnNames: _col1, _col4 + Statistics: Num rows: 1239 Data size: 13085 Basic stats: COMPLETE Column stats: NONE + Select Operator + expressions: _col1 (type: string), _col4 (type: string) + outputColumnNames: _col0, _col1 + Statistics: Num rows: 1239 Data size: 13085 Basic stats: COMPLETE Column stats: NONE + File Output Operator + compressed: false + Statistics: Num rows: 3550 Data size: 37482 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + Reducer 3 + Reduce Operator Tree: + Merge Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 _col1 (type: string) + 1 _col0 (type: string) + outputColumnNames: _col1, _col4 + Statistics: Num rows: 634 Data size: 6658 Basic stats: COMPLETE Column stats: NONE + Select Operator + expressions: _col1 (type: string), _col4 (type: string) + outputColumnNames: _col0, _col1 + Statistics: Num rows: 634 Data size: 6658 Basic stats: COMPLETE Column stats: NONE + File Output Operator + compressed: false + Statistics: Num rows: 3550 Data size: 37482 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + Union 2 + Vertex: Union 2 + Union 4 + Vertex: Union 4 + Union 9 + Vertex: Union 9 -Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Union 4 - |<-Map 18 [CONTAINS] - | File Output Operator [FS_78] - | compressed:false - | Statistics:Num rows: 3550 Data size: 37482 Basic stats: COMPLETE Column stats: NONE - | table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - | Select Operator [SEL_76] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE - | Map Join Operator [MAPJOIN_123] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | HybridGraceHashJoin:true - | | keys:{"Map 16":"_col1 (type: string)","Map 18":"_col0 (type: string)"} - | | outputColumnNames:["_col0","_col3"] - | | Statistics:Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE - | |<-Map 16 [BROADCAST_EDGE] - | | Reduce Output Operator [RS_73] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 27 Data size: 210 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: string), _col3 (type: string) - | | Map Join Operator [MAPJOIN_122] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | HybridGraceHashJoin:true - | | | keys:{"Map 16":"_col0 (type: string)","Map 17":"_col0 (type: string)"} - | | | outputColumnNames:["_col0","_col1","_col3"] - | | | Statistics:Num rows: 27 Data size: 210 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 17 [BROADCAST_EDGE] - | | | Reduce Output Operator [RS_71] - | | | key expressions:_col0 (type: string) - | | | Map-reduce partition columns:_col0 (type: string) - | | | sort order:+ - | | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col1 (type: string) - | | | Select Operator [SEL_53] - | | | outputColumnNames:["_col0","_col1"] - | | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_113] - | | | predicate:key is not null (type: boolean) - | | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_51] - | | | alias:x - | | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | |<-Select Operator [SEL_50] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_112] - | | predicate:(key is not null and value is not null) (type: boolean) - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_48] - | | alias:x - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | Reduce Output Operator [RS_128] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 27 Data size: 210 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: string), _col3 (type: string) - | | Please refer to the previous Map Join Operator [MAPJOIN_122] - | | Reduce Output Operator [RS_129] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 27 Data size: 210 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: string), _col3 (type: string) - | | Please refer to the previous Map Join Operator [MAPJOIN_122] - | | Reduce Output Operator [RS_130] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 27 Data size: 210 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: string), _col3 (type: string) - | | Please refer to the previous Map Join Operator [MAPJOIN_122] - | |<-Select Operator [SEL_56] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_114] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_54] - | alias:x - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - |<-Map 19 [CONTAINS] - | File Output Operator [FS_78] - | compressed:false - | Statistics:Num rows: 3550 Data size: 37482 Basic stats: COMPLETE Column stats: NONE - | table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - | Select Operator [SEL_76] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE - | Map Join Operator [MAPJOIN_123] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | HybridGraceHashJoin:true - | | keys:{"Map 16":"_col1 (type: string)","Map 19":"_col0 (type: string)"} - | | outputColumnNames:["_col0","_col3"] - | | Statistics:Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE - | |<- Please refer to the previous Map 16 [BROADCAST_EDGE] - | |<-Select Operator [SEL_59] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_115] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_57] - | alias:y - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Map 20 [CONTAINS] - | File Output Operator [FS_78] - | compressed:false - | Statistics:Num rows: 3550 Data size: 37482 Basic stats: COMPLETE Column stats: NONE - | table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - | Select Operator [SEL_76] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE - | Map Join Operator [MAPJOIN_123] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | HybridGraceHashJoin:true - | | keys:{"Map 16":"_col1 (type: string)","Map 20":"_col0 (type: string)"} - | | outputColumnNames:["_col0","_col3"] - | | Statistics:Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE - | |<- Please refer to the previous Map 16 [BROADCAST_EDGE] - | |<-Select Operator [SEL_64] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_116] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_62] - | alias:y - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Map 21 [CONTAINS] - | File Output Operator [FS_78] - | compressed:false - | Statistics:Num rows: 3550 Data size: 37482 Basic stats: COMPLETE Column stats: NONE - | table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - | Select Operator [SEL_76] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE - | Map Join Operator [MAPJOIN_123] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | HybridGraceHashJoin:true - | | keys:{"Map 16":"_col1 (type: string)","Map 21":"_col0 (type: string)"} - | | outputColumnNames:["_col0","_col3"] - | | Statistics:Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE - | |<- Please refer to the previous Map 16 [BROADCAST_EDGE] - | |<-Select Operator [SEL_68] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_117] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_66] - | alias:y - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 11 [CONTAINS] - | File Output Operator [FS_78] - | compressed:false - | Statistics:Num rows: 3550 Data size: 37482 Basic stats: COMPLETE Column stats: NONE - | table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - | Select Operator [SEL_45] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1239 Data size: 13085 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_121] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: string)","1":"_col0 (type: string)"} - | | outputColumnNames:["_col1","_col4"] - | | Statistics:Num rows: 1239 Data size: 13085 Basic stats: COMPLETE Column stats: NONE - | |<-Map 15 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_43] - | | key expressions:_col0 (type: string) - | | Map-reduce partition columns:_col0 (type: string) - | | sort order:+ - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: string) - | | Select Operator [SEL_38] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_111] - | | predicate:key is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_36] - | | alias:y - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 10 [SIMPLE_EDGE] - | Reduce Output Operator [RS_42] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 1127 Data size: 11896 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_120] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col0 (type: string)","1":"_col1 (type: string)"} - | | outputColumnNames:["_col1"] - | | Statistics:Num rows: 1127 Data size: 11896 Basic stats: COMPLETE Column stats: NONE - | |<-Map 14 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_40] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: string) - | | Select Operator [SEL_35] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_110] - | | predicate:(key is not null and value is not null) (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_33] - | | alias:y - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Union 9 [SIMPLE_EDGE] - | |<-Map 12 [CONTAINS] - | | Reduce Output Operator [RS_39] - | | key expressions:_col0 (type: string) - | | Map-reduce partition columns:_col0 (type: string) - | | sort order:+ - | | Statistics:Num rows: 1025 Data size: 10815 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_26] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_108] - | | predicate:value is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_24] - | | alias:y - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Map 13 [CONTAINS] - | | Reduce Output Operator [RS_39] - | | key expressions:_col0 (type: string) - | | Map-reduce partition columns:_col0 (type: string) - | | sort order:+ - | | Statistics:Num rows: 1025 Data size: 10815 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_31] - | | outputColumnNames:["_col0"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_109] - | | predicate:value is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_29] - | | alias:y - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Map 8 [CONTAINS] - | Reduce Output Operator [RS_39] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 1025 Data size: 10815 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_23] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_107] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_21] - | alias:x - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [CONTAINS] - File Output Operator [FS_78] - compressed:false - Statistics:Num rows: 3550 Data size: 37482 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_20] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 634 Data size: 6658 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_119] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col1","_col4"] - | Statistics:Num rows: 634 Data size: 6658 Basic stats: COMPLETE Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - | Reduce Output Operator [RS_18] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_13] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_106] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_11] - | alias:y - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Union 2 [SIMPLE_EDGE] - |<-Map 1 [CONTAINS] - | Reduce Output Operator [RS_17] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 577 Data size: 6053 Basic stats: COMPLETE Column stats: NONE - | Map Join Operator [MAPJOIN_118] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | HybridGraceHashJoin:true - | | keys:{"Map 1":"_col0 (type: string)","Map 6":"_col1 (type: string)"} - | | outputColumnNames:["_col1"] - | | Statistics:Num rows: 577 Data size: 6053 Basic stats: COMPLETE Column stats: NONE - | |<-Map 6 [BROADCAST_EDGE] - | | Reduce Output Operator [RS_15] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: string) - | | Select Operator [SEL_10] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_105] - | | predicate:(key is not null and value is not null) (type: boolean) - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_8] - | | alias:x - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | Reduce Output Operator [RS_124] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: string) - | | Please refer to the previous Select Operator [SEL_10] - | |<-Select Operator [SEL_2] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_103] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:x - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - |<-Map 5 [CONTAINS] - Reduce Output Operator [RS_17] - key expressions:_col1 (type: string) - Map-reduce partition columns:_col1 (type: string) - sort order:+ - Statistics:Num rows: 577 Data size: 6053 Basic stats: COMPLETE Column stats: NONE - Map Join Operator [MAPJOIN_118] - | condition map:[{"":"Inner Join 0 to 1"}] - | HybridGraceHashJoin:true - | keys:{"Map 5":"_col0 (type: string)","Map 6":"_col1 (type: string)"} - | outputColumnNames:["_col1"] - | Statistics:Num rows: 577 Data size: 6053 Basic stats: COMPLETE Column stats: NONE - |<- Please refer to the previous Map 6 [BROADCAST_EDGE] - |<-Select Operator [SEL_5] - outputColumnNames:["_col0"] - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_104] - predicate:value is not null (type: boolean) - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:y - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Stage: Stage-0 + Fetch Operator + limit: -1 + Processor Tree: + ListSink PREHOOK: query: explain SELECT x.key, y.value @@ -3522,460 +2590,256 @@ Reducer 6 <- Union 5 (SIMPLE_EDGE), Union 7 (CONTAINS) Reducer 8 <- Union 7 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 8 - File Output Operator [FS_122] - compressed:false - Statistics:Num rows: 530 Data size: 5624 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_120] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 530 Data size: 5624 Basic stats: COMPLETE Column stats: NONE - |<-Union 7 [SIMPLE_EDGE] - |<-Reducer 31 [CONTAINS] - | Reduce Output Operator [RS_119] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 1061 Data size: 11260 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_118] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1061 Data size: 11260 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_114] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 484 Data size: 5131 Basic stats: COMPLETE Column stats: NONE - | Map Join Operator [MAPJOIN_167] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | HybridGraceHashJoin:true - | | keys:{"Map 23":"_col1 (type: string)","Reducer 31":"_col1 (type: string)"} - | | outputColumnNames:["_col0","_col3"] - | | Statistics:Num rows: 484 Data size: 5131 Basic stats: COMPLETE Column stats: NONE - | |<-Map 23 [BROADCAST_EDGE] - | | Reduce Output Operator [RS_111] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 27 Data size: 210 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: string), _col3 (type: string) - | | Map Join Operator [MAPJOIN_166] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | HybridGraceHashJoin:true - | | | keys:{"Map 23":"_col0 (type: string)","Map 24":"_col0 (type: string)"} - | | | outputColumnNames:["_col0","_col1","_col3"] - | | | Statistics:Num rows: 27 Data size: 210 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 24 [BROADCAST_EDGE] - | | | Reduce Output Operator [RS_109] - | | | key expressions:_col0 (type: string) - | | | Map-reduce partition columns:_col0 (type: string) - | | | sort order:+ - | | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:_col1 (type: string) - | | | Select Operator [SEL_74] - | | | outputColumnNames:["_col0","_col1"] - | | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_157] - | | | predicate:key is not null (type: boolean) - | | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_72] - | | | alias:x - | | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | |<-Select Operator [SEL_71] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_156] - | | predicate:(key is not null and value is not null) (type: boolean) - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_69] - | | alias:x - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | |<-Select Operator [SEL_107] - | outputColumnNames:["_col1"] - | Statistics:Num rows: 440 Data size: 4665 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_106] - | | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 440 Data size: 4665 Basic stats: COMPLETE Column stats: NONE - | |<-Union 30 [SIMPLE_EDGE] - | |<-Map 34 [CONTAINS] - | | Reduce Output Operator [RS_105] - | | key expressions:_col0 (type: string), _col1 (type: string) - | | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | | sort order:++ - | | Statistics:Num rows: 881 Data size: 9341 Basic stats: COMPLETE Column stats: NONE - | | Group By Operator [GBY_104] - | | keys:_col0 (type: string), _col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 881 Data size: 9341 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_100] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_161] - | | predicate:value is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_98] - | | alias:y - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 29 [CONTAINS] - | Reduce Output Operator [RS_105] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 881 Data size: 9341 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_104] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 881 Data size: 9341 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_96] - | | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 381 Data size: 4029 Basic stats: COMPLETE Column stats: NONE - | |<-Union 28 [SIMPLE_EDGE] - | |<-Map 33 [CONTAINS] - | | Reduce Output Operator [RS_95] - | | key expressions:_col0 (type: string), _col1 (type: string) - | | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | | sort order:++ - | | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | | Group By Operator [GBY_94] - | | keys:_col0 (type: string), _col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_90] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_160] - | | predicate:value is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_88] - | | alias:y - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 27 [CONTAINS] - | Reduce Output Operator [RS_95] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_94] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_86] - | | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - | |<-Union 26 [SIMPLE_EDGE] - | |<-Map 25 [CONTAINS] - | | Reduce Output Operator [RS_85] - | | key expressions:_col0 (type: string), _col1 (type: string) - | | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | | sort order:++ - | | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | | Group By Operator [GBY_84] - | | keys:_col0 (type: string), _col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_77] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_158] - | | predicate:value is not null (type: boolean) - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_75] - | | alias:x - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | |<-Map 32 [CONTAINS] - | Reduce Output Operator [RS_85] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_84] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_80] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_159] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_78] - | alias:y - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [CONTAINS] - Reduce Output Operator [RS_119] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 1061 Data size: 11260 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_118] - keys:_col0 (type: string), _col1 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1061 Data size: 11260 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_67] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 577 Data size: 6129 Basic stats: COMPLETE Column stats: NONE - |<-Union 5 [SIMPLE_EDGE] - |<-Reducer 18 [CONTAINS] - | Reduce Output Operator [RS_66] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 1155 Data size: 12270 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_65] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1155 Data size: 12270 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_61] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_165] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col2 (type: string)","1":"_col0 (type: string)"} - | | outputColumnNames:["_col2","_col5"] - | | Statistics:Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE - | |<-Map 22 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_59] - | | key expressions:_col0 (type: string) - | | Map-reduce partition columns:_col0 (type: string) - | | sort order:+ - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col1 (type: string) - | | Select Operator [SEL_54] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_155] - | | predicate:key is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_52] - | | alias:y - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 17 [SIMPLE_EDGE] - | Reduce Output Operator [RS_58] - | key expressions:_col2 (type: string) - | Map-reduce partition columns:_col2 (type: string) - | sort order:+ - | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_164] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: string)","1":"_col1 (type: string)"} - | | outputColumnNames:["_col2"] - | | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - | |<-Map 21 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_56] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: string) - | | Select Operator [SEL_51] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_154] - | | predicate:(key is not null and value is not null) (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_49] - | | alias:y - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 16 [SIMPLE_EDGE] - | Reduce Output Operator [RS_55] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 381 Data size: 4029 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_48] - | outputColumnNames:["_col1"] - | Statistics:Num rows: 381 Data size: 4029 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_47] - | | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 381 Data size: 4029 Basic stats: COMPLETE Column stats: NONE - | |<-Union 15 [SIMPLE_EDGE] - | |<-Map 20 [CONTAINS] - | | Reduce Output Operator [RS_46] - | | key expressions:_col0 (type: string), _col1 (type: string) - | | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | | sort order:++ - | | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | | Group By Operator [GBY_45] - | | keys:_col0 (type: string), _col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_41] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_153] - | | predicate:value is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_39] - | | alias:y - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 14 [CONTAINS] - | Reduce Output Operator [RS_46] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_45] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_37] - | | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - | |<-Union 13 [SIMPLE_EDGE] - | |<-Map 12 [CONTAINS] - | | Reduce Output Operator [RS_36] - | | key expressions:_col0 (type: string), _col1 (type: string) - | | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | | sort order:++ - | | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | | Group By Operator [GBY_35] - | | keys:_col0 (type: string), _col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_28] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_151] - | | predicate:value is not null (type: boolean) - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_26] - | | alias:x - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | |<-Map 19 [CONTAINS] - | Reduce Output Operator [RS_36] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_35] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_31] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_152] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_29] - | alias:y - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [CONTAINS] - Reduce Output Operator [RS_66] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 1155 Data size: 12270 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_65] - keys:_col0 (type: string), _col1 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1155 Data size: 12270 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_25] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_163] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col2 (type: string)","1":"_col0 (type: string)"} - | outputColumnNames:["_col2","_col5"] - | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_23] - | key expressions:_col0 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:+ - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_18] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_150] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_16] - | alias:y - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_22] - key expressions:_col2 (type: string) - Map-reduce partition columns:_col2 (type: string) - sort order:+ - Statistics:Num rows: 288 Data size: 3020 Basic stats: COMPLETE Column stats: NONE - Map Join Operator [MAPJOIN_162] - | condition map:[{"":"Inner Join 0 to 1"}] - | HybridGraceHashJoin:true - | keys:{"Reducer 3":"_col1 (type: string)","Map 10":"_col1 (type: string)"} - | outputColumnNames:["_col2"] - | Statistics:Num rows: 288 Data size: 3020 Basic stats: COMPLETE Column stats: NONE - |<-Map 10 [BROADCAST_EDGE] - | Reduce Output Operator [RS_20] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: string) - | Select Operator [SEL_15] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_149] - | predicate:(key is not null and value is not null) (type: boolean) - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_13] - | alias:x - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - |<-Select Operator [SEL_12] - outputColumnNames:["_col1"] - Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_11] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - |<-Union 2 [SIMPLE_EDGE] - |<-Map 1 [CONTAINS] - | Reduce Output Operator [RS_10] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_9] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_147] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:x - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [CONTAINS] - Reduce Output Operator [RS_10] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_9] - keys:_col0 (type: string), _col1 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_148] - predicate:value is not null (type: boolean) - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:y - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 8 + File Output Operator [FS_122] + Group By Operator [GBY_120] (rows=530 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 7 [SIMPLE_EDGE] + <-Reducer 31 [CONTAINS] + Reduce Output Operator [RS_119] + PartitionCols:_col0, _col1 + Group By Operator [GBY_118] (rows=1061 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_114] (rows=484 width=10) + Output:["_col0","_col1"] + Map Join Operator [MAPJOIN_167] (rows=484 width=10) + HybridGraceHashJoin:true,Output:["_col0","_col3"],keys:{"RS_111":"_col1","SEL_107":"_col1"} + <-Map 23 [BROADCAST_EDGE] + BROADCAST [RS_111] + PartitionCols:_col1 + Map Join Operator [MAPJOIN_166] (rows=27 width=7) + HybridGraceHashJoin:true,Output:["_col0","_col1","_col3"],keys:{"SEL_71":"_col0","RS_109":"_col0"} + <-Map 24 [BROADCAST_EDGE] + BROADCAST [RS_109] + PartitionCols:_col0 + Select Operator [SEL_74] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_157] (rows=25 width=7) + predicate:key is not null + TableScan [TS_72] (rows=25 width=7) + default@src1,x,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Select Operator [SEL_71] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_156] (rows=25 width=7) + predicate:(key is not null and value is not null) + TableScan [TS_69] (rows=25 width=7) + default@src1,x,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Select Operator [SEL_107] (rows=440 width=10) + Output:["_col1"] + Group By Operator [GBY_106] (rows=440 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 30 [SIMPLE_EDGE] + <-Map 34 [CONTAINS] + Reduce Output Operator [RS_105] + PartitionCols:_col0, _col1 + Group By Operator [GBY_104] (rows=881 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_100] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_161] (rows=500 width=10) + predicate:value is not null + TableScan [TS_98] (rows=500 width=10) + Output:["key","value"] + <-Reducer 29 [CONTAINS] + Reduce Output Operator [RS_105] + PartitionCols:_col0, _col1 + Group By Operator [GBY_104] (rows=881 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Group By Operator [GBY_96] (rows=381 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 28 [SIMPLE_EDGE] + <-Map 33 [CONTAINS] + Reduce Output Operator [RS_95] + PartitionCols:_col0, _col1 + Group By Operator [GBY_94] (rows=762 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_90] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_160] (rows=500 width=10) + predicate:value is not null + TableScan [TS_88] (rows=500 width=10) + Output:["key","value"] + <-Reducer 27 [CONTAINS] + Reduce Output Operator [RS_95] + PartitionCols:_col0, _col1 + Group By Operator [GBY_94] (rows=762 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Group By Operator [GBY_86] (rows=262 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 26 [SIMPLE_EDGE] + <-Map 25 [CONTAINS] + Reduce Output Operator [RS_85] + PartitionCols:_col0, _col1 + Group By Operator [GBY_84] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_77] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_158] (rows=25 width=7) + predicate:value is not null + TableScan [TS_75] (rows=25 width=7) + Output:["key","value"] + <-Map 32 [CONTAINS] + Reduce Output Operator [RS_85] + PartitionCols:_col0, _col1 + Group By Operator [GBY_84] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_80] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_159] (rows=500 width=10) + predicate:value is not null + TableScan [TS_78] (rows=500 width=10) + Output:["key","value"] + <-Reducer 6 [CONTAINS] + Reduce Output Operator [RS_119] + PartitionCols:_col0, _col1 + Group By Operator [GBY_118] (rows=1061 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Group By Operator [GBY_67] (rows=577 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 5 [SIMPLE_EDGE] + <-Reducer 18 [CONTAINS] + Reduce Output Operator [RS_66] + PartitionCols:_col0, _col1 + Group By Operator [GBY_65] (rows=1155 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_61] (rows=605 width=10) + Output:["_col0","_col1"] + Merge Join Operator [MERGEJOIN_165] (rows=605 width=10) + Output:["_col2","_col5"],keys:{"0":"_col2","1":"_col0"} + <-Map 22 [SIMPLE_EDGE] + SHUFFLE [RS_59] + PartitionCols:_col0 + Select Operator [SEL_54] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_155] (rows=500 width=10) + predicate:key is not null + TableScan [TS_52] (rows=500 width=10) + default@src,y,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Reducer 17 [SIMPLE_EDGE] + SHUFFLE [RS_58] + PartitionCols:_col2 + Merge Join Operator [MERGEJOIN_164] (rows=550 width=10) + Output:["_col2"],keys:{"0":"_col1","1":"_col1"} + <-Map 21 [SIMPLE_EDGE] + SHUFFLE [RS_56] + PartitionCols:_col1 + Select Operator [SEL_51] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_154] (rows=500 width=10) + predicate:(key is not null and value is not null) + TableScan [TS_49] (rows=500 width=10) + default@src,y,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Reducer 16 [SIMPLE_EDGE] + SHUFFLE [RS_55] + PartitionCols:_col1 + Select Operator [SEL_48] (rows=381 width=10) + Output:["_col1"] + Group By Operator [GBY_47] (rows=381 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 15 [SIMPLE_EDGE] + <-Map 20 [CONTAINS] + Reduce Output Operator [RS_46] + PartitionCols:_col0, _col1 + Group By Operator [GBY_45] (rows=762 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_41] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_153] (rows=500 width=10) + predicate:value is not null + TableScan [TS_39] (rows=500 width=10) + Output:["key","value"] + <-Reducer 14 [CONTAINS] + Reduce Output Operator [RS_46] + PartitionCols:_col0, _col1 + Group By Operator [GBY_45] (rows=762 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Group By Operator [GBY_37] (rows=262 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 13 [SIMPLE_EDGE] + <-Map 12 [CONTAINS] + Reduce Output Operator [RS_36] + PartitionCols:_col0, _col1 + Group By Operator [GBY_35] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_28] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_151] (rows=25 width=7) + predicate:value is not null + TableScan [TS_26] (rows=25 width=7) + Output:["key","value"] + <-Map 19 [CONTAINS] + Reduce Output Operator [RS_36] + PartitionCols:_col0, _col1 + Group By Operator [GBY_35] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_31] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_152] (rows=500 width=10) + predicate:value is not null + TableScan [TS_29] (rows=500 width=10) + Output:["key","value"] + <-Reducer 4 [CONTAINS] + Reduce Output Operator [RS_66] + PartitionCols:_col0, _col1 + Group By Operator [GBY_65] (rows=1155 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_25] (rows=550 width=10) + Output:["_col0","_col1"] + Merge Join Operator [MERGEJOIN_163] (rows=550 width=10) + Output:["_col2","_col5"],keys:{"0":"_col2","1":"_col0"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_23] + PartitionCols:_col0 + Select Operator [SEL_18] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_150] (rows=500 width=10) + predicate:key is not null + TableScan [TS_16] (rows=500 width=10) + default@src,y,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_22] + PartitionCols:_col2 + Map Join Operator [MAPJOIN_162] (rows=288 width=10) + HybridGraceHashJoin:true,Output:["_col2"],keys:{"SEL_12":"_col1","RS_20":"_col1"} + <-Map 10 [BROADCAST_EDGE] + BROADCAST [RS_20] + PartitionCols:_col1 + Select Operator [SEL_15] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_149] (rows=25 width=7) + predicate:(key is not null and value is not null) + TableScan [TS_13] (rows=25 width=7) + default@src1,x,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Select Operator [SEL_12] (rows=262 width=10) + Output:["_col1"] + Group By Operator [GBY_11] (rows=262 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 2 [SIMPLE_EDGE] + <-Map 1 [CONTAINS] + Reduce Output Operator [RS_10] + PartitionCols:_col0, _col1 + Group By Operator [GBY_9] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_2] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_147] (rows=25 width=7) + predicate:value is not null + TableScan [TS_0] (rows=25 width=7) + Output:["key","value"] + <-Map 9 [CONTAINS] + Reduce Output Operator [RS_10] + PartitionCols:_col0, _col1 + Group By Operator [GBY_9] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_5] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_148] (rows=500 width=10) + predicate:value is not null + TableScan [TS_3] (rows=500 width=10) + Output:["key","value"] PREHOOK: query: CREATE TABLE a(key STRING, value STRING) STORED AS TEXTFILE PREHOOK: type: CREATETABLE @@ -4039,471 +2903,664 @@ INSERT OVERWRITE TABLE a SELECT tmp.key, tmp.value INSERT OVERWRITE TABLE b SELECT tmp.key, tmp.value INSERT OVERWRITE TABLE c SELECT tmp.key, tmp.value POSTHOOK: type: QUERY -Plan not optimized by CBO. +STAGE DEPENDENCIES: + Stage-3 is a root stage + Stage-4 depends on stages: Stage-3 + Stage-0 depends on stages: Stage-4 + Stage-5 depends on stages: Stage-0 + Stage-8 depends on stages: Stage-0 + Stage-11 depends on stages: Stage-0 + Stage-14 depends on stages: Stage-0 + Stage-17 depends on stages: Stage-0 + Stage-20 depends on stages: Stage-0 + Stage-1 depends on stages: Stage-4 + Stage-6 depends on stages: Stage-1 + Stage-9 depends on stages: Stage-1 + Stage-12 depends on stages: Stage-1 + Stage-15 depends on stages: Stage-1 + Stage-18 depends on stages: Stage-1 + Stage-21 depends on stages: Stage-1 + Stage-2 depends on stages: Stage-4 + Stage-7 depends on stages: Stage-2 + Stage-10 depends on stages: Stage-2 + Stage-13 depends on stages: Stage-2 + Stage-16 depends on stages: Stage-2 + Stage-19 depends on stages: Stage-2 + Stage-22 depends on stages: Stage-2 -Vertex dependency in root stage -Map 1 <- Union 2 (CONTAINS) -Map 11 <- Union 9 (CONTAINS) -Map 12 <- Union 9 (CONTAINS) -Map 16 <- Map 20 (BROADCAST_EDGE), Union 4 (CONTAINS) -Map 17 <- Map 20 (BROADCAST_EDGE), Union 4 (CONTAINS) -Map 18 <- Map 20 (BROADCAST_EDGE), Union 4 (CONTAINS) -Map 19 <- Map 20 (BROADCAST_EDGE), Union 4 (CONTAINS) -Map 20 <- Map 21 (BROADCAST_EDGE) -Map 5 <- Union 2 (CONTAINS) -Map 7 <- Map 6 (BROADCAST_EDGE) -Map 8 <- Union 9 (CONTAINS) -Reducer 10 <- Reducer 14 (SIMPLE_EDGE), Union 4 (CONTAINS), Union 9 (SIMPLE_EDGE) -Reducer 14 <- Map 13 (SIMPLE_EDGE), Map 15 (SIMPLE_EDGE) -Reducer 3 <- Map 7 (SIMPLE_EDGE), Union 2 (SIMPLE_EDGE), Union 4 (CONTAINS) +STAGE PLANS: + Stage: Stage-3 + Tez + Edges: + Map 1 <- Union 2 (CONTAINS) + Map 11 <- Union 9 (CONTAINS) + Map 12 <- Union 9 (CONTAINS) + Map 16 <- Map 20 (BROADCAST_EDGE), Union 4 (CONTAINS) + Map 17 <- Map 20 (BROADCAST_EDGE), Union 4 (CONTAINS) + Map 18 <- Map 20 (BROADCAST_EDGE), Union 4 (CONTAINS) + Map 19 <- Map 20 (BROADCAST_EDGE), Union 4 (CONTAINS) + Map 20 <- Map 21 (BROADCAST_EDGE) + Map 5 <- Union 2 (CONTAINS) + Map 7 <- Map 6 (BROADCAST_EDGE) + Map 8 <- Union 9 (CONTAINS) + Reducer 10 <- Reducer 14 (SIMPLE_EDGE), Union 4 (CONTAINS), Union 9 (SIMPLE_EDGE) + Reducer 14 <- Map 13 (SIMPLE_EDGE), Map 15 (SIMPLE_EDGE) + Reducer 3 <- Map 7 (SIMPLE_EDGE), Union 2 (SIMPLE_EDGE), Union 4 (CONTAINS) +#### A masked pattern was here #### + Vertices: + Map 1 + Map Operator Tree: + TableScan + alias: src1 + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: value is not null (type: boolean) + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + predicate: value is not null + Select Operator + expressions: value (type: string) + outputColumnNames: _col1 + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + Reduce Output Operator + key expressions: _col1 (type: string) + sort order: + + Map-reduce partition columns: _col1 (type: string) + Statistics: Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE + Map 11 + Map Operator Tree: + TableScan + alias: src + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: value is not null (type: boolean) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + predicate: value is not null + Select Operator + expressions: value (type: string) + outputColumnNames: _col1 + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Reduce Output Operator + key expressions: _col1 (type: string) + sort order: + + Map-reduce partition columns: _col1 (type: string) + Statistics: Num rows: 1025 Data size: 10815 Basic stats: COMPLETE Column stats: NONE + Map 12 + Map Operator Tree: + TableScan + alias: src + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: value is not null (type: boolean) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + predicate: value is not null + Select Operator + expressions: value (type: string) + outputColumnNames: _col1 + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Reduce Output Operator + key expressions: _col1 (type: string) + sort order: + + Map-reduce partition columns: _col1 (type: string) + Statistics: Num rows: 1025 Data size: 10815 Basic stats: COMPLETE Column stats: NONE + Map 13 + Map Operator Tree: + TableScan + alias: x + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: (key is not null and value is not null) (type: boolean) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + predicate: (key is not null and value is not null) + Reduce Output Operator + key expressions: key (type: string) + sort order: + + Map-reduce partition columns: key (type: string) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + value expressions: value (type: string) + Map 15 + Map Operator Tree: + TableScan + alias: y + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: key is not null (type: boolean) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + predicate: key is not null + Reduce Output Operator + key expressions: key (type: string) + sort order: + + Map-reduce partition columns: key (type: string) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + value expressions: value (type: string) + Map 16 + Map Operator Tree: + TableScan + alias: src1 + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: value is not null (type: boolean) + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + predicate: value is not null + Select Operator + expressions: value (type: string) + outputColumnNames: _col1 + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + Map Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 _col1 (type: string) + 1 _col1 (type: string) + outputColumnNames: _col0, _col6 + input vertices: + 0 Map 20 + Statistics: Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE + HybridGraceHashJoin: true + Select Operator + expressions: _col0 (type: string), _col6 (type: string) + outputColumnNames: _col0, _col1 + Statistics: Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE + File Output Operator + compressed: false + Statistics: Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.a + File Output Operator + compressed: false + Statistics: Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.b + File Output Operator + compressed: false + Statistics: Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.c + Map 17 + Map Operator Tree: + TableScan + alias: src + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: value is not null (type: boolean) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + predicate: value is not null + Select Operator + expressions: value (type: string) + outputColumnNames: _col1 + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Map Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 _col1 (type: string) + 1 _col1 (type: string) + outputColumnNames: _col0, _col6 + input vertices: + 0 Map 20 + Statistics: Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE + HybridGraceHashJoin: true + Select Operator + expressions: _col0 (type: string), _col6 (type: string) + outputColumnNames: _col0, _col1 + Statistics: Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE + File Output Operator + compressed: false + Statistics: Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.a + File Output Operator + compressed: false + Statistics: Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.b + File Output Operator + compressed: false + Statistics: Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.c + Map 18 + Map Operator Tree: + TableScan + alias: src + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: value is not null (type: boolean) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + predicate: value is not null + Select Operator + expressions: value (type: string) + outputColumnNames: _col1 + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Map Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 _col1 (type: string) + 1 _col1 (type: string) + outputColumnNames: _col0, _col6 + input vertices: + 0 Map 20 + Statistics: Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE + HybridGraceHashJoin: true + Select Operator + expressions: _col0 (type: string), _col6 (type: string) + outputColumnNames: _col0, _col1 + Statistics: Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE + File Output Operator + compressed: false + Statistics: Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.a + File Output Operator + compressed: false + Statistics: Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.b + File Output Operator + compressed: false + Statistics: Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.c + Map 19 + Map Operator Tree: + TableScan + alias: src + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: value is not null (type: boolean) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + predicate: value is not null + Select Operator + expressions: value (type: string) + outputColumnNames: _col1 + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Map Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 _col1 (type: string) + 1 _col1 (type: string) + outputColumnNames: _col0, _col6 + input vertices: + 0 Map 20 + Statistics: Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE + HybridGraceHashJoin: true + Select Operator + expressions: _col0 (type: string), _col6 (type: string) + outputColumnNames: _col0, _col1 + Statistics: Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE + File Output Operator + compressed: false + Statistics: Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.a + File Output Operator + compressed: false + Statistics: Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.b + File Output Operator + compressed: false + Statistics: Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.c + Map 20 + Map Operator Tree: + TableScan + alias: x + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: (key is not null and value is not null) (type: boolean) + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + predicate: (key is not null and value is not null) + Map Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 key (type: string) + 1 key (type: string) + outputColumnNames: _col0, _col1, _col6 + input vertices: + 1 Map 21 + Statistics: Num rows: 27 Data size: 210 Basic stats: COMPLETE Column stats: NONE + HybridGraceHashJoin: true + Reduce Output Operator + key expressions: _col1 (type: string) + sort order: + + Map-reduce partition columns: _col1 (type: string) + Statistics: Num rows: 27 Data size: 210 Basic stats: COMPLETE Column stats: NONE + value expressions: _col0 (type: string), _col6 (type: string) + Reduce Output Operator + key expressions: _col1 (type: string) + sort order: + + Map-reduce partition columns: _col1 (type: string) + Statistics: Num rows: 27 Data size: 210 Basic stats: COMPLETE Column stats: NONE + value expressions: _col0 (type: string), _col6 (type: string) + Reduce Output Operator + key expressions: _col1 (type: string) + sort order: + + Map-reduce partition columns: _col1 (type: string) + Statistics: Num rows: 27 Data size: 210 Basic stats: COMPLETE Column stats: NONE + value expressions: _col0 (type: string), _col6 (type: string) + Reduce Output Operator + key expressions: _col1 (type: string) + sort order: + + Map-reduce partition columns: _col1 (type: string) + Statistics: Num rows: 27 Data size: 210 Basic stats: COMPLETE Column stats: NONE + value expressions: _col0 (type: string), _col6 (type: string) + Map 21 + Map Operator Tree: + TableScan + alias: y + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: key is not null (type: boolean) + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + predicate: key is not null + Reduce Output Operator + key expressions: key (type: string) + sort order: + + Map-reduce partition columns: key (type: string) + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + value expressions: value (type: string) + Map 5 + Map Operator Tree: + TableScan + alias: src + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: value is not null (type: boolean) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + predicate: value is not null + Select Operator + expressions: value (type: string) + outputColumnNames: _col1 + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Reduce Output Operator + key expressions: _col1 (type: string) + sort order: + + Map-reduce partition columns: _col1 (type: string) + Statistics: Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE + Map 6 + Map Operator Tree: + TableScan + alias: x + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: (key is not null and value is not null) (type: boolean) + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + predicate: (key is not null and value is not null) + Reduce Output Operator + key expressions: key (type: string) + sort order: + + Map-reduce partition columns: key (type: string) + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + value expressions: value (type: string) + Map 7 + Map Operator Tree: + TableScan + alias: y + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: key is not null (type: boolean) + Statistics: Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + predicate: key is not null + Map Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 key (type: string) + 1 key (type: string) + outputColumnNames: _col0, _col1, _col6 + input vertices: + 0 Map 6 + Statistics: Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE + HybridGraceHashJoin: true + Reduce Output Operator + key expressions: _col1 (type: string) + sort order: + + Map-reduce partition columns: _col1 (type: string) + Statistics: Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE + value expressions: _col0 (type: string), _col6 (type: string) + Map 8 + Map Operator Tree: + TableScan + alias: src1 + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + Filter Operator + predicate: value is not null (type: boolean) + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + predicate: value is not null + Select Operator + expressions: value (type: string) + outputColumnNames: _col1 + Statistics: Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE + Reduce Output Operator + key expressions: _col1 (type: string) + sort order: + + Map-reduce partition columns: _col1 (type: string) + Statistics: Num rows: 1025 Data size: 10815 Basic stats: COMPLETE Column stats: NONE + Reducer 10 + Reduce Operator Tree: + Merge Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 _col1 (type: string) + 1 _col1 (type: string) + outputColumnNames: _col0, _col6 + Statistics: Num rows: 1127 Data size: 11896 Basic stats: COMPLETE Column stats: NONE + Select Operator + expressions: _col0 (type: string), _col6 (type: string) + outputColumnNames: _col0, _col1 + Statistics: Num rows: 1127 Data size: 11896 Basic stats: COMPLETE Column stats: NONE + File Output Operator + compressed: false + Statistics: Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.a + File Output Operator + compressed: false + Statistics: Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.b + File Output Operator + compressed: false + Statistics: Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.c + Reducer 14 + Reduce Operator Tree: + Merge Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 key (type: string) + 1 key (type: string) + outputColumnNames: _col0, _col1, _col6 + Statistics: Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE + Reduce Output Operator + key expressions: _col1 (type: string) + sort order: + + Map-reduce partition columns: _col1 (type: string) + Statistics: Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE + value expressions: _col0 (type: string), _col6 (type: string) + Reducer 3 + Reduce Operator Tree: + Merge Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 _col1 (type: string) + 1 _col1 (type: string) + outputColumnNames: _col0, _col6 + Statistics: Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE + Select Operator + expressions: _col0 (type: string), _col6 (type: string) + outputColumnNames: _col0, _col1 + Statistics: Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE + File Output Operator + compressed: false + Statistics: Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.a + File Output Operator + compressed: false + Statistics: Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.b + File Output Operator + compressed: false + Statistics: Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.c + Union 2 + Vertex: Union 2 + Union 4 + Vertex: Union 4 + Union 9 + Vertex: Union 9 -Stage-5 - Stats-Aggr Operator - Stage-0 - Move Operator - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.a"} - Stage-4 - Dependency Collection{} - Stage-3 - Union 4 - |<-Map 16 [CONTAINS] - | File Output Operator [FS_62] - | compressed:false - | Statistics:Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE - | table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.a"} - | Select Operator [SEL_60] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE - | Map Join Operator [MAPJOIN_108] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | HybridGraceHashJoin:true - | | keys:{"Map 20":"_col1 (type: string)","Map 16":"_col1 (type: string)"} - | | outputColumnNames:["_col0","_col6"] - | | Statistics:Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE - | |<-Map 20 [BROADCAST_EDGE] - | | Reduce Output Operator [RS_56] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 27 Data size: 210 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: string), _col6 (type: string) - | | Map Join Operator [MAPJOIN_105] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | HybridGraceHashJoin:true - | | | keys:{"Map 20":"key (type: string)","Map 21":"key (type: string)"} - | | | outputColumnNames:["_col0","_col1","_col6"] - | | | Statistics:Num rows: 27 Data size: 210 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 21 [BROADCAST_EDGE] - | | | Reduce Output Operator [RS_53] - | | | key expressions:key (type: string) - | | | Map-reduce partition columns:key (type: string) - | | | sort order:+ - | | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:value (type: string) - | | | Filter Operator [FIL_102] - | | | predicate:key is not null (type: boolean) - | | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_49] - | | | alias:y - | | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | |<-Filter Operator [FIL_101] - | | predicate:(key is not null and value is not null) (type: boolean) - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_48] - | | alias:x - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | Reduce Output Operator [RS_110] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 27 Data size: 210 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: string), _col6 (type: string) - | | Please refer to the previous Map Join Operator [MAPJOIN_105] - | | Reduce Output Operator [RS_111] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 27 Data size: 210 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: string), _col6 (type: string) - | | Please refer to the previous Map Join Operator [MAPJOIN_105] - | | Reduce Output Operator [RS_112] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 27 Data size: 210 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: string), _col6 (type: string) - | | Please refer to the previous Map Join Operator [MAPJOIN_105] - | |<-Select Operator [SEL_40] - | outputColumnNames:["_col1"] - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_97] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_39] - | alias:src1 - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | File Output Operator [FS_64] - | compressed:false - | Statistics:Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE - | table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.b"} - | Please refer to the previous Select Operator [SEL_60] - | File Output Operator [FS_66] - | compressed:false - | Statistics:Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE - | table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.c"} - | Please refer to the previous Select Operator [SEL_60] - |<-Map 17 [CONTAINS] - | File Output Operator [FS_62] - | compressed:false - | Statistics:Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE - | table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.a"} - | Select Operator [SEL_60] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE - | Map Join Operator [MAPJOIN_108] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | HybridGraceHashJoin:true - | | keys:{"Map 20":"_col1 (type: string)","Map 17":"_col1 (type: string)"} - | | outputColumnNames:["_col0","_col6"] - | | Statistics:Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE - | |<- Please refer to the previous Map 20 [BROADCAST_EDGE] - | |<-Select Operator [SEL_42] - | outputColumnNames:["_col1"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_98] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_41] - | alias:src - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | File Output Operator [FS_64] - | compressed:false - | Statistics:Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE - | table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.b"} - | Please refer to the previous Select Operator [SEL_60] - | File Output Operator [FS_66] - | compressed:false - | Statistics:Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE - | table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.c"} - | Please refer to the previous Select Operator [SEL_60] - |<-Map 18 [CONTAINS] - | File Output Operator [FS_62] - | compressed:false - | Statistics:Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE - | table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.a"} - | Select Operator [SEL_60] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE - | Map Join Operator [MAPJOIN_108] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | HybridGraceHashJoin:true - | | keys:{"Map 20":"_col1 (type: string)","Map 18":"_col1 (type: string)"} - | | outputColumnNames:["_col0","_col6"] - | | Statistics:Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE - | |<- Please refer to the previous Map 20 [BROADCAST_EDGE] - | |<-Select Operator [SEL_45] - | outputColumnNames:["_col1"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_99] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_44] - | alias:src - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | File Output Operator [FS_64] - | compressed:false - | Statistics:Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE - | table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.b"} - | Please refer to the previous Select Operator [SEL_60] - | File Output Operator [FS_66] - | compressed:false - | Statistics:Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE - | table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.c"} - | Please refer to the previous Select Operator [SEL_60] - |<-Map 19 [CONTAINS] - | File Output Operator [FS_62] - | compressed:false - | Statistics:Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE - | table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.a"} - | Select Operator [SEL_60] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE - | Map Join Operator [MAPJOIN_108] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | HybridGraceHashJoin:true - | | keys:{"Map 20":"_col1 (type: string)","Map 19":"_col1 (type: string)"} - | | outputColumnNames:["_col0","_col6"] - | | Statistics:Num rows: 1677 Data size: 17739 Basic stats: COMPLETE Column stats: NONE - | |<- Please refer to the previous Map 20 [BROADCAST_EDGE] - | |<-Select Operator [SEL_47] - | outputColumnNames:["_col1"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_100] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_46] - | alias:src - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | File Output Operator [FS_64] - | compressed:false - | Statistics:Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE - | table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.b"} - | Please refer to the previous Select Operator [SEL_60] - | File Output Operator [FS_66] - | compressed:false - | Statistics:Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE - | table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.c"} - | Please refer to the previous Select Operator [SEL_60] - |<-Reducer 10 [CONTAINS] - | File Output Operator [FS_62] - | compressed:false - | Statistics:Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE - | table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.a"} - | Select Operator [SEL_37] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1127 Data size: 11896 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_107] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: string)","1":"_col1 (type: string)"} - | | outputColumnNames:["_col0","_col6"] - | | Statistics:Num rows: 1127 Data size: 11896 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 14 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_33] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: string), _col6 (type: string) - | | Merge Join Operator [MERGEJOIN_104] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | keys:{"0":"key (type: string)","1":"key (type: string)"} - | | | outputColumnNames:["_col0","_col1","_col6"] - | | | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 13 [SIMPLE_EDGE] - | | | Reduce Output Operator [RS_28] - | | | key expressions:key (type: string) - | | | Map-reduce partition columns:key (type: string) - | | | sort order:+ - | | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:value (type: string) - | | | Filter Operator [FIL_95] - | | | predicate:(key is not null and value is not null) (type: boolean) - | | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_25] - | | | alias:x - | | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 15 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_30] - | | key expressions:key (type: string) - | | Map-reduce partition columns:key (type: string) - | | sort order:+ - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | value expressions:value (type: string) - | | Filter Operator [FIL_96] - | | predicate:key is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_26] - | | alias:y - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Union 9 [SIMPLE_EDGE] - | |<-Map 11 [CONTAINS] - | | Reduce Output Operator [RS_35] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 1025 Data size: 10815 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_21] - | | outputColumnNames:["_col1"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_93] - | | predicate:value is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_20] - | | alias:src - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Map 12 [CONTAINS] - | | Reduce Output Operator [RS_35] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 1025 Data size: 10815 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_24] - | | outputColumnNames:["_col1"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_94] - | | predicate:value is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_23] - | | alias:src - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Map 8 [CONTAINS] - | Reduce Output Operator [RS_35] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 1025 Data size: 10815 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_19] - | outputColumnNames:["_col1"] - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_92] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_18] - | alias:src1 - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | File Output Operator [FS_64] - | compressed:false - | Statistics:Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE - | table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.b"} - | Please refer to the previous Select Operator [SEL_37] - | File Output Operator [FS_66] - | compressed:false - | Statistics:Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE - | table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.c"} - | Please refer to the previous Select Operator [SEL_37] - |<-Reducer 3 [CONTAINS] - File Output Operator [FS_62] - compressed:false - Statistics:Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.a"} - Select Operator [SEL_17] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_106] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: string)","1":"_col1 (type: string)"} - | outputColumnNames:["_col0","_col6"] - | Statistics:Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE - |<-Map 7 [SIMPLE_EDGE] - | Reduce Output Operator [RS_13] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: string), _col6 (type: string) - | Map Join Operator [MAPJOIN_103] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | HybridGraceHashJoin:true - | | keys:{"Map 6":"key (type: string)","Map 7":"key (type: string)"} - | | outputColumnNames:["_col0","_col1","_col6"] - | | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - | |<-Map 6 [BROADCAST_EDGE] - | | Reduce Output Operator [RS_8] - | | key expressions:key (type: string) - | | Map-reduce partition columns:key (type: string) - | | sort order:+ - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | value expressions:value (type: string) - | | Filter Operator [FIL_90] - | | predicate:(key is not null and value is not null) (type: boolean) - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_5] - | | alias:x - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | |<-Filter Operator [FIL_91] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:y - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Union 2 [SIMPLE_EDGE] - |<-Map 1 [CONTAINS] - | Reduce Output Operator [RS_15] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_1] - | outputColumnNames:["_col1"] - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_88] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:src1 - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - |<-Map 5 [CONTAINS] - Reduce Output Operator [RS_15] - key expressions:_col1 (type: string) - Map-reduce partition columns:_col1 (type: string) - sort order:+ - Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_3] - outputColumnNames:["_col1"] - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_89] - predicate:value is not null (type: boolean) - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_2] - alias:src - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - File Output Operator [FS_64] - compressed:false - Statistics:Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.b"} - Please refer to the previous Select Operator [SEL_17] - File Output Operator [FS_66] - compressed:false - Statistics:Num rows: 3409 Data size: 36062 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.c"} - Please refer to the previous Select Operator [SEL_17] -Stage-8 - Stats-Aggr Operator - Please refer to the previous Stage-0 -Stage-11 - Stats-Aggr Operator - Please refer to the previous Stage-0 -Stage-14 - Stats-Aggr Operator - Please refer to the previous Stage-0 -Stage-17 - Stats-Aggr Operator - Please refer to the previous Stage-0 -Stage-20 - Stats-Aggr Operator - Please refer to the previous Stage-0 -Stage-6 - Stats-Aggr Operator - Stage-1 - Move Operator - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.b"} - Please refer to the previous Stage-4 -Stage-9 - Stats-Aggr Operator - Please refer to the previous Stage-1 -Stage-12 - Stats-Aggr Operator - Please refer to the previous Stage-1 -Stage-15 - Stats-Aggr Operator - Please refer to the previous Stage-1 -Stage-18 - Stats-Aggr Operator - Please refer to the previous Stage-1 -Stage-21 - Stats-Aggr Operator - Please refer to the previous Stage-1 -Stage-7 - Stats-Aggr Operator - Stage-2 - Move Operator - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.c"} - Please refer to the previous Stage-4 -Stage-10 - Stats-Aggr Operator - Please refer to the previous Stage-2 -Stage-13 - Stats-Aggr Operator - Please refer to the previous Stage-2 -Stage-16 - Stats-Aggr Operator - Please refer to the previous Stage-2 -Stage-19 - Stats-Aggr Operator - Please refer to the previous Stage-2 -Stage-22 - Stats-Aggr Operator - Please refer to the previous Stage-2 + Stage: Stage-4 + Dependency Collection + + Stage: Stage-0 + Move Operator + tables: + replace: true + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.a + + Stage: Stage-5 + Stats-Aggr Operator + + Stage: Stage-8 + Stats-Aggr Operator + + Stage: Stage-11 + Stats-Aggr Operator + + Stage: Stage-14 + Stats-Aggr Operator + + Stage: Stage-17 + Stats-Aggr Operator + + Stage: Stage-20 + Stats-Aggr Operator + + Stage: Stage-1 + Move Operator + tables: + replace: true + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.b + + Stage: Stage-6 + Stats-Aggr Operator + + Stage: Stage-9 + Stats-Aggr Operator + + Stage: Stage-12 + Stats-Aggr Operator + + Stage: Stage-15 + Stats-Aggr Operator + + Stage: Stage-18 + Stats-Aggr Operator + + Stage: Stage-21 + Stats-Aggr Operator + + Stage: Stage-2 + Move Operator + tables: + replace: true + table: + input format: org.apache.hadoop.mapred.TextInputFormat + output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat + serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe + name: default.c + + Stage: Stage-7 + Stats-Aggr Operator + + Stage: Stage-10 + Stats-Aggr Operator + + Stage: Stage-13 + Stats-Aggr Operator + + Stage: Stage-16 + Stats-Aggr Operator + + Stage: Stage-19 + Stats-Aggr Operator + + Stage: Stage-22 + Stats-Aggr Operator PREHOOK: query: explain FROM @@ -4564,469 +3621,267 @@ Reducer 6 <- Union 5 (SIMPLE_EDGE), Union 7 (CONTAINS) Reducer 8 <- Union 7 (SIMPLE_EDGE) Stage-5 - Stats-Aggr Operator - Stage-0 - Move Operator - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.a"} - Stage-4 - Dependency Collection{} - Stage-3 - Reducer 8 - File Output Operator [FS_114] - compressed:false - Statistics:Num rows: 544 Data size: 5773 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.a"} - Group By Operator [GBY_111] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 544 Data size: 5773 Basic stats: COMPLETE Column stats: NONE - |<-Union 7 [SIMPLE_EDGE] - |<-Reducer 29 [CONTAINS] - | Reduce Output Operator [RS_110] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 1089 Data size: 11558 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_109] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1089 Data size: 11558 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_105] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 484 Data size: 5131 Basic stats: COMPLETE Column stats: NONE - | Map Join Operator [MAPJOIN_160] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | HybridGraceHashJoin:true - | | keys:{"Map 33":"_col1 (type: string)","Reducer 29":"_col1 (type: string)"} - | | outputColumnNames:["_col0","_col6"] - | | Statistics:Num rows: 484 Data size: 5131 Basic stats: COMPLETE Column stats: NONE - | |<-Map 33 [BROADCAST_EDGE] - | | Reduce Output Operator [RS_101] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 27 Data size: 210 Basic stats: COMPLETE Column stats: NONE - | | value expressions:_col0 (type: string), _col6 (type: string) - | | Map Join Operator [MAPJOIN_157] - | | | condition map:[{"":"Inner Join 0 to 1"}] - | | | HybridGraceHashJoin:true - | | | keys:{"Map 33":"key (type: string)","Map 34":"key (type: string)"} - | | | outputColumnNames:["_col0","_col1","_col6"] - | | | Statistics:Num rows: 27 Data size: 210 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 34 [BROADCAST_EDGE] - | | | Reduce Output Operator [RS_98] - | | | key expressions:key (type: string) - | | | Map-reduce partition columns:key (type: string) - | | | sort order:+ - | | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | | value expressions:value (type: string) - | | | Filter Operator [FIL_154] - | | | predicate:key is not null (type: boolean) - | | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_94] - | | | alias:y - | | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | |<-Filter Operator [FIL_153] - | | predicate:(key is not null and value is not null) (type: boolean) - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_93] - | | alias:x - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | |<-Select Operator [SEL_92] - | outputColumnNames:["_col1"] - | Statistics:Num rows: 440 Data size: 4665 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_91] - | | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 440 Data size: 4665 Basic stats: COMPLETE Column stats: NONE - | |<-Union 28 [SIMPLE_EDGE] - | |<-Map 32 [CONTAINS] - | | Reduce Output Operator [RS_90] - | | key expressions:_col0 (type: string), _col1 (type: string) - | | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | | sort order:++ - | | Statistics:Num rows: 881 Data size: 9341 Basic stats: COMPLETE Column stats: NONE - | | Group By Operator [GBY_89] - | | keys:_col0 (type: string), _col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 881 Data size: 9341 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_85] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_152] - | | predicate:value is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_84] - | | alias:src - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 27 [CONTAINS] - | Reduce Output Operator [RS_90] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 881 Data size: 9341 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_89] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 881 Data size: 9341 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_82] - | | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 381 Data size: 4029 Basic stats: COMPLETE Column stats: NONE - | |<-Union 26 [SIMPLE_EDGE] - | |<-Map 31 [CONTAINS] - | | Reduce Output Operator [RS_81] - | | key expressions:_col0 (type: string), _col1 (type: string) - | | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | | sort order:++ - | | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | | Group By Operator [GBY_80] - | | keys:_col0 (type: string), _col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_76] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_151] - | | predicate:value is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_75] - | | alias:src - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 25 [CONTAINS] - | Reduce Output Operator [RS_81] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_80] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_73] - | | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - | |<-Union 24 [SIMPLE_EDGE] - | |<-Map 23 [CONTAINS] - | | Reduce Output Operator [RS_72] - | | key expressions:_col0 (type: string), _col1 (type: string) - | | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | | sort order:++ - | | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | | Group By Operator [GBY_71] - | | keys:_col0 (type: string), _col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_65] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_149] - | | predicate:value is not null (type: boolean) - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_64] - | | alias:src1 - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | |<-Map 30 [CONTAINS] - | Reduce Output Operator [RS_72] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_71] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_67] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_150] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_66] - | alias:src - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 6 [CONTAINS] - Reduce Output Operator [RS_110] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 1089 Data size: 11558 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_109] - keys:_col0 (type: string), _col1 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1089 Data size: 11558 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_62] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE - |<-Union 5 [SIMPLE_EDGE] - |<-Reducer 17 [CONTAINS] - | Reduce Output Operator [RS_61] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 1210 Data size: 12854 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_60] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1210 Data size: 12854 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_56] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE - | Merge Join Operator [MERGEJOIN_159] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"_col1 (type: string)","1":"_col1 (type: string)"} - | | outputColumnNames:["_col0","_col6"] - | | Statistics:Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 16 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_54] - | | key expressions:_col1 (type: string) - | | Map-reduce partition columns:_col1 (type: string) - | | sort order:+ - | | Statistics:Num rows: 381 Data size: 4029 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_43] - | | outputColumnNames:["_col1"] - | | Statistics:Num rows: 381 Data size: 4029 Basic stats: COMPLETE Column stats: NONE - | | Group By Operator [GBY_42] - | | | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | | | outputColumnNames:["_col0","_col1"] - | | | Statistics:Num rows: 381 Data size: 4029 Basic stats: COMPLETE Column stats: NONE - | | |<-Union 15 [SIMPLE_EDGE] - | | |<-Map 19 [CONTAINS] - | | | Reduce Output Operator [RS_41] - | | | key expressions:_col0 (type: string), _col1 (type: string) - | | | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | | | sort order:++ - | | | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | | | Group By Operator [GBY_40] - | | | keys:_col0 (type: string), _col1 (type: string) - | | | outputColumnNames:["_col0","_col1"] - | | | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | | | Select Operator [SEL_36] - | | | outputColumnNames:["_col0","_col1"] - | | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_146] - | | | predicate:value is not null (type: boolean) - | | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_35] - | | | alias:src - | | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | |<-Reducer 14 [CONTAINS] - | | Reduce Output Operator [RS_41] - | | key expressions:_col0 (type: string), _col1 (type: string) - | | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | | sort order:++ - | | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | | Group By Operator [GBY_40] - | | keys:_col0 (type: string), _col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 762 Data size: 8058 Basic stats: COMPLETE Column stats: NONE - | | Group By Operator [GBY_33] - | | | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | | | outputColumnNames:["_col0","_col1"] - | | | Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - | | |<-Union 13 [SIMPLE_EDGE] - | | |<-Map 12 [CONTAINS] - | | | Reduce Output Operator [RS_32] - | | | key expressions:_col0 (type: string), _col1 (type: string) - | | | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | | | sort order:++ - | | | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | | | Group By Operator [GBY_31] - | | | keys:_col0 (type: string), _col1 (type: string) - | | | outputColumnNames:["_col0","_col1"] - | | | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | | | Select Operator [SEL_25] - | | | outputColumnNames:["_col0","_col1"] - | | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | | Filter Operator [FIL_144] - | | | predicate:value is not null (type: boolean) - | | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | | TableScan [TS_24] - | | | alias:src1 - | | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | |<-Map 18 [CONTAINS] - | | Reduce Output Operator [RS_32] - | | key expressions:_col0 (type: string), _col1 (type: string) - | | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | | sort order:++ - | | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | | Group By Operator [GBY_31] - | | keys:_col0 (type: string), _col1 (type: string) - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | | Select Operator [SEL_27] - | | outputColumnNames:["_col0","_col1"] - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | Filter Operator [FIL_145] - | | predicate:value is not null (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_26] - | | alias:src - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Reducer 21 [SIMPLE_EDGE] - | Reduce Output Operator [RS_52] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: string), _col6 (type: string) - | Merge Join Operator [MERGEJOIN_156] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | keys:{"0":"key (type: string)","1":"key (type: string)"} - | | outputColumnNames:["_col0","_col1","_col6"] - | | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - | |<-Map 20 [SIMPLE_EDGE] - | | Reduce Output Operator [RS_47] - | | key expressions:key (type: string) - | | Map-reduce partition columns:key (type: string) - | | sort order:+ - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | value expressions:value (type: string) - | | Filter Operator [FIL_147] - | | predicate:(key is not null and value is not null) (type: boolean) - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_44] - | | alias:x - | | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | |<-Map 22 [SIMPLE_EDGE] - | Reduce Output Operator [RS_49] - | key expressions:key (type: string) - | Map-reduce partition columns:key (type: string) - | sort order:+ - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | value expressions:value (type: string) - | Filter Operator [FIL_148] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_45] - | alias:y - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 4 [CONTAINS] - Reduce Output Operator [RS_61] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 1210 Data size: 12854 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_60] - keys:_col0 (type: string), _col1 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1210 Data size: 12854 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_23] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_158] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"_col1 (type: string)","1":"_col1 (type: string)"} - | outputColumnNames:["_col0","_col6"] - | Statistics:Num rows: 605 Data size: 6427 Basic stats: COMPLETE Column stats: NONE - |<-Map 11 [SIMPLE_EDGE] - | Reduce Output Operator [RS_19] - | key expressions:_col1 (type: string) - | Map-reduce partition columns:_col1 (type: string) - | sort order:+ - | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col0 (type: string), _col6 (type: string) - | Map Join Operator [MAPJOIN_155] - | | condition map:[{"":"Inner Join 0 to 1"}] - | | HybridGraceHashJoin:true - | | keys:{"Map 10":"key (type: string)","Map 11":"key (type: string)"} - | | outputColumnNames:["_col0","_col1","_col6"] - | | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - | |<-Map 10 [BROADCAST_EDGE] - | | Reduce Output Operator [RS_14] - | | key expressions:key (type: string) - | | Map-reduce partition columns:key (type: string) - | | sort order:+ - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | value expressions:value (type: string) - | | Filter Operator [FIL_142] - | | predicate:(key is not null and value is not null) (type: boolean) - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | | TableScan [TS_11] - | | alias:x - | | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | |<-Filter Operator [FIL_143] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_12] - | alias:y - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_21] - key expressions:_col1 (type: string) - Map-reduce partition columns:_col1 (type: string) - sort order:+ - Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_10] - outputColumnNames:["_col1"] - Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_9] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 262 Data size: 2746 Basic stats: COMPLETE Column stats: NONE - |<-Union 2 [SIMPLE_EDGE] - |<-Map 1 [CONTAINS] - | Reduce Output Operator [RS_8] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:++ - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Group By Operator [GBY_7] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - | Select Operator [SEL_1] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_140] - | predicate:value is not null (type: boolean) - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:src1 - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - |<-Map 9 [CONTAINS] - Reduce Output Operator [RS_8] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:++ - Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - Group By Operator [GBY_7] - keys:_col0 (type: string), _col1 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 525 Data size: 5503 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_3] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_141] - predicate:value is not null (type: boolean) - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_2] - alias:src - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - File Output Operator [FS_116] - compressed:false - Statistics:Num rows: 544 Data size: 5773 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.b"} - Please refer to the previous Group By Operator [GBY_111] - File Output Operator [FS_118] - compressed:false - Statistics:Num rows: 544 Data size: 5773 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.c"} - Please refer to the previous Group By Operator [GBY_111] + Stats-Aggr Operator + Stage-0 + Move Operator + table:{"name:":"default.a"} + Stage-4 + Dependency Collection{} + Stage-3 + Reducer 8 + File Output Operator [FS_114] + table:{"name:":"default.a"} + Group By Operator [GBY_111] (rows=544 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 7 [SIMPLE_EDGE] + <-Reducer 29 [CONTAINS] + Reduce Output Operator [RS_110] + PartitionCols:_col0, _col1 + Group By Operator [GBY_109] (rows=1089 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_105] (rows=484 width=10) + Output:["_col0","_col1"] + Map Join Operator [MAPJOIN_160] (rows=484 width=10) + HybridGraceHashJoin:true,Output:["_col0","_col6"],keys:{"RS_101":"_col1","SEL_92":"_col1"} + <-Map 33 [BROADCAST_EDGE] + BROADCAST [RS_101] + PartitionCols:_col1 + Map Join Operator [MAPJOIN_157] (rows=27 width=7) + HybridGraceHashJoin:true,Output:["_col0","_col1","_col6"],keys:{"FIL_153":"key","RS_98":"key"} + <-Map 34 [BROADCAST_EDGE] + BROADCAST [RS_98] + PartitionCols:key + Filter Operator [FIL_154] (rows=25 width=7) + predicate:key is not null + TableScan [TS_94] (rows=25 width=7) + default@src1,y,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Filter Operator [FIL_153] (rows=25 width=7) + predicate:(key is not null and value is not null) + TableScan [TS_93] (rows=25 width=7) + default@src1,x,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Select Operator [SEL_92] (rows=440 width=10) + Output:["_col1"] + Group By Operator [GBY_91] (rows=440 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 28 [SIMPLE_EDGE] + <-Map 32 [CONTAINS] + Reduce Output Operator [RS_90] + PartitionCols:_col0, _col1 + Group By Operator [GBY_89] (rows=881 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_85] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_152] (rows=500 width=10) + predicate:value is not null + TableScan [TS_84] (rows=500 width=10) + Output:["key","value"] + <-Reducer 27 [CONTAINS] + Reduce Output Operator [RS_90] + PartitionCols:_col0, _col1 + Group By Operator [GBY_89] (rows=881 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Group By Operator [GBY_82] (rows=381 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 26 [SIMPLE_EDGE] + <-Map 31 [CONTAINS] + Reduce Output Operator [RS_81] + PartitionCols:_col0, _col1 + Group By Operator [GBY_80] (rows=762 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_76] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_151] (rows=500 width=10) + predicate:value is not null + TableScan [TS_75] (rows=500 width=10) + Output:["key","value"] + <-Reducer 25 [CONTAINS] + Reduce Output Operator [RS_81] + PartitionCols:_col0, _col1 + Group By Operator [GBY_80] (rows=762 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Group By Operator [GBY_73] (rows=262 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 24 [SIMPLE_EDGE] + <-Map 23 [CONTAINS] + Reduce Output Operator [RS_72] + PartitionCols:_col0, _col1 + Group By Operator [GBY_71] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_65] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_149] (rows=25 width=7) + predicate:value is not null + TableScan [TS_64] (rows=25 width=7) + Output:["key","value"] + <-Map 30 [CONTAINS] + Reduce Output Operator [RS_72] + PartitionCols:_col0, _col1 + Group By Operator [GBY_71] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_67] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_150] (rows=500 width=10) + predicate:value is not null + TableScan [TS_66] (rows=500 width=10) + Output:["key","value"] + <-Reducer 6 [CONTAINS] + Reduce Output Operator [RS_110] + PartitionCols:_col0, _col1 + Group By Operator [GBY_109] (rows=1089 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Group By Operator [GBY_62] (rows=605 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 5 [SIMPLE_EDGE] + <-Reducer 17 [CONTAINS] + Reduce Output Operator [RS_61] + PartitionCols:_col0, _col1 + Group By Operator [GBY_60] (rows=1210 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_56] (rows=605 width=10) + Output:["_col0","_col1"] + Merge Join Operator [MERGEJOIN_159] (rows=605 width=10) + Output:["_col0","_col6"],keys:{"0":"_col1","1":"_col1"} + <-Reducer 16 [SIMPLE_EDGE] + SHUFFLE [RS_54] + PartitionCols:_col1 + Select Operator [SEL_43] (rows=381 width=10) + Output:["_col1"] + Group By Operator [GBY_42] (rows=381 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 15 [SIMPLE_EDGE] + <-Map 19 [CONTAINS] + Reduce Output Operator [RS_41] + PartitionCols:_col0, _col1 + Group By Operator [GBY_40] (rows=762 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_36] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_146] (rows=500 width=10) + predicate:value is not null + TableScan [TS_35] (rows=500 width=10) + Output:["key","value"] + <-Reducer 14 [CONTAINS] + Reduce Output Operator [RS_41] + PartitionCols:_col0, _col1 + Group By Operator [GBY_40] (rows=762 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Group By Operator [GBY_33] (rows=262 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 13 [SIMPLE_EDGE] + <-Map 12 [CONTAINS] + Reduce Output Operator [RS_32] + PartitionCols:_col0, _col1 + Group By Operator [GBY_31] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_25] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_144] (rows=25 width=7) + predicate:value is not null + TableScan [TS_24] (rows=25 width=7) + Output:["key","value"] + <-Map 18 [CONTAINS] + Reduce Output Operator [RS_32] + PartitionCols:_col0, _col1 + Group By Operator [GBY_31] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_27] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_145] (rows=500 width=10) + predicate:value is not null + TableScan [TS_26] (rows=500 width=10) + Output:["key","value"] + <-Reducer 21 [SIMPLE_EDGE] + SHUFFLE [RS_52] + PartitionCols:_col1 + Merge Join Operator [MERGEJOIN_156] (rows=550 width=10) + Output:["_col0","_col1","_col6"],keys:{"0":"key","1":"key"} + <-Map 20 [SIMPLE_EDGE] + SHUFFLE [RS_47] + PartitionCols:key + Filter Operator [FIL_147] (rows=500 width=10) + predicate:(key is not null and value is not null) + TableScan [TS_44] (rows=500 width=10) + default@src,x,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map 22 [SIMPLE_EDGE] + SHUFFLE [RS_49] + PartitionCols:key + Filter Operator [FIL_148] (rows=500 width=10) + predicate:key is not null + TableScan [TS_45] (rows=500 width=10) + default@src,y,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Reducer 4 [CONTAINS] + Reduce Output Operator [RS_61] + PartitionCols:_col0, _col1 + Group By Operator [GBY_60] (rows=1210 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_23] (rows=605 width=10) + Output:["_col0","_col1"] + Merge Join Operator [MERGEJOIN_158] (rows=605 width=10) + Output:["_col0","_col6"],keys:{"0":"_col1","1":"_col1"} + <-Map 11 [SIMPLE_EDGE] + SHUFFLE [RS_19] + PartitionCols:_col1 + Map Join Operator [MAPJOIN_155] (rows=550 width=10) + HybridGraceHashJoin:true,Output:["_col0","_col1","_col6"],keys:{"RS_14":"key","FIL_143":"key"} + <-Map 10 [BROADCAST_EDGE] + BROADCAST [RS_14] + PartitionCols:key + Filter Operator [FIL_142] (rows=25 width=7) + predicate:(key is not null and value is not null) + TableScan [TS_11] (rows=25 width=7) + default@src1,x,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Filter Operator [FIL_143] (rows=500 width=10) + predicate:key is not null + TableScan [TS_12] (rows=500 width=10) + default@src,y,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Reducer 3 [SIMPLE_EDGE] + SHUFFLE [RS_21] + PartitionCols:_col1 + Select Operator [SEL_10] (rows=262 width=10) + Output:["_col1"] + Group By Operator [GBY_9] (rows=262 width=10) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 2 [SIMPLE_EDGE] + <-Map 1 [CONTAINS] + Reduce Output Operator [RS_8] + PartitionCols:_col0, _col1 + Group By Operator [GBY_7] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_1] (rows=25 width=7) + Output:["_col0","_col1"] + Filter Operator [FIL_140] (rows=25 width=7) + predicate:value is not null + TableScan [TS_0] (rows=25 width=7) + Output:["key","value"] + <-Map 9 [CONTAINS] + Reduce Output Operator [RS_8] + PartitionCols:_col0, _col1 + Group By Operator [GBY_7] (rows=525 width=10) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_3] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_141] (rows=500 width=10) + predicate:value is not null + TableScan [TS_2] (rows=500 width=10) + Output:["key","value"] + File Output Operator [FS_116] + table:{"name:":"default.b"} + Please refer to the previous Group By Operator [GBY_111] + File Output Operator [FS_118] + table:{"name:":"default.c"} + Please refer to the previous Group By Operator [GBY_111] Stage-6 - Stats-Aggr Operator - Stage-1 - Move Operator - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.b"} - Please refer to the previous Stage-4 + Stats-Aggr Operator + Stage-1 + Move Operator + table:{"name:":"default.b"} + Please refer to the previous Stage-4 Stage-7 - Stats-Aggr Operator - Stage-2 - Move Operator - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.c"} - Please refer to the previous Stage-4 + Stats-Aggr Operator + Stage-2 + Move Operator + table:{"name:":"default.c"} + Please refer to the previous Stage-4 PREHOOK: query: CREATE TABLE DEST1(key STRING, value STRING) STORED AS TEXTFILE PREHOOK: type: CREATETABLE @@ -5067,105 +3922,64 @@ Reducer 4 <- Union 3 (SIMPLE_EDGE) Reducer 5 <- Reducer 4 (SIMPLE_EDGE) Stage-4 - Stats-Aggr Operator - Stage-0 - Move Operator - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.dest1"} - Stage-3 - Dependency Collection{} - Stage-2 - Reducer 5 - File Output Operator [FS_20] - compressed:false - Statistics:Num rows: 1 Data size: 96 Basic stats: COMPLETE Column stats: PARTIAL - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.dest1"} - Group By Operator [GBY_18] - | aggregations:["count(DISTINCT KEY._col1:0._col0)"] - | keys:KEY._col0 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 96 Basic stats: COMPLETE Column stats: PARTIAL - |<-Reducer 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_17] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:++ - Statistics:Num rows: 1 Data size: 280 Basic stats: COMPLETE Column stats: PARTIAL - Group By Operator [GBY_16] - aggregations:["count(DISTINCT substr(_col1, 5))"] - keys:_col0 (type: string), substr(_col1, 5) (type: string) - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 280 Basic stats: COMPLETE Column stats: PARTIAL - Group By Operator [GBY_13] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 272 Basic stats: COMPLETE Column stats: PARTIAL - |<-Union 3 [SIMPLE_EDGE] - |<-Map 6 [CONTAINS] - | Reduce Output Operator [RS_12] - | key expressions:_col0 (type: string), _col1 (type: string), substr(_col1, 5) (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:+++ - | Statistics:Num rows: 1 Data size: 272 Basic stats: COMPLETE Column stats: PARTIAL - | Group By Operator [GBY_11] - | keys:_col0 (type: string), _col1 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 272 Basic stats: COMPLETE Column stats: PARTIAL - | Select Operator [SEL_7] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:s2 - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Reducer 2 [CONTAINS] - Reduce Output Operator [RS_12] - key expressions:_col0 (type: string), _col1 (type: string), substr(_col1, 5) (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:+++ - Statistics:Num rows: 1 Data size: 272 Basic stats: COMPLETE Column stats: PARTIAL - Group By Operator [GBY_11] - keys:_col0 (type: string), _col1 (type: string) - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 272 Basic stats: COMPLETE Column stats: PARTIAL - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 272 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_4] - | aggregations:["count(VALUE._col0)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: bigint) - Group By Operator [GBY_2] - aggregations:["count(1)"] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_1] - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_0] - alias:s1 - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: COMPLETE - File Output Operator [FS_26] - compressed:false - Statistics:Num rows: 1 Data size: 456 Basic stats: COMPLETE Column stats: PARTIAL - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.dest2"} - Select Operator [SEL_25] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 456 Basic stats: COMPLETE Column stats: PARTIAL - Group By Operator [GBY_24] - aggregations:["count(DISTINCT substr(_col1, 5))"] - keys:_col0 (type: string), _col1 (type: string) - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 464 Basic stats: COMPLETE Column stats: PARTIAL - Please refer to the previous Group By Operator [GBY_13] + Stats-Aggr Operator + Stage-0 + Move Operator + table:{"name:":"default.dest1"} + Stage-3 + Dependency Collection{} + Stage-2 + Reducer 5 + File Output Operator [FS_20] + table:{"name:":"default.dest1"} + Group By Operator [GBY_18] (rows=1 width=96) + Output:["_col0","_col1"],aggregations:["count(DISTINCT KEY._col1:0._col0)"],keys:KEY._col0 + <-Reducer 4 [SIMPLE_EDGE] + SHUFFLE [RS_17] + PartitionCols:_col0 + Group By Operator [GBY_16] (rows=1 width=280) + Output:["_col0","_col1","_col2"],aggregations:["count(DISTINCT substr(_col1, 5))"],keys:_col0, substr(_col1, 5) + Group By Operator [GBY_13] (rows=1 width=272) + Output:["_col0","_col1"],keys:KEY._col0, KEY._col1 + <-Union 3 [SIMPLE_EDGE] + <-Map 6 [CONTAINS] + Reduce Output Operator [RS_12] + PartitionCols:_col0, _col1 + Group By Operator [GBY_11] (rows=1 width=272) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_7] (rows=500 width=10) + Output:["_col0","_col1"] + TableScan [TS_6] (rows=500 width=10) + Output:["key","value"] + <-Reducer 2 [CONTAINS] + Reduce Output Operator [RS_12] + PartitionCols:_col0, _col1 + Group By Operator [GBY_11] (rows=1 width=272) + Output:["_col0","_col1"],keys:_col0, _col1 + Select Operator [SEL_5] (rows=1 width=272) + Output:["_col0","_col1"] + Group By Operator [GBY_4] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_3] + Group By Operator [GBY_2] (rows=1 width=8) + Output:["_col0"],aggregations:["count(1)"] + Select Operator [SEL_1] (rows=500 width=10) + TableScan [TS_0] (rows=500 width=10) + default@src,s1,Tbl:COMPLETE,Col:COMPLETE + File Output Operator [FS_26] + table:{"name:":"default.dest2"} + Select Operator [SEL_25] (rows=1 width=456) + Output:["_col0","_col1","_col2"] + Group By Operator [GBY_24] (rows=1 width=464) + Output:["_col0","_col1","_col2"],aggregations:["count(DISTINCT substr(_col1, 5))"],keys:_col0, _col1 + Please refer to the previous Group By Operator [GBY_13] Stage-5 - Stats-Aggr Operator - Stage-1 - Move Operator - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.dest2"} - Please refer to the previous Stage-3 + Stats-Aggr Operator + Stage-1 + Move Operator + table:{"name:":"default.dest2"} + Please refer to the previous Stage-3 PREHOOK: query: EXPLAIN FROM UNIQUEJOIN PRESERVE src a (a.key), PRESERVE src1 b (b.key), PRESERVE srcpart c (c.key) SELECT a.key, b.key, c.key PREHOOK: type: QUERY @@ -5177,49 +3991,30 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE), Map 4 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_8] - compressed:false - Statistics:Num rows: 4400 Data size: 46745 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_7] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 4400 Data size: 46745 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_9] - | condition map:[{"":"Unique Join0 to 0"},{"":"Unique Join0 to 0"},{"":"Unique Join0 to 0"}] - | keys:{"0":"key (type: string)","1":"key (type: string)","2":"key (type: string)"} - | outputColumnNames:["_col0","_col5","_col10"] - | Statistics:Num rows: 4400 Data size: 46745 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_3] - | key expressions:key (type: string) - | Map-reduce partition columns:key (type: string) - | sort order:+ - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:a - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Map 3 [SIMPLE_EDGE] - | Reduce Output Operator [RS_4] - | key expressions:key (type: string) - | Map-reduce partition columns:key (type: string) - | sort order:+ - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_1] - | alias:b - | Statistics:Num rows: 25 Data size: 191 Basic stats: COMPLETE Column stats: NONE - |<-Map 4 [SIMPLE_EDGE] - Reduce Output Operator [RS_5] - key expressions:key (type: string) - Map-reduce partition columns:key (type: string) - sort order:+ - Statistics:Num rows: 2000 Data size: 21248 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_2] - alias:c - Statistics:Num rows: 2000 Data size: 21248 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_8] + Select Operator [SEL_7] (rows=4400 width=10) + Output:["_col0","_col1","_col2"] + Merge Join Operator [MERGEJOIN_9] (rows=4400 width=10) + Output:["_col0","_col5","_col10"],keys:{"0":"key","1":"key","2":"key"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_3] + PartitionCols:key + TableScan [TS_0] (rows=500 width=10) + default@src,a,Tbl:COMPLETE,Col:NONE,Output:["key"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_4] + PartitionCols:key + TableScan [TS_1] (rows=25 width=7) + default@src1,b,Tbl:COMPLETE,Col:NONE,Output:["key"] + <-Map 4 [SIMPLE_EDGE] + SHUFFLE [RS_5] + PartitionCols:key + TableScan [TS_2] (rows=2000 width=10) + default@srcpart,c,Tbl:COMPLETE,Col:NONE,Output:["key"] PREHOOK: query: EXPLAIN SELECT @@ -5239,48 +4034,29 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 3 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 - File Output Operator [FS_9] - compressed:false - Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Transform Operator [SCR_8] - command:cat - output info:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - Merge Join Operator [MERGEJOIN_14] - | condition map:[{"":"Inner Join 0 to 1"}] - | keys:{"0":"key (type: string)","1":"key (type: string)"} - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - | Reduce Output Operator [RS_3] - | key expressions:key (type: string) - | Map-reduce partition columns:key (type: string) - | sort order:+ - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | value expressions:value (type: string) - | Filter Operator [FIL_12] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:a - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Map 3 [SIMPLE_EDGE] - Reduce Output Operator [RS_5] - key expressions:key (type: string) - Map-reduce partition columns:key (type: string) - sort order:+ - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_13] - predicate:key is not null (type: boolean) - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_1] - alias:b - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 + File Output Operator [FS_9] + Transform Operator [SCR_8] (rows=550 width=10) + command:cat + Merge Join Operator [MERGEJOIN_14] (rows=550 width=10) + Output:["_col0","_col1"],keys:{"0":"key","1":"key"} + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_3] + PartitionCols:key + Filter Operator [FIL_12] (rows=500 width=10) + predicate:key is not null + TableScan [TS_0] (rows=500 width=10) + default@src,a,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Map 3 [SIMPLE_EDGE] + SHUFFLE [RS_5] + PartitionCols:key + Filter Operator [FIL_13] (rows=500 width=10) + predicate:key is not null + TableScan [TS_1] (rows=500 width=10) + default@src,b,Tbl:COMPLETE,Col:NONE,Output:["key"] PREHOOK: query: explain FROM ( @@ -5318,146 +4094,84 @@ Reducer 4 <- Union 3 (SIMPLE_EDGE) Reducer 5 <- Union 3 (SIMPLE_EDGE) Stage-4 - Stats-Aggr Operator - Stage-0 - Move Operator - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.dest1"} - Stage-3 - Dependency Collection{} - Stage-2 - Reducer 4 - File Output Operator [FS_18] - compressed:false - Statistics:Num rows: 1 Data size: 96 Basic stats: COMPLETE Column stats: PARTIAL - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.dest1"} - Group By Operator [GBY_16] - | aggregations:["count(DISTINCT KEY._col1:0._col0)"] - | keys:KEY._col0 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 96 Basic stats: COMPLETE Column stats: PARTIAL - |<-Union 3 [SIMPLE_EDGE] - |<-Map 6 [CONTAINS] - | Reduce Output Operator [RS_15] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:++ - | Statistics:Num rows: 1 Data size: 280 Basic stats: COMPLETE Column stats: PARTIAL - | Group By Operator [GBY_14] - | aggregations:["count(DISTINCT substr(_col1, 5))"] - | keys:_col0 (type: string), substr(_col1, 5) (type: string) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 280 Basic stats: COMPLETE Column stats: PARTIAL - | Select Operator [SEL_9] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 501 Data size: 136272 Basic stats: COMPLETE Column stats: PARTIAL - | Select Operator [SEL_7] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:s2 - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Reduce Output Operator [RS_21] - | key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:+++ - | Statistics:Num rows: 1 Data size: 464 Basic stats: COMPLETE Column stats: PARTIAL - | Group By Operator [GBY_20] - | aggregations:["count(DISTINCT substr(_col1, 5))"] - | keys:_col0 (type: string), _col1 (type: string), substr(_col1, 5) (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 464 Basic stats: COMPLETE Column stats: PARTIAL - | Please refer to the previous Select Operator [SEL_9] - |<-Map 7 [CONTAINS] - | Reduce Output Operator [RS_15] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:++ - | Statistics:Num rows: 1 Data size: 280 Basic stats: COMPLETE Column stats: PARTIAL - | Group By Operator [GBY_14] - | aggregations:["count(DISTINCT substr(_col1, 5))"] - | keys:_col0 (type: string), substr(_col1, 5) (type: string) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 280 Basic stats: COMPLETE Column stats: PARTIAL - | Select Operator [SEL_11] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_10] - | alias:s0 - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Reduce Output Operator [RS_21] - | key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:+++ - | Statistics:Num rows: 1 Data size: 464 Basic stats: COMPLETE Column stats: PARTIAL - | Group By Operator [GBY_20] - | aggregations:["count(DISTINCT substr(_col1, 5))"] - | keys:_col0 (type: string), _col1 (type: string), substr(_col1, 5) (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 464 Basic stats: COMPLETE Column stats: PARTIAL - | Please refer to the previous Select Operator [SEL_11] - |<-Reducer 2 [CONTAINS] - Reduce Output Operator [RS_15] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:++ - Statistics:Num rows: 1 Data size: 280 Basic stats: COMPLETE Column stats: PARTIAL - Group By Operator [GBY_14] - aggregations:["count(DISTINCT substr(_col1, 5))"] - keys:_col0 (type: string), substr(_col1, 5) (type: string) - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 280 Basic stats: COMPLETE Column stats: PARTIAL - Select Operator [SEL_9] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 501 Data size: 136272 Basic stats: COMPLETE Column stats: PARTIAL - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 360 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_4] - | aggregations:["count(VALUE._col0)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: bigint) - Group By Operator [GBY_2] - aggregations:["count(1)"] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_1] - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_0] - alias:s1 - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator [RS_21] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:+++ - Statistics:Num rows: 1 Data size: 464 Basic stats: COMPLETE Column stats: PARTIAL - Group By Operator [GBY_20] - aggregations:["count(DISTINCT substr(_col1, 5))"] - keys:_col0 (type: string), _col1 (type: string), substr(_col1, 5) (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 1 Data size: 464 Basic stats: COMPLETE Column stats: PARTIAL - Please refer to the previous Select Operator [SEL_9] - Reducer 5 - File Output Operator [FS_24] - compressed:false - Statistics:Num rows: 1 Data size: 280 Basic stats: COMPLETE Column stats: PARTIAL - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.dest2"} - Group By Operator [GBY_22] - | aggregations:["count(DISTINCT KEY._col2:0._col0)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 280 Basic stats: COMPLETE Column stats: PARTIAL - |<- Please refer to the previous Union 3 [SIMPLE_EDGE] + Stats-Aggr Operator + Stage-0 + Move Operator + table:{"name:":"default.dest1"} + Stage-3 + Dependency Collection{} + Stage-2 + Reducer 4 + File Output Operator [FS_18] + table:{"name:":"default.dest1"} + Group By Operator [GBY_16] (rows=1 width=96) + Output:["_col0","_col1"],aggregations:["count(DISTINCT KEY._col1:0._col0)"],keys:KEY._col0 + <-Union 3 [SIMPLE_EDGE] + <-Map 6 [CONTAINS] + Reduce Output Operator [RS_15] + PartitionCols:_col0 + Group By Operator [GBY_14] (rows=1 width=280) + Output:["_col0","_col1","_col2"],aggregations:["count(DISTINCT substr(_col1, 5))"],keys:_col0, substr(_col1, 5) + Select Operator [SEL_9] (rows=501 width=272) + Output:["_col0","_col1"] + Select Operator [SEL_7] (rows=500 width=10) + Output:["_col0","_col1"] + TableScan [TS_6] (rows=500 width=10) + Output:["key","value"] + Reduce Output Operator [RS_21] + PartitionCols:_col0, _col1 + Group By Operator [GBY_20] (rows=1 width=464) + Output:["_col0","_col1","_col2","_col3"],aggregations:["count(DISTINCT substr(_col1, 5))"],keys:_col0, _col1, substr(_col1, 5) + Please refer to the previous Select Operator [SEL_9] + <-Map 7 [CONTAINS] + Reduce Output Operator [RS_15] + PartitionCols:_col0 + Group By Operator [GBY_14] (rows=1 width=280) + Output:["_col0","_col1","_col2"],aggregations:["count(DISTINCT substr(_col1, 5))"],keys:_col0, substr(_col1, 5) + Select Operator [SEL_11] (rows=500 width=10) + Output:["_col0","_col1"] + TableScan [TS_10] (rows=500 width=10) + Output:["key","value"] + Reduce Output Operator [RS_21] + PartitionCols:_col0, _col1 + Group By Operator [GBY_20] (rows=1 width=464) + Output:["_col0","_col1","_col2","_col3"],aggregations:["count(DISTINCT substr(_col1, 5))"],keys:_col0, _col1, substr(_col1, 5) + Please refer to the previous Select Operator [SEL_11] + <-Reducer 2 [CONTAINS] + Reduce Output Operator [RS_15] + PartitionCols:_col0 + Group By Operator [GBY_14] (rows=1 width=280) + Output:["_col0","_col1","_col2"],aggregations:["count(DISTINCT substr(_col1, 5))"],keys:_col0, substr(_col1, 5) + Select Operator [SEL_9] (rows=501 width=272) + Output:["_col0","_col1"] + Select Operator [SEL_5] (rows=1 width=360) + Output:["_col0","_col1"] + Group By Operator [GBY_4] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_3] + Group By Operator [GBY_2] (rows=1 width=8) + Output:["_col0"],aggregations:["count(1)"] + Select Operator [SEL_1] (rows=500 width=10) + TableScan [TS_0] (rows=500 width=10) + default@src,s1,Tbl:COMPLETE,Col:COMPLETE + Reduce Output Operator [RS_21] + PartitionCols:_col0, _col1 + Group By Operator [GBY_20] (rows=1 width=464) + Output:["_col0","_col1","_col2","_col3"],aggregations:["count(DISTINCT substr(_col1, 5))"],keys:_col0, _col1, substr(_col1, 5) + Please refer to the previous Select Operator [SEL_9] + Reducer 5 + File Output Operator [FS_24] + table:{"name:":"default.dest2"} + Group By Operator [GBY_22] (rows=1 width=280) + Output:["_col0","_col1","_col2"],aggregations:["count(DISTINCT KEY._col2:0._col0)"],keys:KEY._col0, KEY._col1 + <- Please refer to the previous Union 3 [SIMPLE_EDGE] Stage-5 - Stats-Aggr Operator - Stage-1 - Move Operator - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.dest2"} - Please refer to the previous Stage-3 + Stats-Aggr Operator + Stage-1 + Move Operator + table:{"name:":"default.dest2"} + Please refer to the previous Stage-3 PREHOOK: query: explain FROM ( @@ -5488,122 +4202,72 @@ Reducer 4 <- Union 3 (SIMPLE_EDGE) Reducer 5 <- Union 3 (SIMPLE_EDGE) Stage-4 - Stats-Aggr Operator - Stage-0 - Move Operator - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.dest1"} - Stage-3 - Dependency Collection{} - Stage-2 - Reducer 4 - File Output Operator [FS_14] - compressed:false - Statistics:Num rows: 1 Data size: 96 Basic stats: COMPLETE Column stats: PARTIAL - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.dest1"} - Group By Operator [GBY_12] - | aggregations:["count(DISTINCT KEY._col1:0._col0)"] - | keys:KEY._col0 (type: string) - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 96 Basic stats: COMPLETE Column stats: PARTIAL - |<-Union 3 [SIMPLE_EDGE] - |<-Map 6 [CONTAINS] - | Reduce Output Operator [RS_11] - | key expressions:_col0 (type: string), _col1 (type: string) - | Map-reduce partition columns:_col0 (type: string) - | sort order:++ - | Statistics:Num rows: 1 Data size: 280 Basic stats: COMPLETE Column stats: PARTIAL - | Group By Operator [GBY_10] - | aggregations:["count(DISTINCT substr(_col1, 5))"] - | keys:_col0 (type: string), substr(_col1, 5) (type: string) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 280 Basic stats: COMPLETE Column stats: PARTIAL - | Select Operator [SEL_9] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 501 Data size: 5672 Basic stats: COMPLETE Column stats: PARTIAL - | Select Operator [SEL_7] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_6] - | alias:s2 - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - | Reduce Output Operator [RS_17] - | key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string) - | Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - | sort order:+++ - | Statistics:Num rows: 1 Data size: 464 Basic stats: COMPLETE Column stats: PARTIAL - | Group By Operator [GBY_16] - | aggregations:["count(DISTINCT substr(_col1, 5))"] - | keys:_col0 (type: string), _col1 (type: string), substr(_col1, 5) (type: string) - | outputColumnNames:["_col0","_col1","_col2","_col3"] - | Statistics:Num rows: 1 Data size: 464 Basic stats: COMPLETE Column stats: PARTIAL - | Select Operator [SEL_15] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 501 Data size: 5672 Basic stats: COMPLETE Column stats: PARTIAL - | Please refer to the previous Select Operator [SEL_7] - |<-Reducer 2 [CONTAINS] - Reduce Output Operator [RS_11] - key expressions:_col0 (type: string), _col1 (type: string) - Map-reduce partition columns:_col0 (type: string) - sort order:++ - Statistics:Num rows: 1 Data size: 280 Basic stats: COMPLETE Column stats: PARTIAL - Group By Operator [GBY_10] - aggregations:["count(DISTINCT substr(_col1, 5))"] - keys:_col0 (type: string), substr(_col1, 5) (type: string) - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 1 Data size: 280 Basic stats: COMPLETE Column stats: PARTIAL - Select Operator [SEL_9] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 501 Data size: 5672 Basic stats: COMPLETE Column stats: PARTIAL - Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 360 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator [GBY_4] - | aggregations:["count(VALUE._col0)"] - | outputColumnNames:["_col0"] - | Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - sort order: - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - value expressions:_col0 (type: bigint) - Group By Operator [GBY_2] - aggregations:["count(1)"] - outputColumnNames:["_col0"] - Statistics:Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator [SEL_1] - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: COMPLETE - TableScan [TS_0] - alias:s1 - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator [RS_17] - key expressions:_col0 (type: string), _col1 (type: string), _col2 (type: string) - Map-reduce partition columns:_col0 (type: string), _col1 (type: string) - sort order:+++ - Statistics:Num rows: 1 Data size: 464 Basic stats: COMPLETE Column stats: PARTIAL - Group By Operator [GBY_16] - aggregations:["count(DISTINCT substr(_col1, 5))"] - keys:_col0 (type: string), _col1 (type: string), substr(_col1, 5) (type: string) - outputColumnNames:["_col0","_col1","_col2","_col3"] - Statistics:Num rows: 1 Data size: 464 Basic stats: COMPLETE Column stats: PARTIAL - Select Operator [SEL_15] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 501 Data size: 5672 Basic stats: COMPLETE Column stats: PARTIAL - Please refer to the previous Select Operator [SEL_5] - Reducer 5 - File Output Operator [FS_20] - compressed:false - Statistics:Num rows: 1 Data size: 280 Basic stats: COMPLETE Column stats: PARTIAL - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.dest2"} - Group By Operator [GBY_18] - | aggregations:["count(DISTINCT KEY._col2:0._col0)"] - | keys:KEY._col0 (type: string), KEY._col1 (type: string) - | outputColumnNames:["_col0","_col1","_col2"] - | Statistics:Num rows: 1 Data size: 280 Basic stats: COMPLETE Column stats: PARTIAL - |<- Please refer to the previous Union 3 [SIMPLE_EDGE] + Stats-Aggr Operator + Stage-0 + Move Operator + table:{"name:":"default.dest1"} + Stage-3 + Dependency Collection{} + Stage-2 + Reducer 4 + File Output Operator [FS_14] + table:{"name:":"default.dest1"} + Group By Operator [GBY_12] (rows=1 width=96) + Output:["_col0","_col1"],aggregations:["count(DISTINCT KEY._col1:0._col0)"],keys:KEY._col0 + <-Union 3 [SIMPLE_EDGE] + <-Map 6 [CONTAINS] + Reduce Output Operator [RS_11] + PartitionCols:_col0 + Group By Operator [GBY_10] (rows=1 width=280) + Output:["_col0","_col1","_col2"],aggregations:["count(DISTINCT substr(_col1, 5))"],keys:_col0, substr(_col1, 5) + Select Operator [SEL_9] (rows=501 width=11) + Output:["_col0","_col1"] + Select Operator [SEL_7] (rows=500 width=10) + Output:["_col0","_col1"] + TableScan [TS_6] (rows=500 width=10) + Output:["key","value"] + Reduce Output Operator [RS_17] + PartitionCols:_col0, _col1 + Group By Operator [GBY_16] (rows=1 width=464) + Output:["_col0","_col1","_col2","_col3"],aggregations:["count(DISTINCT substr(_col1, 5))"],keys:_col0, _col1, substr(_col1, 5) + Select Operator [SEL_15] (rows=501 width=11) + Output:["_col0","_col1"] + Please refer to the previous Select Operator [SEL_7] + <-Reducer 2 [CONTAINS] + Reduce Output Operator [RS_11] + PartitionCols:_col0 + Group By Operator [GBY_10] (rows=1 width=280) + Output:["_col0","_col1","_col2"],aggregations:["count(DISTINCT substr(_col1, 5))"],keys:_col0, substr(_col1, 5) + Select Operator [SEL_9] (rows=501 width=11) + Output:["_col0","_col1"] + Select Operator [SEL_5] (rows=1 width=360) + Output:["_col0","_col1"] + Group By Operator [GBY_4] (rows=1 width=8) + Output:["_col0"],aggregations:["count(VALUE._col0)"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_3] + Group By Operator [GBY_2] (rows=1 width=8) + Output:["_col0"],aggregations:["count(1)"] + Select Operator [SEL_1] (rows=500 width=10) + TableScan [TS_0] (rows=500 width=10) + default@src,s1,Tbl:COMPLETE,Col:COMPLETE + Reduce Output Operator [RS_17] + PartitionCols:_col0, _col1 + Group By Operator [GBY_16] (rows=1 width=464) + Output:["_col0","_col1","_col2","_col3"],aggregations:["count(DISTINCT substr(_col1, 5))"],keys:_col0, _col1, substr(_col1, 5) + Select Operator [SEL_15] (rows=501 width=11) + Output:["_col0","_col1"] + Please refer to the previous Select Operator [SEL_5] + Reducer 5 + File Output Operator [FS_20] + table:{"name:":"default.dest2"} + Group By Operator [GBY_18] (rows=1 width=280) + Output:["_col0","_col1","_col2"],aggregations:["count(DISTINCT KEY._col2:0._col0)"],keys:KEY._col0, KEY._col1 + <- Please refer to the previous Union 3 [SIMPLE_EDGE] Stage-5 - Stats-Aggr Operator - Stage-1 - Move Operator - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.dest2"} - Please refer to the previous Stage-3 + Stats-Aggr Operator + Stage-1 + Move Operator + table:{"name:":"default.dest2"} + Please refer to the previous Stage-3 diff --git a/ql/src/test/results/clientpositive/tez/explainuser_3.q.out b/ql/src/test/results/clientpositive/tez/explainuser_3.q.out index e2db163..aef1464 100644 --- a/ql/src/test/results/clientpositive/tez/explainuser_3.q.out +++ b/ql/src/test/results/clientpositive/tez/explainuser_3.q.out @@ -26,29 +26,19 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Reducer 2 vectorized - File Output Operator [FS_8] - compressed:false - Statistics:Num rows: 10 Data size: 1704 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [OP_7] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 10 Data size: 1704 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] vectorized - Reduce Output Operator [RS_6] - key expressions:_col0 (type: int), _col1 (type: string) - sort order:++ - Statistics:Num rows: 10 Data size: 1704 Basic stats: COMPLETE Column stats: NONE - Select Operator [OP_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 10 Data size: 1704 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_0] - ACID table:true - alias:acid_vectorized - Statistics:Num rows: 10 Data size: 1704 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Reducer 2 vectorized + File Output Operator [FS_8] + Select Operator [OP_7] (rows=10 width=170) + Output:["_col0","_col1"] + <-Map 1 [SIMPLE_EDGE] vectorized + SHUFFLE [RS_6] + Select Operator [OP_5] (rows=10 width=170) + Output:["_col0","_col1"] + TableScan [TS_0] (rows=10 width=170) + default@acid_vectorized,acid_vectorized, ACID table,Tbl:COMPLETE,Col:NONE,Output:["a","b"] PREHOOK: query: explain select key, value FROM srcpart LATERAL VIEW explode(array(1,2,3)) myTable AS myCol @@ -59,56 +49,41 @@ POSTHOOK: type: QUERY Plan not optimized by CBO. Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Map 1 - File Output Operator [FS_7] - compressed:false - Statistics:Num rows: 4000 Data size: 42496 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_6] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 4000 Data size: 42496 Basic stats: COMPLETE Column stats: NONE - Lateral View Join Operator [LVJ_5] - outputColumnNames:["_col0","_col1","_col7"] - Statistics:Num rows: 4000 Data size: 42496 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_2] - outputColumnNames:["key","value"] - Statistics:Num rows: 2000 Data size: 21248 Basic stats: COMPLETE Column stats: NONE - Lateral View Forward [LVF_1] - Statistics:Num rows: 2000 Data size: 21248 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_0] - alias:srcpart - Statistics:Num rows: 2000 Data size: 21248 Basic stats: COMPLETE Column stats: NONE - File Output Operator [FS_7] - compressed:false - Statistics:Num rows: 4000 Data size: 42496 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_6] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 4000 Data size: 42496 Basic stats: COMPLETE Column stats: NONE - Lateral View Join Operator [LVJ_5] - outputColumnNames:["_col0","_col1","_col7"] - Statistics:Num rows: 4000 Data size: 42496 Basic stats: COMPLETE Column stats: NONE - UDTF Operator [UDTF_4] - function name:explode - Statistics:Num rows: 2000 Data size: 21248 Basic stats: COMPLETE Column stats: NONE - Select Operator [SEL_3] - outputColumnNames:["_col0"] - Statistics:Num rows: 2000 Data size: 21248 Basic stats: COMPLETE Column stats: NONE - Please refer to the previous Lateral View Forward [LVF_1] + Fetch Operator + limit:-1 + Stage-1 + Map 1 + File Output Operator [FS_7] + Select Operator [SEL_6] (rows=4000 width=10) + Output:["_col0","_col1"] + Lateral View Join Operator [LVJ_5] (rows=4000 width=10) + Output:["_col0","_col1","_col7"] + Select Operator [SEL_2] (rows=2000 width=10) + Output:["key","value"] + Lateral View Forward [LVF_1] (rows=2000 width=10) + TableScan [TS_0] (rows=2000 width=10) + default@srcpart,srcpart,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + File Output Operator [FS_7] + Select Operator [SEL_6] (rows=4000 width=10) + Output:["_col0","_col1"] + Lateral View Join Operator [LVJ_5] (rows=4000 width=10) + Output:["_col0","_col1","_col7"] + UDTF Operator [UDTF_4] (rows=2000 width=10) + function name:explode + Select Operator [SEL_3] (rows=2000 width=10) + Output:["_col0"] + Please refer to the previous Lateral View Forward [LVF_1] PREHOOK: query: explain show tables PREHOOK: type: SHOWTABLES POSTHOOK: query: explain show tables POSTHOOK: type: SHOWTABLES Stage-1 - Fetch Operator - limit:-1 - Stage-0 - Show Table Operator: - database name:default + Fetch Operator + limit:-1 + Stage-0 + Show Table Operator: + database name:default #### A masked pattern was here #### PREHOOK: type: CREATEDATABASE @@ -128,9 +103,9 @@ PREHOOK: type: DESCDATABASE POSTHOOK: query: explain describe database extended newDB POSTHOOK: type: DESCDATABASE Stage-1 - Fetch Operator - limit:-1 - Stage-0 + Fetch Operator + limit:-1 + Stage-0 PREHOOK: query: describe database extended newDB PREHOOK: type: DESCDATABASE @@ -164,18 +139,16 @@ PREHOOK: type: ALTERTABLE_RENAME POSTHOOK: query: explain alter table tab rename to newName POSTHOOK: type: ALTERTABLE_RENAME Stage-0 - Alter Table Operator: - new name:newDB.newName - old name:newDB.tab - type:rename + Alter Table Operator: + new name:newDB.newName,old name:newDB.tab,type:rename PREHOOK: query: explain drop table tab PREHOOK: type: DROPTABLE POSTHOOK: query: explain drop table tab POSTHOOK: type: DROPTABLE Stage-0 - Drop Table Operator: - table:tab + Drop Table Operator: + table:tab PREHOOK: query: drop table tab PREHOOK: type: DROPTABLE @@ -210,12 +183,11 @@ PREHOOK: type: QUERY POSTHOOK: query: explain analyze table src compute statistics POSTHOOK: type: QUERY Stage-2 - Stats-Aggr Operator - Stage-0 - Map 1 - TableScan [TS_0] - alias:src - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: COMPLETE + Stats-Aggr Operator + Stage-0 + Map 1 + TableScan [TS_0] (rows=500 width=10) + default@src,src,Tbl:COMPLETE,Col:COMPLETE PREHOOK: query: explain analyze table src compute statistics for columns PREHOOK: type: QUERY @@ -225,32 +197,20 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE) Stage-2 - Column Stats Work{} - Stage-0 - Reducer 2 - File Output Operator [FS_6] - compressed:false - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Group By Operator [GBY_4] - | aggregations:["compute_stats(VALUE._col0)","compute_stats(VALUE._col1)"] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_3] - sort order: - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - value expressions:_col0 (type: struct), _col1 (type: struct) - Group By Operator [GBY_2] - aggregations:["compute_stats(key, 16)","compute_stats(value, 16)"] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 1 Data size: 0 Basic stats: PARTIAL Column stats: NONE - Select Operator [SEL_1] - outputColumnNames:["key","value"] - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_0] - alias:src - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Column Stats Work{} + Stage-0 + Reducer 2 + File Output Operator [FS_6] + Group By Operator [GBY_4] (rows=1 width=0) + Output:["_col0","_col1"],aggregations:["compute_stats(VALUE._col0)","compute_stats(VALUE._col1)"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_3] + Group By Operator [GBY_2] (rows=1 width=0) + Output:["_col0","_col1"],aggregations:["compute_stats(key, 16)","compute_stats(value, 16)"] + Select Operator [SEL_1] (rows=500 width=10) + Output:["key","value"] + TableScan [TS_0] (rows=500 width=10) + default@src,src,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: explain CREATE TEMPORARY MACRO SIGMOID (x DOUBLE) 1.0 / (1.0 + EXP(-x)) @@ -273,14 +233,13 @@ POSTHOOK: type: QUERY Plan optimized by CBO. Stage-0 - Fetch Operator - limit:1 - Limit [LIM_2] - Number of rows:1 - Select Operator [SEL_1] - outputColumnNames:["_col0"] - TableScan [TS_0] - alias:src + Fetch Operator + limit:1 + Limit [LIM_2] + Number of rows:1 + Select Operator [SEL_1] + Output:["_col0"] + TableScan [TS_0] PREHOOK: query: explain DROP TEMPORARY MACRO SIGMOID PREHOOK: type: DROPMACRO @@ -301,30 +260,23 @@ POSTHOOK: type: CREATETABLE_AS_SELECT Plan optimized by CBO. Stage-3 - Stats-Aggr Operator - Stage-4 - Create Table Operator: - columns:["key string","value string"] - input format:org.apache.hadoop.mapred.TextInputFormat - name:default.src_autho_test - output format:org.apache.hadoop.hive.ql.io.IgnoreKeyTextOutputFormat - Stage-2 - Dependency Collection{} - Stage-1 - Map 1 - File Output Operator [FS_2] - compressed:false - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe","name:":"default.src_autho_test"} - Select Operator [SEL_1] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_0] - alias:src - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - Stage-0 - Move Operator - Please refer to the previous Stage-1 + Stats-Aggr Operator + Stage-4 + Create Table Operator: + name:default.src_autho_test + Stage-2 + Dependency Collection{} + Stage-1 + Map 1 + File Output Operator [FS_2] + table:{"name:":"default.src_autho_test"} + Select Operator [SEL_1] (rows=500 width=10) + Output:["_col0","_col1"] + TableScan [TS_0] (rows=500 width=10) + default@src,src,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + Stage-0 + Move Operator + Please refer to the previous Stage-1 PREHOOK: query: create table src_autho_test as select * from src PREHOOK: type: CREATETABLE_AS_SELECT @@ -353,18 +305,18 @@ PREHOOK: type: SHOW_GRANT POSTHOOK: query: explain show grant user hive_test_user on table src_autho_test POSTHOOK: type: SHOW_GRANT Stage-1 - Fetch Operator - limit:-1 - Stage-0 + Fetch Operator + limit:-1 + Stage-0 PREHOOK: query: explain show grant user hive_test_user on table src_autho_test(key) PREHOOK: type: SHOW_GRANT POSTHOOK: query: explain show grant user hive_test_user on table src_autho_test(key) POSTHOOK: type: SHOW_GRANT Stage-1 - Fetch Operator - limit:-1 - Stage-0 + Fetch Operator + limit:-1 + Stage-0 PREHOOK: query: select key from src_autho_test order by key limit 20 PREHOOK: type: QUERY @@ -441,9 +393,9 @@ PREHOOK: type: SHOW_ROLE_GRANT POSTHOOK: query: explain show role grant user hive_test_user POSTHOOK: type: SHOW_ROLE_GRANT Stage-1 - Fetch Operator - limit:-1 - Stage-0 + Fetch Operator + limit:-1 + Stage-0 PREHOOK: query: explain drop role sRc_roLE PREHOOK: type: DROPROLE @@ -468,8 +420,8 @@ PREHOOK: type: DROPVIEW POSTHOOK: query: explain drop view v POSTHOOK: type: DROPVIEW Stage-0 - Drop Table Operator: - table:v + Drop Table Operator: + table:v PREHOOK: query: explain create view v as with cte as (select * from src order by key limit 5) select * from cte @@ -480,9 +432,8 @@ POSTHOOK: type: CREATEVIEW Plan not optimized by CBO. Stage-0 - Create View Operator: - name:default.v - original text:with cte as (select * from src order by key limit 5) + Create View Operator: + name:default.v,original text:with cte as (select * from src order by key limit 5) select * from cte PREHOOK: query: explain with cte as (select * from src order by key limit 5) @@ -497,32 +448,21 @@ Vertex dependency in root stage Reducer 2 <- Map 1 (SIMPLE_EDGE) Stage-0 - Fetch Operator - limit:5 - Stage-1 - Reducer 2 vectorized - File Output Operator [FS_8] - compressed:false - Statistics:Num rows: 5 Data size: 50 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Limit [LIM_7] - Number of rows:5 - Statistics:Num rows: 5 Data size: 50 Basic stats: COMPLETE Column stats: NONE - Select Operator [OP_6] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [SIMPLE_EDGE] - Reduce Output Operator [RS_2] - key expressions:_col0 (type: string) - sort order:+ - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - value expressions:_col1 (type: string) - Select Operator [SEL_1] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_0] - alias:src - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:5 + Stage-1 + Reducer 2 vectorized + File Output Operator [FS_8] + Limit [LIM_7] (rows=5 width=10) + Number of rows:5 + Select Operator [OP_6] (rows=500 width=10) + Output:["_col0","_col1"] + <-Map 1 [SIMPLE_EDGE] + SHUFFLE [RS_2] + Select Operator [SEL_1] (rows=500 width=10) + Output:["_col0","_col1"] + TableScan [TS_0] (rows=500 width=10) + default@src,src,Tbl:COMPLETE,Col:NONE,Output:["key","value"] PREHOOK: query: create table orc_merge5 (userid bigint, string1 string, subtype double, decimal1 decimal, ts timestamp) stored as orc PREHOOK: type: CREATETABLE @@ -547,41 +487,36 @@ POSTHOOK: type: QUERY Plan optimized by CBO. Stage-3 - Stats-Aggr Operator - Stage-0 - Move Operator - table:{"input format:":"org.apache.hadoop.hive.ql.io.orc.OrcInputFormat","output format:":"org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat","serde:":"org.apache.hadoop.hive.ql.io.orc.OrcSerde","name:":"default.orc_merge5"} - Stage-2 - Dependency Collection{} - Stage-5(CONDITIONAL) - Move Operator - Stage-8(CONDITIONAL CHILD TASKS: Stage-5, Stage-4, Stage-6) - Conditional Operator - Stage-1 - Map 1 vectorized - File Output Operator [FS_10] - compressed:false - Statistics:Num rows: 306 Data size: 82044 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.hive.ql.io.orc.OrcInputFormat","output format:":"org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat","serde:":"org.apache.hadoop.hive.ql.io.orc.OrcSerde","name:":"default.orc_merge5"} - Select Operator [OP_9] - outputColumnNames:["_col0","_col1","_col2","_col3","_col4"] - Statistics:Num rows: 306 Data size: 82044 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_8] - predicate:(userid <= 13) (type: boolean) - Statistics:Num rows: 306 Data size: 82044 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_0] - alias:orc_merge5 - Statistics:Num rows: 919 Data size: 246402 Basic stats: COMPLETE Column stats: NONE - Stage-4(CONDITIONAL) - File Merge - ORC File Merge Operator [OFM_7] - Please refer to the previous Stage-8(CONDITIONAL CHILD TASKS: Stage-5, Stage-4, Stage-6) - Stage-7 - Move Operator - Stage-6(CONDITIONAL) - File Merge - ORC File Merge Operator [OFM_7] - Please refer to the previous Stage-8(CONDITIONAL CHILD TASKS: Stage-5, Stage-4, Stage-6) + Stats-Aggr Operator + Stage-0 + Move Operator + table:{"name:":"default.orc_merge5"} + Stage-2 + Dependency Collection{} + Stage-5(CONDITIONAL) + Move Operator + Stage-8(CONDITIONAL CHILD TASKS: Stage-5, Stage-4, Stage-6) + Conditional Operator + Stage-1 + Map 1 vectorized + File Output Operator [FS_10] + table:{"name:":"default.orc_merge5"} + Select Operator [OP_9] (rows=306 width=268) + Output:["_col0","_col1","_col2","_col3","_col4"] + Filter Operator [FIL_8] (rows=306 width=268) + predicate:(userid <= 13) + TableScan [TS_0] (rows=919 width=268) + default@orc_merge5,orc_merge5,Tbl:COMPLETE,Col:NONE,Output:["userid","string1","subtype","decimal1","ts"] + Stage-4(CONDITIONAL) + File Merge + ORC File Merge Operator [OFM_7] + Please refer to the previous Stage-8(CONDITIONAL CHILD TASKS: Stage-5, Stage-4, Stage-6) + Stage-7 + Move Operator + Stage-6(CONDITIONAL) + File Merge + ORC File Merge Operator [OFM_7] + Please refer to the previous Stage-8(CONDITIONAL CHILD TASKS: Stage-5, Stage-4, Stage-6) PREHOOK: query: drop table orc_merge5 PREHOOK: type: DROPTABLE @@ -715,47 +650,28 @@ Vertex dependency in root stage Map 2 <- Map 1 (CUSTOM_EDGE) Stage-0 - Fetch Operator - limit:-1 - Stage-1 - Map 2 - File Output Operator [FS_10] - compressed:false - Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - table:{"input format:":"org.apache.hadoop.mapred.TextInputFormat","output format:":"org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat","serde:":"org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"} - Select Operator [SEL_9] - outputColumnNames:["_col0","_col1","_col2"] - Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - Map Join Operator [MAPJOIN_15] - | BucketMapJoin:true - | condition map:[{"":"Inner Join 0 to 1"}] - | HybridGraceHashJoin:true - | keys:{"Map 1":"_col0 (type: int)","Map 2":"_col0 (type: int)"} - | outputColumnNames:["_col0","_col1","_col3"] - | Statistics:Num rows: 550 Data size: 5843 Basic stats: COMPLETE Column stats: NONE - |<-Map 1 [CUSTOM_EDGE] - | Reduce Output Operator [RS_6] - | key expressions:_col0 (type: int) - | Map-reduce partition columns:_col0 (type: int) - | sort order:+ - | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | value expressions:_col1 (type: string) - | Select Operator [SEL_2] - | outputColumnNames:["_col0","_col1"] - | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | Filter Operator [FIL_13] - | predicate:key is not null (type: boolean) - | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - | TableScan [TS_0] - | alias:a - | Statistics:Num rows: 242 Data size: 2566 Basic stats: COMPLETE Column stats: NONE - |<-Select Operator [SEL_5] - outputColumnNames:["_col0","_col1"] - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - Filter Operator [FIL_14] - predicate:key is not null (type: boolean) - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE - TableScan [TS_3] - alias:b - Statistics:Num rows: 500 Data size: 5312 Basic stats: COMPLETE Column stats: NONE + Fetch Operator + limit:-1 + Stage-1 + Map 2 + File Output Operator [FS_10] + Select Operator [SEL_9] (rows=550 width=10) + Output:["_col0","_col1","_col2"] + Map Join Operator [MAPJOIN_15] (rows=550 width=10) + BucketMapJoin:true,HybridGraceHashJoin:true,Output:["_col0","_col1","_col3"],keys:{"RS_6":"_col0","SEL_5":"_col0"} + <-Map 1 [CUSTOM_EDGE] + OTHER [RS_6] + PartitionCols:_col0 + Select Operator [SEL_2] (rows=242 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_13] (rows=242 width=10) + predicate:key is not null + TableScan [TS_0] (rows=242 width=10) + default@tab,a,Tbl:COMPLETE,Col:NONE,Output:["key","value"] + <-Select Operator [SEL_5] (rows=500 width=10) + Output:["_col0","_col1"] + Filter Operator [FIL_14] (rows=500 width=10) + predicate:key is not null + TableScan [TS_3] (rows=500 width=10) + default@tab_part,b,Tbl:COMPLETE,Col:NONE,Output:["key","value"]