hive-commits mailing list archives

Site index · List index
Message view « Date » · « Thread »
Top « Date » · « Thread »
From apivova...@apache.org
Subject hive git commit: HIVE-10706 Make vectorized_timestamp_funcs test more stable (Alexander Pivovarov, reviewed by Jason Dere)
Date Wed, 20 May 2015 06:19:12 GMT
Repository: hive
Updated Branches:
  refs/heads/master 3d95e1061 -> 0d0757b73


HIVE-10706 Make vectorized_timestamp_funcs test more stable (Alexander Pivovarov, reviewed by Jason Dere)


Project: http://git-wip-us.apache.org/repos/asf/hive/repo
Commit: http://git-wip-us.apache.org/repos/asf/hive/commit/0d0757b7
Tree: http://git-wip-us.apache.org/repos/asf/hive/tree/0d0757b7
Diff: http://git-wip-us.apache.org/repos/asf/hive/diff/0d0757b7

Branch: refs/heads/master
Commit: 0d0757b73e20465d3d5178524f41d93c39450481
Parents: 3d95e10
Author: Alexander Pivovarov <apivovarov@gmail.com>
Authored: Wed May 13 23:27:02 2015 -0700
Committer: Alexander Pivovarov <apivovarov@gmail.com>
Committed: Tue May 19 23:18:31 2015 -0700

----------------------------------------------------------------------
 .../clientpositive/vectorized_timestamp_funcs.q |  36 +++----
 .../spark/vectorized_timestamp_funcs.q.out      | 108 ++++++++++---------
 .../tez/vectorized_timestamp_funcs.q.out        | 108 ++++++++++---------
 .../vectorized_timestamp_funcs.q.out            | 108 ++++++++++---------
 4 files changed, 192 insertions(+), 168 deletions(-)
----------------------------------------------------------------------


http://git-wip-us.apache.org/repos/asf/hive/blob/0d0757b7/ql/src/test/queries/clientpositive/vectorized_timestamp_funcs.q
----------------------------------------------------------------------
diff --git a/ql/src/test/queries/clientpositive/vectorized_timestamp_funcs.q b/ql/src/test/queries/clientpositive/vectorized_timestamp_funcs.q
index 8a2d5aa..a6b7761 100644
--- a/ql/src/test/queries/clientpositive/vectorized_timestamp_funcs.q
+++ b/ql/src/test/queries/clientpositive/vectorized_timestamp_funcs.q
@@ -142,31 +142,31 @@ FROM alltypesorc_string;
 
 -- SUM of timestamps are not vectorized reduce-side because they produce a double instead of a long (HIVE-8211)...
 EXPLAIN SELECT
-  sum(ctimestamp1)
+  round(sum(ctimestamp1), 3)
 FROM alltypesorc_string;
 
 SELECT
- sum(ctimestamp1)
+ round(sum(ctimestamp1), 3)
 FROM alltypesorc_string;
 
 EXPLAIN SELECT
-  avg(ctimestamp1),
-  variance(ctimestamp1),
-  var_pop(ctimestamp1),
-  var_samp(ctimestamp1),
-  std(ctimestamp1),
-  stddev(ctimestamp1),
-  stddev_pop(ctimestamp1),
-  stddev_samp(ctimestamp1)
+  round(avg(ctimestamp1), 0),
+  variance(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_pop(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_samp(ctimestamp1) between 9.20684592523616E19 and 9.20684592523617E19,
+  round(std(ctimestamp1), 3),
+  round(stddev(ctimestamp1), 3),
+  round(stddev_pop(ctimestamp1), 3),
+  round(stddev_samp(ctimestamp1), 3)
 FROM alltypesorc_string;
 
 SELECT
-  avg(ctimestamp1),
-  variance(ctimestamp1),
-  var_pop(ctimestamp1),
-  var_samp(ctimestamp1),
-  std(ctimestamp1),
-  stddev(ctimestamp1),
-  stddev_pop(ctimestamp1),
-  stddev_samp(ctimestamp1)
+  round(avg(ctimestamp1), 0),
+  variance(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_pop(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_samp(ctimestamp1) between 9.20684592523616E19 and 9.20684592523617E19,
+  round(std(ctimestamp1), 3),
+  round(stddev(ctimestamp1), 3),
+  round(stddev_pop(ctimestamp1), 3),
+  round(stddev_samp(ctimestamp1), 3)
 FROM alltypesorc_string;
\ No newline at end of file

http://git-wip-us.apache.org/repos/asf/hive/blob/0d0757b7/ql/src/test/results/clientpositive/spark/vectorized_timestamp_funcs.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/spark/vectorized_timestamp_funcs.q.out b/ql/src/test/results/clientpositive/spark/vectorized_timestamp_funcs.q.out
index 3044582..e9bef38 100644
--- a/ql/src/test/results/clientpositive/spark/vectorized_timestamp_funcs.q.out
+++ b/ql/src/test/results/clientpositive/spark/vectorized_timestamp_funcs.q.out
@@ -697,12 +697,12 @@ POSTHOOK: Input: default@alltypesorc_string
 1969-12-31 23:59:44.088	1970-01-01 00:00:15.007	39	40
 PREHOOK: query: -- SUM of timestamps are not vectorized reduce-side because they produce a double instead of a long (HIVE-8211)...
 EXPLAIN SELECT
-  sum(ctimestamp1)
+  round(sum(ctimestamp1), 3)
 FROM alltypesorc_string
 PREHOOK: type: QUERY
 POSTHOOK: query: -- SUM of timestamps are not vectorized reduce-side because they produce a double instead of a long (HIVE-8211)...
 EXPLAIN SELECT
-  sum(ctimestamp1)
+  round(sum(ctimestamp1), 3)
 FROM alltypesorc_string
 POSTHOOK: type: QUERY
 STAGE DEPENDENCIES:
@@ -741,13 +741,17 @@ STAGE PLANS:
                 mode: mergepartial
                 outputColumnNames: _col0
                 Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
-                File Output Operator
-                  compressed: false
+                Select Operator
+                  expressions: round(_col0, 3) (type: double)
+                  outputColumnNames: _col0
                   Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
-                  table:
-                      input format: org.apache.hadoop.mapred.TextInputFormat
-                      output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
-                      serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
+                  File Output Operator
+                    compressed: false
+                    Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
+                    table:
+                        input format: org.apache.hadoop.mapred.TextInputFormat
+                        output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
+                        serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
             Execution mode: vectorized
 
   Stage: Stage-0
@@ -757,38 +761,38 @@ STAGE PLANS:
         ListSink
 
 PREHOOK: query: SELECT
- sum(ctimestamp1)
+ round(sum(ctimestamp1), 3)
 FROM alltypesorc_string
 PREHOOK: type: QUERY
 PREHOOK: Input: default@alltypesorc_string
 #### A masked pattern was here ####
 POSTHOOK: query: SELECT
- sum(ctimestamp1)
+ round(sum(ctimestamp1), 3)
 FROM alltypesorc_string
 POSTHOOK: type: QUERY
 POSTHOOK: Input: default@alltypesorc_string
 #### A masked pattern was here ####
-1123143.8569999998
+1123143.857
 PREHOOK: query: EXPLAIN SELECT
-  avg(ctimestamp1),
-  variance(ctimestamp1),
-  var_pop(ctimestamp1),
-  var_samp(ctimestamp1),
-  std(ctimestamp1),
-  stddev(ctimestamp1),
-  stddev_pop(ctimestamp1),
-  stddev_samp(ctimestamp1)
+  round(avg(ctimestamp1), 0),
+  variance(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_pop(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_samp(ctimestamp1) between 9.20684592523616E19 and 9.20684592523617E19,
+  round(std(ctimestamp1), 3),
+  round(stddev(ctimestamp1), 3),
+  round(stddev_pop(ctimestamp1), 3),
+  round(stddev_samp(ctimestamp1), 3)
 FROM alltypesorc_string
 PREHOOK: type: QUERY
 POSTHOOK: query: EXPLAIN SELECT
-  avg(ctimestamp1),
-  variance(ctimestamp1),
-  var_pop(ctimestamp1),
-  var_samp(ctimestamp1),
-  std(ctimestamp1),
-  stddev(ctimestamp1),
-  stddev_pop(ctimestamp1),
-  stddev_samp(ctimestamp1)
+  round(avg(ctimestamp1), 0),
+  variance(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_pop(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_samp(ctimestamp1) between 9.20684592523616E19 and 9.20684592523617E19,
+  round(std(ctimestamp1), 3),
+  round(stddev(ctimestamp1), 3),
+  round(stddev_pop(ctimestamp1), 3),
+  round(stddev_samp(ctimestamp1), 3)
 FROM alltypesorc_string
 POSTHOOK: type: QUERY
 STAGE DEPENDENCIES:
@@ -828,13 +832,17 @@ STAGE PLANS:
                 mode: mergepartial
                 outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7
                 Statistics: Num rows: 1 Data size: 64 Basic stats: COMPLETE Column stats: NONE
-                File Output Operator
-                  compressed: false
+                Select Operator
+                  expressions: round(_col0, 0) (type: double), _col1 BETWEEN 8.97077295279421E19 AND 8.97077295279422E19 (type: boolean), _col2 BETWEEN 8.97077295279421E19 AND 8.97077295279422E19 (type: boolean), _col3 BETWEEN 9.20684592523616E19 AND 9.20684592523617E19 (type: boolean), round(_col4, 3) (type: double), round(_col5, 3) (type: double), round(_col6, 3) (type: double), round(_col7, 3) (type: double)
+                  outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7
                   Statistics: Num rows: 1 Data size: 64 Basic stats: COMPLETE Column stats: NONE
-                  table:
-                      input format: org.apache.hadoop.mapred.TextInputFormat
-                      output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
-                      serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
+                  File Output Operator
+                    compressed: false
+                    Statistics: Num rows: 1 Data size: 64 Basic stats: COMPLETE Column stats: NONE
+                    table:
+                        input format: org.apache.hadoop.mapred.TextInputFormat
+                        output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
+                        serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
 
   Stage: Stage-0
     Fetch Operator
@@ -843,29 +851,29 @@ STAGE PLANS:
         ListSink
 
 PREHOOK: query: SELECT
-  avg(ctimestamp1),
-  variance(ctimestamp1),
-  var_pop(ctimestamp1),
-  var_samp(ctimestamp1),
-  std(ctimestamp1),
-  stddev(ctimestamp1),
-  stddev_pop(ctimestamp1),
-  stddev_samp(ctimestamp1)
+  round(avg(ctimestamp1), 0),
+  variance(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_pop(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_samp(ctimestamp1) between 9.20684592523616E19 and 9.20684592523617E19,
+  round(std(ctimestamp1), 3),
+  round(stddev(ctimestamp1), 3),
+  round(stddev_pop(ctimestamp1), 3),
+  round(stddev_samp(ctimestamp1), 3)
 FROM alltypesorc_string
 PREHOOK: type: QUERY
 PREHOOK: Input: default@alltypesorc_string
 #### A masked pattern was here ####
 POSTHOOK: query: SELECT
-  avg(ctimestamp1),
-  variance(ctimestamp1),
-  var_pop(ctimestamp1),
-  var_samp(ctimestamp1),
-  std(ctimestamp1),
-  stddev(ctimestamp1),
-  stddev_pop(ctimestamp1),
-  stddev_samp(ctimestamp1)
+  round(avg(ctimestamp1), 0),
+  variance(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_pop(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_samp(ctimestamp1) between 9.20684592523616E19 and 9.20684592523617E19,
+  round(std(ctimestamp1), 3),
+  round(stddev(ctimestamp1), 3),
+  round(stddev_pop(ctimestamp1), 3),
+  round(stddev_samp(ctimestamp1), 3)
 FROM alltypesorc_string
 POSTHOOK: type: QUERY
 POSTHOOK: Input: default@alltypesorc_string
 #### A masked pattern was here ####
-2.8798560435897438E13	8.970772952794214E19	8.970772952794214E19	9.206845925236167E19	9.471416447815086E9	9.471416447815086E9	9.471416447815086E9	9.595231068211004E9
+2.8798560435897E13	true	true	true	9.471416447815E9	9.471416447815E9	9.471416447815E9	9.595231068211E9

http://git-wip-us.apache.org/repos/asf/hive/blob/0d0757b7/ql/src/test/results/clientpositive/tez/vectorized_timestamp_funcs.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/tez/vectorized_timestamp_funcs.q.out b/ql/src/test/results/clientpositive/tez/vectorized_timestamp_funcs.q.out
index fa3ed21..76e6686 100644
--- a/ql/src/test/results/clientpositive/tez/vectorized_timestamp_funcs.q.out
+++ b/ql/src/test/results/clientpositive/tez/vectorized_timestamp_funcs.q.out
@@ -697,12 +697,12 @@ POSTHOOK: Input: default@alltypesorc_string
 1969-12-31 23:59:44.088	1970-01-01 00:00:15.007	39	40
 PREHOOK: query: -- SUM of timestamps are not vectorized reduce-side because they produce a double instead of a long (HIVE-8211)...
 EXPLAIN SELECT
-  sum(ctimestamp1)
+  round(sum(ctimestamp1), 3)
 FROM alltypesorc_string
 PREHOOK: type: QUERY
 POSTHOOK: query: -- SUM of timestamps are not vectorized reduce-side because they produce a double instead of a long (HIVE-8211)...
 EXPLAIN SELECT
-  sum(ctimestamp1)
+  round(sum(ctimestamp1), 3)
 FROM alltypesorc_string
 POSTHOOK: type: QUERY
 STAGE DEPENDENCIES:
@@ -741,13 +741,17 @@ STAGE PLANS:
                 mode: mergepartial
                 outputColumnNames: _col0
                 Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
-                File Output Operator
-                  compressed: false
+                Select Operator
+                  expressions: round(_col0, 3) (type: double)
+                  outputColumnNames: _col0
                   Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
-                  table:
-                      input format: org.apache.hadoop.mapred.TextInputFormat
-                      output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
-                      serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
+                  File Output Operator
+                    compressed: false
+                    Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
+                    table:
+                        input format: org.apache.hadoop.mapred.TextInputFormat
+                        output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
+                        serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
             Execution mode: vectorized
 
   Stage: Stage-0
@@ -757,38 +761,38 @@ STAGE PLANS:
         ListSink
 
 PREHOOK: query: SELECT
- sum(ctimestamp1)
+ round(sum(ctimestamp1), 3)
 FROM alltypesorc_string
 PREHOOK: type: QUERY
 PREHOOK: Input: default@alltypesorc_string
 #### A masked pattern was here ####
 POSTHOOK: query: SELECT
- sum(ctimestamp1)
+ round(sum(ctimestamp1), 3)
 FROM alltypesorc_string
 POSTHOOK: type: QUERY
 POSTHOOK: Input: default@alltypesorc_string
 #### A masked pattern was here ####
-1123143.8569999998
+1123143.857
 PREHOOK: query: EXPLAIN SELECT
-  avg(ctimestamp1),
-  variance(ctimestamp1),
-  var_pop(ctimestamp1),
-  var_samp(ctimestamp1),
-  std(ctimestamp1),
-  stddev(ctimestamp1),
-  stddev_pop(ctimestamp1),
-  stddev_samp(ctimestamp1)
+  round(avg(ctimestamp1), 0),
+  variance(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_pop(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_samp(ctimestamp1) between 9.20684592523616E19 and 9.20684592523617E19,
+  round(std(ctimestamp1), 3),
+  round(stddev(ctimestamp1), 3),
+  round(stddev_pop(ctimestamp1), 3),
+  round(stddev_samp(ctimestamp1), 3)
 FROM alltypesorc_string
 PREHOOK: type: QUERY
 POSTHOOK: query: EXPLAIN SELECT
-  avg(ctimestamp1),
-  variance(ctimestamp1),
-  var_pop(ctimestamp1),
-  var_samp(ctimestamp1),
-  std(ctimestamp1),
-  stddev(ctimestamp1),
-  stddev_pop(ctimestamp1),
-  stddev_samp(ctimestamp1)
+  round(avg(ctimestamp1), 0),
+  variance(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_pop(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_samp(ctimestamp1) between 9.20684592523616E19 and 9.20684592523617E19,
+  round(std(ctimestamp1), 3),
+  round(stddev(ctimestamp1), 3),
+  round(stddev_pop(ctimestamp1), 3),
+  round(stddev_samp(ctimestamp1), 3)
 FROM alltypesorc_string
 POSTHOOK: type: QUERY
 STAGE DEPENDENCIES:
@@ -828,13 +832,17 @@ STAGE PLANS:
                 mode: mergepartial
                 outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7
                 Statistics: Num rows: 1 Data size: 64 Basic stats: COMPLETE Column stats: NONE
-                File Output Operator
-                  compressed: false
+                Select Operator
+                  expressions: round(_col0, 0) (type: double), _col1 BETWEEN 8.97077295279421E19 AND 8.97077295279422E19 (type: boolean), _col2 BETWEEN 8.97077295279421E19 AND 8.97077295279422E19 (type: boolean), _col3 BETWEEN 9.20684592523616E19 AND 9.20684592523617E19 (type: boolean), round(_col4, 3) (type: double), round(_col5, 3) (type: double), round(_col6, 3) (type: double), round(_col7, 3) (type: double)
+                  outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7
                   Statistics: Num rows: 1 Data size: 64 Basic stats: COMPLETE Column stats: NONE
-                  table:
-                      input format: org.apache.hadoop.mapred.TextInputFormat
-                      output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
-                      serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
+                  File Output Operator
+                    compressed: false
+                    Statistics: Num rows: 1 Data size: 64 Basic stats: COMPLETE Column stats: NONE
+                    table:
+                        input format: org.apache.hadoop.mapred.TextInputFormat
+                        output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
+                        serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
 
   Stage: Stage-0
     Fetch Operator
@@ -843,29 +851,29 @@ STAGE PLANS:
         ListSink
 
 PREHOOK: query: SELECT
-  avg(ctimestamp1),
-  variance(ctimestamp1),
-  var_pop(ctimestamp1),
-  var_samp(ctimestamp1),
-  std(ctimestamp1),
-  stddev(ctimestamp1),
-  stddev_pop(ctimestamp1),
-  stddev_samp(ctimestamp1)
+  round(avg(ctimestamp1), 0),
+  variance(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_pop(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_samp(ctimestamp1) between 9.20684592523616E19 and 9.20684592523617E19,
+  round(std(ctimestamp1), 3),
+  round(stddev(ctimestamp1), 3),
+  round(stddev_pop(ctimestamp1), 3),
+  round(stddev_samp(ctimestamp1), 3)
 FROM alltypesorc_string
 PREHOOK: type: QUERY
 PREHOOK: Input: default@alltypesorc_string
 #### A masked pattern was here ####
 POSTHOOK: query: SELECT
-  avg(ctimestamp1),
-  variance(ctimestamp1),
-  var_pop(ctimestamp1),
-  var_samp(ctimestamp1),
-  std(ctimestamp1),
-  stddev(ctimestamp1),
-  stddev_pop(ctimestamp1),
-  stddev_samp(ctimestamp1)
+  round(avg(ctimestamp1), 0),
+  variance(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_pop(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_samp(ctimestamp1) between 9.20684592523616E19 and 9.20684592523617E19,
+  round(std(ctimestamp1), 3),
+  round(stddev(ctimestamp1), 3),
+  round(stddev_pop(ctimestamp1), 3),
+  round(stddev_samp(ctimestamp1), 3)
 FROM alltypesorc_string
 POSTHOOK: type: QUERY
 POSTHOOK: Input: default@alltypesorc_string
 #### A masked pattern was here ####
-2.8798560435897438E13	8.970772952794212E19	8.970772952794212E19	9.206845925236166E19	9.471416447815084E9	9.471416447815084E9	9.471416447815084E9	9.595231068211002E9
+2.8798560435897E13	true	true	true	9.471416447815E9	9.471416447815E9	9.471416447815E9	9.595231068211E9

http://git-wip-us.apache.org/repos/asf/hive/blob/0d0757b7/ql/src/test/results/clientpositive/vectorized_timestamp_funcs.q.out
----------------------------------------------------------------------
diff --git a/ql/src/test/results/clientpositive/vectorized_timestamp_funcs.q.out b/ql/src/test/results/clientpositive/vectorized_timestamp_funcs.q.out
index 31a96c6..b3bb908 100644
--- a/ql/src/test/results/clientpositive/vectorized_timestamp_funcs.q.out
+++ b/ql/src/test/results/clientpositive/vectorized_timestamp_funcs.q.out
@@ -662,12 +662,12 @@ POSTHOOK: Input: default@alltypesorc_string
 1969-12-31 23:59:44.088	1970-01-01 00:00:15.007	39	40
 PREHOOK: query: -- SUM of timestamps are not vectorized reduce-side because they produce a double instead of a long (HIVE-8211)...
 EXPLAIN SELECT
-  sum(ctimestamp1)
+  round(sum(ctimestamp1), 3)
 FROM alltypesorc_string
 PREHOOK: type: QUERY
 POSTHOOK: query: -- SUM of timestamps are not vectorized reduce-side because they produce a double instead of a long (HIVE-8211)...
 EXPLAIN SELECT
-  sum(ctimestamp1)
+  round(sum(ctimestamp1), 3)
 FROM alltypesorc_string
 POSTHOOK: type: QUERY
 STAGE DEPENDENCIES:
@@ -700,13 +700,17 @@ STAGE PLANS:
           mode: mergepartial
           outputColumnNames: _col0
           Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
-          File Output Operator
-            compressed: false
+          Select Operator
+            expressions: round(_col0, 3) (type: double)
+            outputColumnNames: _col0
             Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
-            table:
-                input format: org.apache.hadoop.mapred.TextInputFormat
-                output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
-                serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
+            File Output Operator
+              compressed: false
+              Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: NONE
+              table:
+                  input format: org.apache.hadoop.mapred.TextInputFormat
+                  output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
+                  serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
 
   Stage: Stage-0
     Fetch Operator
@@ -715,38 +719,38 @@ STAGE PLANS:
         ListSink
 
 PREHOOK: query: SELECT
- sum(ctimestamp1)
+ round(sum(ctimestamp1), 3)
 FROM alltypesorc_string
 PREHOOK: type: QUERY
 PREHOOK: Input: default@alltypesorc_string
 #### A masked pattern was here ####
 POSTHOOK: query: SELECT
- sum(ctimestamp1)
+ round(sum(ctimestamp1), 3)
 FROM alltypesorc_string
 POSTHOOK: type: QUERY
 POSTHOOK: Input: default@alltypesorc_string
 #### A masked pattern was here ####
-1123143.8569999998
+1123143.857
 PREHOOK: query: EXPLAIN SELECT
-  avg(ctimestamp1),
-  variance(ctimestamp1),
-  var_pop(ctimestamp1),
-  var_samp(ctimestamp1),
-  std(ctimestamp1),
-  stddev(ctimestamp1),
-  stddev_pop(ctimestamp1),
-  stddev_samp(ctimestamp1)
+  round(avg(ctimestamp1), 0),
+  variance(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_pop(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_samp(ctimestamp1) between 9.20684592523616E19 and 9.20684592523617E19,
+  round(std(ctimestamp1), 3),
+  round(stddev(ctimestamp1), 3),
+  round(stddev_pop(ctimestamp1), 3),
+  round(stddev_samp(ctimestamp1), 3)
 FROM alltypesorc_string
 PREHOOK: type: QUERY
 POSTHOOK: query: EXPLAIN SELECT
-  avg(ctimestamp1),
-  variance(ctimestamp1),
-  var_pop(ctimestamp1),
-  var_samp(ctimestamp1),
-  std(ctimestamp1),
-  stddev(ctimestamp1),
-  stddev_pop(ctimestamp1),
-  stddev_samp(ctimestamp1)
+  round(avg(ctimestamp1), 0),
+  variance(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_pop(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_samp(ctimestamp1) between 9.20684592523616E19 and 9.20684592523617E19,
+  round(std(ctimestamp1), 3),
+  round(stddev(ctimestamp1), 3),
+  round(stddev_pop(ctimestamp1), 3),
+  round(stddev_samp(ctimestamp1), 3)
 FROM alltypesorc_string
 POSTHOOK: type: QUERY
 STAGE DEPENDENCIES:
@@ -780,13 +784,17 @@ STAGE PLANS:
           mode: mergepartial
           outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7
           Statistics: Num rows: 1 Data size: 64 Basic stats: COMPLETE Column stats: NONE
-          File Output Operator
-            compressed: false
+          Select Operator
+            expressions: round(_col0, 0) (type: double), _col1 BETWEEN 8.97077295279421E19 AND 8.97077295279422E19 (type: boolean), _col2 BETWEEN 8.97077295279421E19 AND 8.97077295279422E19 (type: boolean), _col3 BETWEEN 9.20684592523616E19 AND 9.20684592523617E19 (type: boolean), round(_col4, 3) (type: double), round(_col5, 3) (type: double), round(_col6, 3) (type: double), round(_col7, 3) (type: double)
+            outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7
             Statistics: Num rows: 1 Data size: 64 Basic stats: COMPLETE Column stats: NONE
-            table:
-                input format: org.apache.hadoop.mapred.TextInputFormat
-                output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
-                serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
+            File Output Operator
+              compressed: false
+              Statistics: Num rows: 1 Data size: 64 Basic stats: COMPLETE Column stats: NONE
+              table:
+                  input format: org.apache.hadoop.mapred.TextInputFormat
+                  output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
+                  serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
 
   Stage: Stage-0
     Fetch Operator
@@ -795,29 +803,29 @@ STAGE PLANS:
         ListSink
 
 PREHOOK: query: SELECT
-  avg(ctimestamp1),
-  variance(ctimestamp1),
-  var_pop(ctimestamp1),
-  var_samp(ctimestamp1),
-  std(ctimestamp1),
-  stddev(ctimestamp1),
-  stddev_pop(ctimestamp1),
-  stddev_samp(ctimestamp1)
+  round(avg(ctimestamp1), 0),
+  variance(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_pop(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_samp(ctimestamp1) between 9.20684592523616E19 and 9.20684592523617E19,
+  round(std(ctimestamp1), 3),
+  round(stddev(ctimestamp1), 3),
+  round(stddev_pop(ctimestamp1), 3),
+  round(stddev_samp(ctimestamp1), 3)
 FROM alltypesorc_string
 PREHOOK: type: QUERY
 PREHOOK: Input: default@alltypesorc_string
 #### A masked pattern was here ####
 POSTHOOK: query: SELECT
-  avg(ctimestamp1),
-  variance(ctimestamp1),
-  var_pop(ctimestamp1),
-  var_samp(ctimestamp1),
-  std(ctimestamp1),
-  stddev(ctimestamp1),
-  stddev_pop(ctimestamp1),
-  stddev_samp(ctimestamp1)
+  round(avg(ctimestamp1), 0),
+  variance(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_pop(ctimestamp1) between 8.97077295279421E19 and 8.97077295279422E19,
+  var_samp(ctimestamp1) between 9.20684592523616E19 and 9.20684592523617E19,
+  round(std(ctimestamp1), 3),
+  round(stddev(ctimestamp1), 3),
+  round(stddev_pop(ctimestamp1), 3),
+  round(stddev_samp(ctimestamp1), 3)
 FROM alltypesorc_string
 POSTHOOK: type: QUERY
 POSTHOOK: Input: default@alltypesorc_string
 #### A masked pattern was here ####
-2.8798560435897438E13	8.970772952794212E19	8.970772952794212E19	9.206845925236166E19	9.471416447815084E9	9.471416447815084E9	9.471416447815084E9	9.595231068211002E9
+2.8798560435897E13	true	true	true	9.471416447815E9	9.471416447815E9	9.471416447815E9	9.595231068211E9


Mime
View raw message