carbondata-issues mailing list archives

Site index · List index
Message view « Date » · « Thread »
Top « Date » · « Thread »
From "xubo245 (JIRA)" <j...@apache.org>
Subject [jira] [Created] (CARBONDATA-2085) It's different between load twice and create datamap with load again after load data and create datamap
Date Fri, 26 Jan 2018 03:38:03 GMT
xubo245 created CARBONDATA-2085:
-----------------------------------

             Summary: It's different between load twice and create datamap with load again
after load data and create datamap
                 Key: CARBONDATA-2085
                 URL: https://issues.apache.org/jira/browse/CARBONDATA-2085
             Project: CarbonData
          Issue Type: Bug
          Components: core, spark-integration
    Affects Versions: 1.3.0
            Reporter: xubo245
             Fix For: 1.3.0


It's different between load twice and create datamap with load again after load data and create
datamap


{code:java}
 test("test if timeseries load twice is successful on table creation") {
    sql("drop table if exists mainTable")
    sql(
      """
        | CREATE TABLE mainTable(
        |   mytime timestamp,
        |   name string,
        |   age int)
        | STORED BY 'org.apache.carbondata.format'
      """.stripMargin)
    sql(s"LOAD DATA LOCAL INPATH '$resourcesPath/timeseriestest.csv' into table mainTable")
    sql(s"LOAD DATA LOCAL INPATH '$resourcesPath/timeseriestest.csv' into table mainTable")
    sql(
      """
        | create datamap agg0 on table mainTable
        | using 'preaggregate'
        | DMPROPERTIES (
        |   'timeseries.eventTime'='mytime',
        |   'timeseries.hierarchy'='second=1,minute=1,hour=1,day=1,month=1,year=1')
        | as select mytime, sum(age)
        | from mainTable
        | group by mytime
      """.stripMargin)
    checkAnswer(sql("select * from maintable_agg0_second"),
      Seq(Row(Timestamp.valueOf("2016-02-23 01:01:30.0"), 20),
        Row(Timestamp.valueOf("2016-02-23 01:01:40.0"), 40),
        Row(Timestamp.valueOf("2016-02-23 01:01:50.0"), 60),
        Row(Timestamp.valueOf("2016-02-23 01:02:30.0"), 80),
        Row(Timestamp.valueOf("2016-02-23 01:02:40.0"), 100),
        Row(Timestamp.valueOf("2016-02-23 01:02:50.0"), 100)))
  }

  // TODO: to be fixed
  ignore("load data into mainTable after create timeseries datamap on table") {
    sql("drop table if exists mainTable")
    sql(
      """
        | CREATE TABLE mainTable(
        |   mytime timestamp,
        |   name string,
        |   age int)
        | STORED BY 'org.apache.carbondata.format'
      """.stripMargin)
    sql(s"LOAD DATA LOCAL INPATH '$resourcesPath/timeseriestest.csv' into table mainTable")
    sql(
      """
        | create datamap agg0 on table mainTable
        | using 'preaggregate'
        | DMPROPERTIES (
        |   'timeseries.eventTime'='mytime',
        |   'timeseries.hierarchy'='second=1,minute=1,hour=1,day=1,month=1,year=1')
        | as select mytime, sum(age)
        | from mainTable
        | group by mytime""".stripMargin)


    sql(s"LOAD DATA LOCAL INPATH '$resourcesPath/timeseriestest.csv' into table mainTable")

    // Discussed
    checkAnswer(sql("select * from maintable_agg0_second"),
      Seq(Row(Timestamp.valueOf("2016-02-23 01:01:30.0"), 20),
        Row(Timestamp.valueOf("2016-02-23 01:01:40.0"), 40),
        Row(Timestamp.valueOf("2016-02-23 01:01:50.0"), 60),
        Row(Timestamp.valueOf("2016-02-23 01:02:30.0"), 80),
        Row(Timestamp.valueOf("2016-02-23 01:02:40.0"), 100),
        Row(Timestamp.valueOf("2016-02-23 01:02:50.0"), 100)))

    //TODO: to be discussed, why is success?
    //    checkAnswer(sql("select * from maintable_agg0_second"),
    //      Seq(Row(Timestamp.valueOf("2016-02-23 01:01:30.0"), 10),
    //        Row(Timestamp.valueOf("2016-02-23 01:01:40.0"), 20),
    //        Row(Timestamp.valueOf("2016-02-23 01:01:50.0"), 30),
    //        Row(Timestamp.valueOf("2016-02-23 01:02:30.0"), 40),
    //        Row(Timestamp.valueOf("2016-02-23 01:02:40.0"), 50),
    //        Row(Timestamp.valueOf("2016-02-23 01:02:50.0"), 50),
    //        Row(Timestamp.valueOf("2016-02-23 01:01:30.0"), 10),
    //        Row(Timestamp.valueOf("2016-02-23 01:01:40.0"), 20),
    //        Row(Timestamp.valueOf("2016-02-23 01:01:50.0"), 30),
    //        Row(Timestamp.valueOf("2016-02-23 01:02:30.0"), 40),
    //        Row(Timestamp.valueOf("2016-02-23 01:02:40.0"), 50),
    //        Row(Timestamp.valueOf("2016-02-23 01:02:50.0"), 50)))
  }

{code}




--
This message was sent by Atlassian JIRA
(v7.6.3#76005)

Mime
View raw message