Uploaded image for project: 'Kylin'
  1. Kylin
  2. KYLIN-5088

Kylin 4 cube build does not correctly process an exploded array column

    XMLWordPrintableJSON

Details

    • Bug
    • Status: Open
    • Major
    • Resolution: Unresolved
    • v4.0.0
    • None
    • Spark Engine
    • None

    Description

      There is a Hive (hive-3.1.2) table and a view defined as below:

       

      // Hive SQL
      create table pageAds2(id int,pageid STRING,adid_list Array<string>) row format delimited fields terminated by ',' collection items terminated by '_';
      
      insert into pageAds2 select 1, 'front_page', array('1','2','3');
      insert into pageAds2 select 2, 'contact_page', array('3','4','5');
      
      create view pageAds2_view as SELECT pageid, adid FROM pageAds2 LATERAL VIEW explode(adid_list) adTable AS adid;
      

      After building a cube on pageAds2_view (the cube's SQL and JSON definition are shown below):

      //SQL
      SELECT
      `PAGEADS2_VIEW`.`PAGEID` as `PAGEADS2_VIEW_PAGEID`
      ,`PAGEADS2_VIEW`.`ADID` as `PAGEADS2_VIEW_ADID`
       FROM `DEFAULT`.`PAGEADS2_VIEW` as `PAGEADS2_VIEW`
      WHERE 1=1
      
      // JSON(CUBE)
      {
        "uuid": "391cdd5b-dbe9-6877-92fe-38f90ab55314",
        "last_modified": 1631355523311,
        "version": "4.0.0.0",
        "name": "pageAds2_view_cube_v1",
        "is_draft": false,
        "model_name": "pageAds2_view_model_v1",
        "description": "",
        "null_string": null,
        "dimensions": [
          {
            "name": "PAGEID",
            "table": "PAGEADS2_VIEW",
            "column": "PAGEID",
            "derived": null
          },
          {
            "name": "ADID",
            "table": "PAGEADS2_VIEW",
            "column": "ADID",
            "derived": null
          }
        ],
        "measures": [
          {
            "name": "_COUNT_",
            "function": {
              "expression": "COUNT",
              "parameter": {
                "type": "constant",
                "value": "1"
              },
              "returntype": "bigint"
            }
          }
        ],
        "dictionaries": [],
        "rowkey": {
          "rowkey_columns": [
            {
              "column": "PAGEADS2_VIEW.PAGEID",
              "encoding": "dict",
              "encoding_version": 1,
              "isShardBy": false
            },
            {
              "column": "PAGEADS2_VIEW.ADID",
              "encoding": "dict",
              "encoding_version": 1,
              "isShardBy": false
            }
          ]
        },
        "hbase_mapping": {
          "column_family": [
            {
              "name": "F1",
              "columns": [
                {
                  "qualifier": "M",
                  "measure_refs": [
                    "_COUNT_"
                  ]
                }
              ]
            }
          ]
        },
        "aggregation_groups": [
          {
            "includes": [
              "PAGEADS2_VIEW.PAGEID",
              "PAGEADS2_VIEW.ADID"
            ],
            "select_rule": {
              "hierarchy_dims": [],
              "mandatory_dims": [],
              "joint_dims": []
            }
          }
        ],
        "signature": "NdkZMCVkiStcS9+r2eEB0A==",
        "notify_list": [],
        "status_need_notify": [
          "ERROR",
          "DISCARDED",
          "SUCCEED"
        ],
        "partition_date_start": 0,
        "partition_date_end": 3153600000000,
        "auto_merge_time_ranges": [
          604800000,
          2419200000
        ],
        "volatile_range": 0,
        "retention_range": 0,
        "engine_type": 6,
        "storage_type": 2,
        "override_kylin_properties": {},
        "cuboid_black_list": [],
        "parent_forward": 3,
        "mandatory_dimension_set_list": [],
        "snapshot_table_desc_list": []
      }

      In Kylin Insight, execute the SQL below:

      // Kylin SQL
      select ADID , count(*) from PAGEADS2_VIEW group by ADID
      

      The following result is returned:

      ADID EXPR$1
      1_2_3 1
      3_4_5 1

       
       However, executing the same SQL in Hive returns the result below:

      adid _c1
      1 1
      2 1
      3 2
      4 1
      5 1

       
       

       

       

       

       

       

      Attachments

        Activity

          People

            Unassigned Unassigned
            zhuguowei Guowei Zhu
            Votes:
            0 Vote for this issue
            Watchers:
            1 Start watching this issue

            Dates

              Created:
              Updated: