kylin-learn_kylin表结构解读

2020-02-19  本文已影响0人  李小李的路

背景

# 用户账户表
kylin_account
# 日期维度
kylin_cal_dt
# 商品类别表
kylin_category_groupings
# 地理位置国家表
kylin_country
# Sales order table, fact table
kylin_sales

数仓模型

事实表 kylin_sales

CREATE TABLE `kylin_sales`(
  `trans_id` bigint, 
  `part_dt` date COMMENT 'Order Date', 
  `lstg_format_name` string COMMENT 'Order Transaction Type', 
  `leaf_categ_id` bigint COMMENT 'Category ID', 
  `lstg_site_id` int COMMENT 'Site ID', 
  `slr_segment_cd` smallint, 
  `price` decimal(19,4) COMMENT 'Order Price', 
  `item_count` bigint COMMENT 'Number of Purchased Goods', 
  `seller_id` bigint COMMENT 'Seller ID', 
  `buyer_id` bigint COMMENT 'Buyer ID', 
  `ops_user_id` string COMMENT 'System User ID', 
  `ops_region` string COMMENT 'System User Region')
COMMENT 'Sales order table, fact table'
ROW FORMAT SERDE 
  'org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe' 
WITH SERDEPROPERTIES ( 
  'field.delim'=',', 
  'serialization.format'=',') 
STORED AS INPUTFORMAT 
  'org.apache.hadoop.mapred.TextInputFormat' 
OUTPUTFORMAT 
  'org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat'
LOCATION
  'hdfs://bigdata/user/hive/warehouse/kylin_sales'
TBLPROPERTIES (
  'transient_lastDdlTime'='1580892437')

维度表 kylin_account

CREATE TABLE `kylin_account`(
  `account_id` bigint, 
  `account_buyer_level` int COMMENT 'Account Buyer Level', 
  `account_seller_level` int COMMENT 'Account Seller Level', 
  `account_country` string COMMENT 'Account Country', 
  `account_contact` string COMMENT 'Account Contact Info')
ROW FORMAT SERDE 
  'org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe' 
WITH SERDEPROPERTIES ( 
  'field.delim'=',', 
  'serialization.format'=',') 
STORED AS INPUTFORMAT 
  'org.apache.hadoop.mapred.TextInputFormat' 
OUTPUTFORMAT 
  'org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat'
LOCATION
  'hdfs://bigdata/user/hive/warehouse/kylin_account'
TBLPROPERTIES (
  'transient_lastDdlTime'='1580892437')

维度表 kylin_cal_dt

CREATE TABLE `kylin_cal_dt`(
  `cal_dt` date COMMENT 'Date, PK', 
  `year_beg_dt` date COMMENT 'YEAR Begin Date', 
  `qtr_beg_dt` date COMMENT 'Quarter Begin Date', 
  `month_beg_dt` date COMMENT 'Month Begin Date', 
  `week_beg_dt` date COMMENT 'Week Begin Date', 
  `age_for_year_id` smallint, 
  `age_for_qtr_id` smallint, 
  `age_for_month_id` smallint, 
  `age_for_week_id` smallint, 
  `age_for_dt_id` smallint, 
  `age_for_rtl_year_id` smallint, 
  `age_for_rtl_qtr_id` smallint, 
  `age_for_rtl_month_id` smallint, 
  `age_for_rtl_week_id` smallint, 
  `age_for_cs_week_id` smallint, 
  `day_of_cal_id` int, 
  `day_of_year_id` smallint, 
  `day_of_qtr_id` smallint, 
  `day_of_month_id` smallint, 
  `day_of_week_id` int, 
  `week_of_year_id` tinyint, 
  `week_of_cal_id` int, 
  `month_of_qtr_id` tinyint, 
  `month_of_year_id` tinyint, 
  `month_of_cal_id` smallint, 
  `qtr_of_year_id` tinyint, 
  `qtr_of_cal_id` smallint, 
  `year_of_cal_id` smallint, 
  `year_end_dt` string, 
  `qtr_end_dt` string, 
  `month_end_dt` string, 
  `week_end_dt` string, 
  `cal_dt_name` string, 
  `cal_dt_desc` string, 
  `cal_dt_short_name` string, 
  `ytd_yn_id` tinyint, 
  `qtd_yn_id` tinyint, 
  `mtd_yn_id` tinyint, 
  `wtd_yn_id` tinyint, 
  `season_beg_dt` string, 
  `day_in_year_count` smallint, 
  `day_in_qtr_count` tinyint, 
  `day_in_month_count` tinyint, 
  `day_in_week_count` tinyint, 
  `rtl_year_beg_dt` string, 
  `rtl_qtr_beg_dt` string, 
  `rtl_month_beg_dt` string, 
  `rtl_week_beg_dt` string, 
  `cs_week_beg_dt` string, 
  `cal_date` string, 
  `day_of_week` string, 
  `month_id` string, 
  `prd_desc` string, 
  `prd_flag` string, 
  `prd_id` string, 
  `prd_ind` string, 
  `qtr_desc` string, 
  `qtr_id` string, 
  `qtr_ind` string, 
  `retail_week` string, 
  `retail_year` string, 
  `retail_start_date` string, 
  `retail_wk_end_date` string, 
  `week_ind` string, 
  `week_num_desc` string, 
  `week_beg_date` string, 
  `week_end_date` string, 
  `week_in_year_id` string, 
  `week_id` string, 
  `week_beg_end_desc_mdy` string, 
  `week_beg_end_desc_md` string, 
  `year_id` string, 
  `year_ind` string, 
  `cal_dt_mns_1year_dt` string, 
  `cal_dt_mns_2year_dt` string, 
  `cal_dt_mns_1qtr_dt` string, 
  `cal_dt_mns_2qtr_dt` string, 
  `cal_dt_mns_1month_dt` string, 
  `cal_dt_mns_2month_dt` string, 
  `cal_dt_mns_1week_dt` string, 
  `cal_dt_mns_2week_dt` string, 
  `curr_cal_dt_mns_1year_yn_id` tinyint, 
  `curr_cal_dt_mns_2year_yn_id` tinyint, 
  `curr_cal_dt_mns_1qtr_yn_id` tinyint, 
  `curr_cal_dt_mns_2qtr_yn_id` tinyint, 
  `curr_cal_dt_mns_1month_yn_id` tinyint, 
  `curr_cal_dt_mns_2month_yn_id` tinyint, 
  `curr_cal_dt_mns_1week_yn_ind` tinyint, 
  `curr_cal_dt_mns_2week_yn_ind` tinyint, 
  `rtl_month_of_rtl_year_id` string, 
  `rtl_qtr_of_rtl_year_id` tinyint, 
  `rtl_week_of_rtl_year_id` tinyint, 
  `season_of_year_id` tinyint, 
  `ytm_yn_id` tinyint, 
  `ytq_yn_id` tinyint, 
  `ytw_yn_id` tinyint, 
  `kylin_cal_dt_cre_date` string, 
  `kylin_cal_dt_cre_user` string, 
  `kylin_cal_dt_upd_date` string, 
  `kylin_cal_dt_upd_user` string)
COMMENT 'Date Dimension Table'
ROW FORMAT SERDE 
  'org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe' 
WITH SERDEPROPERTIES ( 
  'field.delim'=',', 
  'serialization.format'=',') 
STORED AS INPUTFORMAT 
  'org.apache.hadoop.mapred.TextInputFormat' 
OUTPUTFORMAT 
  'org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat'
LOCATION
  'hdfs://bigdata/user/hive/warehouse/kylin_cal_dt'
TBLPROPERTIES (
  'transient_lastDdlTime'='1580892438')

维度表 kylin_category_groupings

CREATE TABLE `kylin_category_groupings`(
  `leaf_categ_id` bigint COMMENT 'Category ID, PK', 
  `leaf_categ_name` string, 
  `site_id` int COMMENT 'Site ID, PK', 
  `categ_busn_mgr` string, 
  `categ_busn_unit` string, 
  `regn_categ` string, 
  `user_defined_field1` string COMMENT 'User Defined Field1', 
  `user_defined_field3` string COMMENT 'User Defined Field3', 
  `kylin_groupings_cre_date` string, 
  `kylin_groupings_upd_date` string COMMENT 'Last Updated Date', 
  `kylin_groupings_cre_user` string, 
  `kylin_groupings_upd_user` string COMMENT 'Last Updated User', 
  `meta_categ_id` decimal(10,0), 
  `meta_categ_name` string COMMENT 'Level1 Category', 
  `categ_lvl2_id` decimal(10,0), 
  `categ_lvl3_id` decimal(10,0), 
  `categ_lvl4_id` decimal(10,0), 
  `categ_lvl5_id` decimal(10,0), 
  `categ_lvl6_id` decimal(10,0), 
  `categ_lvl7_id` decimal(10,0), 
  `categ_lvl2_name` string COMMENT 'Level2 Category', 
  `categ_lvl3_name` string COMMENT 'Level3 Category', 
  `categ_lvl4_name` string, 
  `categ_lvl5_name` string, 
  `categ_lvl6_name` string, 
  `categ_lvl7_name` string, 
  `categ_flags` decimal(10,0), 
  `adult_categ_yn` string, 
  `domain_id` decimal(10,0), 
  `user_defined_field5` string, 
  `vcs_id` decimal(10,0), 
  `gcs_id` decimal(10,0), 
  `move_to` decimal(10,0), 
  `sap_category_id` decimal(10,0), 
  `src_id` tinyint, 
  `bsns_vrtcl_name` string)
COMMENT 'Detail category inforamtion, Dimension Table'
ROW FORMAT SERDE 
  'org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe' 
WITH SERDEPROPERTIES ( 
  'field.delim'=',', 
  'serialization.format'=',') 
STORED AS INPUTFORMAT 
  'org.apache.hadoop.mapred.TextInputFormat' 
OUTPUTFORMAT 
  'org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat'
LOCATION
  'hdfs://bigdata/user/hive/warehouse/kylin_category_groupings'
TBLPROPERTIES (
  'transient_lastDdlTime'='1580892439')

维度表 kylin_country

CREATE TABLE `kylin_country`(
  `country` string, 
  `latitude` double, 
  `longitude` double, 
  `name` string)
ROW FORMAT SERDE 
  'org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe' 
WITH SERDEPROPERTIES ( 
  'field.delim'=',', 
  'serialization.format'=',') 
STORED AS INPUTFORMAT 
  'org.apache.hadoop.mapred.TextInputFormat' 
OUTPUTFORMAT 
  'org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat'
LOCATION
  'hdfs://bigdata/user/hive/warehouse/kylin_country'
TBLPROPERTIES (
  'transient_lastDdlTime'='1580892438')

模型关系图

上一篇 下一篇

猜你喜欢

热点阅读