当前位置: 首页 > news >正文

建筑网站视频大全广东商城网站建设价格低

建筑网站视频大全,广东商城网站建设价格低,公司查询信息查询,wordpress地方门户主题视频地址#xff1a;尚硅谷大数据项目《在线教育之离线数仓》_哔哩哔哩_bilibili 目录 第8章 数仓开发之DIM层 P039 P040 P041 P042 P043 P044 P045 P046 P047 P048 第8章 数仓开发之DIM层 P039 第8章 数仓开发之DIM层 DIM层设计要点#xff1a; #xff08;1尚硅谷大数据项目《在线教育之离线数仓》_哔哩哔哩_bilibili 目录 第8章 数仓开发之DIM层 P039 P040 P041 P042 P043 P044 P045 P046 P047 P048 第8章 数仓开发之DIM层 P039 第8章 数仓开发之DIM层 DIM层设计要点 1DIM层的设计依据是维度建模理论该层存储维度模型的维度表。 2DIM层的数据存储格式为orc列式存储snappy压缩。 3DIM层表名的命名规范为dim_表名_全量表或者拉链表标识full/zip。 [2023-08-21 10:21:33] org.apache.hadoop.hive.ql.parse.SemanticException:Failed to get a spark session: org.apache.hadoop.hive.ql.metadata.HiveException: Failed to create Spark client for Spark session 2ed82e1b-8afb-4ad0-9ed2-0f84191a4343 P040 show databases;use edu2077;show tables;--8.1 章节维度表全量 DROP TABLE IF EXISTS dim_chapter_full; CREATE EXTERNAL TABLE dim_chapter_full (id STRING COMMENT 章节ID,chapter_name STRING COMMENT 章节名称,course_id STRING COMMENT 课程ID,video_id STRING COMMENT 视频ID,publisher_id STRING COMMENT 发布者ID,is_free STRING COMMENT 是否免费,create_time STRING COMMENT 创建时间,update_time STRING COMMENT 更新时间 ) COMMENT 章节维度表PARTITIONED BY (dt STRING)STORED AS ORCLOCATION /warehouse/edu/dim/dim_chapter_full/TBLPROPERTIES (orc.compress snappy);--数据装载 --insert overwrite覆盖写insert into会造成数据重复。 insert overwrite table dim_chapter_full partition (dt 2022-02-21) select id,chapter_name,course_id,video_id,publisher_id,is_free,create_time,update_time from ods_chapter_info_full where dt 2022-02-21;select * from dim_chapter_full;--8.2 课程维度表全量 DROP TABLE IF EXISTS dim_course_full; CREATE EXTERNAL TABLE dim_course_full (id STRING COMMENT 编号,course_name STRING COMMENT 课程名称,subject_id STRING COMMENT 学科id,subject_name STRING COMMENT 学科名称,category_id STRING COMMENT 分类id,category_name STRING COMMENT 分类名称,teacher STRING COMMENT 讲师名称,publisher_id STRING COMMENT 发布者id,chapter_num BIGINT COMMENT 章节数,origin_price decimal(16, 2) COMMENT 价格,reduce_amount decimal(16, 2) COMMENT 优惠金额,actual_price decimal(16, 2) COMMENT 实际价格,create_time STRING COMMENT 创建时间,update_time STRING COMMENT 更新时间,chapters ARRAYSTRUCTchapter_id : STRING,chapter_name : STRING, video_id : STRING,is_free: STRING COMMENT 章节 ) COMMENT 课程维度表PARTITIONED BY (dt STRING)STORED AS ORCLOCATION /warehouse/edu/dim/dim_course_full/TBLPROPERTIES (orc.compress snappy);select * from ods_base_source_full where dt 2022-02-21;select * from ods_course_info_full where dt 2022-02-21;select * from (select id,course_name,course_slogan,subject_id,teacher,publisher_id,chapter_num,origin_price,reduce_amount,actual_price,course_introduce,create_time,update_timefrom ods_course_info_fullwhere dt 2022-02-21) ci;--ci是别名with ci as (select id,course_name,course_slogan,subject_id,teacher,publisher_id,chapter_num,origin_price,reduce_amount,actual_price,course_introduce,create_time,update_timefrom ods_course_info_fullwhere dt 2022-02-21 ),bci as (select id, category_namefrom ods_base_category_info_fullwhere dt 2022-02-21),bs as (select id, subject_name, category_idfrom ods_base_subject_info_fullwhere dt 2022-02-21),chapter as (select course_id,--chapter_id : STRING,chapter_name : STRING, video_id : STRING,is_free : STRINGcollect_set(named_struct(chapter_id, id, chapter_name, chapter_name,video_id, video_id, is_free, is_free)) csfrom ods_chapter_info_fullwhere dt 2022-02-21group by course_id) insert overwrite table dim_course_full partition (dt 2022-02-21) select ci.id,course_name,subject_id,subject_name,category_id,category_name,teacher,publisher_id,chapter_num,origin_price,reduce_amount,actual_price,create_time,update_time,cs chapters from cileft join bson ci.subject_id bs.idleft join bcion bs.category_id bci.idleft join chapteron ci.id chapter.course_id;--desc function extended named_struct;select * from dim_course_full; P041 --8.3 视频维度表全量 show databases;--8.3 视频维度表全量 DROP TABLE IF EXISTS dim_video_full; CREATE EXTERNAL TABLE dim_video_full (id STRING COMMENT 编号,video_name STRING COMMENT 视频名称,during_sec BIGINT COMMENT 时长,video_status STRING COMMENT 状态 未上传上传中上传完,video_size BIGINT COMMENT 大小,version_id STRING COMMENT 版本号,chapter_id STRING COMMENT 章节id,chapter_name STRING COMMENT 章节名称,is_free STRING COMMENT 是否免费,course_id STRING COMMENT 课程id,publisher_id STRING COMMENT 发布者id,create_time STRING COMMENT 创建时间,update_time STRING COMMENT 更新时间 ) COMMENT 视频维度表PARTITIONED BY (dt STRING)STORED AS ORCLOCATION /warehouse/edu/dim/dim_video_zip/TBLPROPERTIES (orc.compress snappy);select * from ods_video_info_full where dt 2022-02-21;insert overwrite table dim_video_full partition (dt 2022-02-21) select id,video_name,during_sec,video_status,video_size,version_id,chapter_id,chapter_name,is_free,course_id,publisher_id,create_time,update_time from (select id,video_name,during_sec,video_status,video_size,video_url,video_source_id,version_id,chapter_id,course_id,publisher_id,create_time,update_time,deletedfrom ods_video_info_fullwhere dt 2022-02-21and deleted 0) vileft join(select chapter_name,video_id,is_freefrom ods_chapter_info_fullwhere dt 2022-02-21 ) cion vi.id ci.video_id;select * from dim_video_full;insert overwrite table dim_video_full partition (dt 2022-02-21) select vt.id,video_name,during_sec,video_status,video_size,version_id,chapter_id,chapter_name,is_free,course_id,publisher_id,create_time,update_time from (select id,video_name,during_sec,video_status,video_size,version_id,chapter_id,course_id,publisher_id,create_time,update_timefrom ods_video_info_fullwhere dt 2022-02-21and deleted 0) vtjoin(select id,chapter_name,is_freefrom ods_chapter_info_fullwhere dt 2022-02-21) chton vt.chapter_id cht.id; org.apache.hadoop.hive.ql.parse.SemanticException:Failed to get a spark session: org.apache.hadoop.hive.ql.metadata.HiveException: Failed to create Spark client for Spark session 2519dff0-c795-4852-a1b4-f40ad1750136 2023/8/23 14:50    t004.sql: insert overwrite table dim_vi…     on vt.chapter_id cht.id... failed. 15:00    t004.sql: insert overwrite table dim_vi…     on vt.chapter_id cht.id... failed. org.apache.hadoop.hive.ql.parse.SemanticException:Failed to get a spark session: org.apache.hadoop.hive.ql.metadata.HiveException: Failed to create Spark client due to invalid resource request: Required executor memory (2048 MB), offHeap memory (0) MB, overhead (384 MB), and PySpark memory (0 MB) is above the max threshold (2048 MB) 报错-hive on spark执行数据导入脚本报错_dyson不只是吹风机的博客-CSDN博客 [atguigunode001 hadoop]$ myhadoop.sh start 启动 hadoop集群 ---------------- 启动 hdfs ---------------- Starting namenodes on [node001] Starting datanodes Starting secondary namenodes [node003]--------------- 启动 yarn --------------- Starting resourcemanager Starting nodemanagers--------------- 启动 historyserver --------------- [atguigunode001 hadoop]$ cd /opt/module/hive/hive-3.1.2/ [atguigunode001 hive-3.1.2]$ nohup bin/hive [1] 11485 [atguigunode001 hive-3.1.2]$ nohup: 忽略输入并把输出追加到nohup.out[atguigunode001 hive-3.1.2]$ nohup bin/hive --service hiveserver2 [2] 11626 [atguigunode001 hive-3.1.2]$ nohup: 忽略输入并把输出追加到nohup.out[atguigunode001 hive-3.1.2]$ jpsallnode001 3872 QuorumPeerMain 4291 Kafka 11381 JobHistoryServer 10583 NameNode 11626 RunJar 10747 DataNode 13660 Jps 13533 YarnCoarseGrainedExecutorBackend 11485 RunJar 11167 NodeManagernode002 7841 Jps 5586 ResourceManager 2946 Kafka 7683 ApplicationMaster 2552 QuorumPeerMain 5384 DataNode 5711 NodeManagernode003 6944 YarnCoarseGrainedExecutorBackend 2256 QuorumPeerMain 5040 SecondaryNameNode 4929 DataNode 2643 Kafka 5158 NodeManager 7047 Jps [atguigunode001 hive-3.1.2]$ P042 8.4 试卷维度表全量 --8.4 试卷维度表全量 DROP TABLE IF EXISTS dim_paper_full; CREATE EXTERNAL TABLE dim_paper_full (id STRING COMMENT 编号,paper_title STRING COMMENT 试卷名称,course_id STRING COMMENT 课程id,create_time STRING COMMENT 创建时间,update_time STRING COMMENT 更新时间,publisher_id STRING COMMENT 发布者id,questions ARRAYSTRUCTquestion_id: STRING, score: DECIMAL(16, 2) COMMENT 题目 ) COMMENT 试卷维度表PARTITIONED BY (dt STRING)STORED AS ORCLOCATION /warehouse/edu/dim/dim_paper_full/TBLPROPERTIES (orc.compress snappy);select * from ods_test_paper_full;insert overwrite table dim_paper_full partition (dt 2022-02-21) select id,paper_title,course_id,create_time,update_time,publisher_id,qs from (select id,paper_title,course_id,create_time,update_time,publisher_id,deletedfrom ods_test_paper_fullwhere dt 2022-02-21--and deleted 0) tpleft join (select paper_id,--question_id: STRING, score: DECIMAL(16, 2)collect_set(named_struct(question_id, id, score, score)) qsfrom ods_test_paper_question_fullwhere dt 2022-02-21and deleted 0group by paper_id ) pqon tp.id pq.paper_id;select * from dim_paper_full; P043 8.5 来源维度表全量 8.6 题目维度表全量 8.7 地区维度表全量 --8.5 来源维度表全量 DROP TABLE IF EXISTS dim_source_full; CREATE EXTERNAL TABLE dim_source_full (id STRING COMMENT 编号,source_site STRING COMMENT 来源 ) COMMENT 来源维度表PARTITIONED BY (dt STRING)STORED AS ORCLOCATION /warehouse/edu/dim/dim_source_full/TBLPROPERTIES (orc.compress snappy);insert overwrite table edu2077.dim_source_full partition (dt 2022-02-21) select id,source_site from edu2077.ods_base_source_full obsf where dt 2022-02-21;select * from dim_source_full;--8.6 题目维度表全量 DROP TABLE IF EXISTS dim_question_full; CREATE EXTERNAL TABLE dim_question_full (id STRING COMMENT 编号,chapter_id STRING COMMENT 章节id,course_id STRING COMMENT 课程id,question_type BIGINT COMMENT 题目类型,create_time STRING COMMENT 创建时间,update_time STRING COMMENT 更新时间,publisher_id STRING COMMENT 发布者id ) COMMENT 题目维度表PARTITIONED BY (dt STRING)STORED AS ORCLOCATION /warehouse/edu/dim/dim_question_full/TBLPROPERTIES (orc.compress snappy);insert overwrite table edu2077.dim_question_fullpartition (dt 2022-02-21) select id,chapter_id,course_id,question_type,create_time,update_time,publisher_id from edu2077.ods_test_question_info_full where deleted 0and dt 2022-02-21;select * from dim_question_full;--8.7 地区维度表全量 DROP TABLE IF EXISTS dim_province_full; CREATE EXTERNAL TABLE dim_province_full (id STRING COMMENT 编号,name STRING COMMENT 省名称,region_id STRING COMMENT 地区id,area_code STRING COMMENT 行政区位码,iso_code STRING COMMENT 国际编码,iso_3166_2 STRING COMMENT ISO3166编码 ) COMMENT 地区维度表PARTITIONED BY (dt STRING)STORED AS ORCLOCATION /warehouse/edu/dim/dim_province_full/TBLPROPERTIES (orc.compress snappy);insert overwrite table edu2077.dim_province_full partition (dt 2022-02-21) select id,name,region_id,area_code,iso_code,iso_3166_2 from edu2077.ods_base_province_full where dt 2022-02-21;select * from dim_province_full; P044 8.8 时间维度表特殊 --8.8 时间维度表特殊 DROP TABLE IF EXISTS dim_date; CREATE EXTERNAL TABLE dim_date (date_id STRING COMMENT 日期id,week_id STRING COMMENT 周id,一年中的第几周,week_day STRING COMMENT 周几,day STRING COMMENT 每月的第几天,month STRING COMMENT 一年中的第几月,quarter STRING COMMENT 一年中的第几季度,year STRING COMMENT 年份,is_workday STRING COMMENT 是否是工作日,holiday_id STRING COMMENT 节假日 ) COMMENT 时间维度表STORED AS ORCLOCATION /warehouse/edu/dim/dim_date/TBLPROPERTIES (orc.compress snappy);DROP TABLE IF EXISTS tmp_dim_date_info; CREATE EXTERNAL TABLE tmp_dim_date_info (date_id STRING COMMENT 日,week_id STRING COMMENT 周id,week_day STRING COMMENT 周几,day STRING COMMENT 每月的第几天,month STRING COMMENT 第几月,quarter STRING COMMENT 第几季度,year STRING COMMENT 年,is_workday STRING COMMENT 是否是工作日,holiday_id STRING COMMENT 节假日 ) COMMENT 时间维度表ROW FORMAT DELIMITED FIELDS TERMINATED BY \tLOCATION /warehouse/edu/tmp/tmp_dim_date_info/;insert overwrite table dim_date select * from tmp_dim_date_info;insert overwrite table dim_date select date_id,week_id,week_day,day,month,quarter,year,is_workday,holiday_id from tmp_dim_date_info;select * from dim_date; P045 8.9 用户维度表拉链表 --8.9 用户维度表拉链表 DROP TABLE IF EXISTS dim_user_zip; CREATE EXTERNAL TABLE dim_user_zip (id STRING COMMENT 编号,login_name STRING COMMENT 用户名称,nick_name STRING COMMENT 用户昵称,real_name STRING COMMENT 用户姓名,phone_num STRING COMMENT 手机号,email STRING COMMENT 邮箱,user_level STRING COMMENT 用户级别,birthday STRING COMMENT 用户生日,gender STRING COMMENT 性别 M男,F女,create_time STRING COMMENT 创建时间,operate_time STRING COMMENT 修改时间,status STRING COMMENT 状态,start_date STRING COMMENT 开始日期,end_date STRING COMMENT 结束日期 ) COMMENT 用户表PARTITIONED BY (dt STRING)STORED AS ORCLOCATION /warehouse/edu/dim/dim_user_zip/TBLPROPERTIES (orc.compress snappy); P046 8.9 用户维度表拉链表 3首日装载 inc等增量表没有数据尚硅谷在线教育系统项目ods_user_info_inc这个增量表没有数据课件上也没有相关操作有空帮我看看应该是执行hdfs_to_ods_db.sh这个数据装载脚本的时候增量表数据没有被添加到hdfs里面。 启动Maxwell后再执行hdfs_to_ods_db.sh脚本就行了。 {id:3,login_name:tws1uxb5r,nick_name:进林,passwd:null,real_name:贺进林,phone_num:13443888468,email:tws1uxb5raol.com,head_img:null,user_level:1,birthday:1987-06-16,gender:null,create_time:2022-02-16 00:00:00,operate_time:null,status:null} {id:3,login_name:tws1uxb5r,nick_name:进林,passwd:null,real_name:贺进林,phone_num:13443888468,email:tws1uxb5raol.com,head_img:null,user_level:1,birthday:1987-06-16,gender:null,create_time:2022-02-16 00:00:00,operate_time:null,status:null } --8.9 用户维度表拉链表 DROP TABLE IF EXISTS dim_user_zip; CREATE EXTERNAL TABLE dim_user_zip (id STRING COMMENT 编号,login_name STRING COMMENT 用户名称,nick_name STRING COMMENT 用户昵称,real_name STRING COMMENT 用户姓名,phone_num STRING COMMENT 手机号,email STRING COMMENT 邮箱,user_level STRING COMMENT 用户级别,birthday STRING COMMENT 用户生日,gender STRING COMMENT 性别 M男,F女,create_time STRING COMMENT 创建时间,operate_time STRING COMMENT 修改时间,status STRING COMMENT 状态,start_date STRING COMMENT 开始日期,end_date STRING COMMENT 结束日期 ) COMMENT 用户表PARTITIONED BY (dt STRING)STORED AS ORCLOCATION /warehouse/edu/dim/dim_user_zip/TBLPROPERTIES (orc.compress snappy);select * from edu2077.ods_user_info_inc where dt 2022-02-21;select * from edu2077.ods_user_info_inc where dt 2022-02-21and type bootstrap-insert;select data.id,data.login_name,data.nick_name,data.passwd,data.real_name,data.phone_num,data.email,data.head_img,data.user_level,data.birthday,data.gender,data.create_time,data.operate_time,data.status from edu2077.ods_user_info_inc where dt 2022-02-21and type bootstrap-insert;insert overwrite table edu2077.dim_user_zip partition (dt 9999-12-31) select data.id,data.login_name,data.nick_name,md5(data.real_name),md5(if(data.phone_num regexp ^(13[0-9]|14[01456879]|15[0-35-9]|16[2567]|17[0-8]|18[0-9]|19[0-35-9])\\d{8}$,data.phone_num, null)),md5(if(data.email regexp ^[a-zA-Z0-9_-][a-zA-Z0-9_-](\\.[a-zA-Z0-9_-])$, data.email, null)),data.user_level,data.birthday,data.gender,data.create_time,data.operate_time,data.status,2022-02-21 start_date,9999-12-31 end_date from edu2077.ods_user_info_inc where dt 2022-02-21and type bootstrap-insert;select * from dim_user_zip; P047 8.9 用户维度表拉链表 4每日装载 --8.9 用户维度表拉链表 --4每日装载 select * from edu2077.ods_user_info_inc where dt 2022-02-21;select * from edu2077.ods_user_info_inc where dt 2022-02-22;select * from dim_user_zip where dt 9999-12-31;select data.id,data.login_name,data.nick_name,md5(data.real_name),md5(if(data.phone_num regexp ^(13[0-9]|14[01456879]|15[0-35-9]|16[2567]|17[0-8]|18[0-9]|19[0-35-9])\\d{8}$,data.phone_num, null)),md5(if(data.email regexp ^[a-zA-Z0-9_-][a-zA-Z0-9_-](\\.[a-zA-Z0-9_-])$, data.email, null)),data.user_level,data.birthday,data.gender,data.create_time,data.operate_time,data.status,2022-02-21 start_date,9999-12-31 end_date from edu2077.ods_user_info_inc where dt 2022-02-22;select id,login_name,nick_name,real_name,phone_num,email,user_level,birthday,gender,create_time,operate_time,status,start_date from dim_user_zip where dt 9999-12-31 union select data.id,data.login_name,data.nick_name,md5(data.real_name),md5(if(data.phone_num regexp ^(13[0-9]|14[01456879]|15[0-35-9]|16[2567]|17[0-8]|18[0-9]|19[0-35-9])\\d{8}$,data.phone_num, null)),md5(if(data.email regexp ^[a-zA-Z0-9_-][a-zA-Z0-9_-](\\.[a-zA-Z0-9_-])$, data.email, null)),data.user_level,data.birthday,data.gender,data.create_time,data.operate_time,data.status,2022-02-21 start_date,9999-12-31 end_datefrom edu2077.ods_user_info_inc where dt 2022-02-22;set hive.exec.dynamic.partition.modenonstrict;--关闭严格模式 insert overwrite table edu2077.dim_user_zip partition (dt) select id,login_name,nick_name,real_name,phone_num,email,user_level,birthday,gender,create_time,operate_time,status,start_date,if(rn 1, 9999-12-31, date_sub(2022-02-22, 1)) end_date,if(rn 1, 9999-12-31, date_sub(2022-02-22, 1)) dt from (select id,login_name,nick_name,real_name,phone_num,email,user_level,birthday,gender,create_time,operate_time,status,start_date,end_date,row_number() over (partition by id order by start_date desc) rnfrom (select id,login_name,nick_name,real_name,phone_num,email,user_level,birthday,gender,create_time,operate_time,status,start_date,end_datefrom edu2077.dim_user_zipwhere dt 9999-12-31unionselect id,login_name,nick_name,real_name,phone_num,email,user_level,birthday,gender,create_time,operate_time,status,2020-02-22 start_date,9999-12-31 end_datefrom (select data.id,data.login_name,data.nick_name,md5(data.real_name) real_name,md5(if(data.phone_num regexp^(13[0-9]|14[01456879]|15[0-35-9]|16[2567]|17[0-8]|18[0-9]|19[0-35-9])\\d{8}$,data.phone_num, null)) phone_num,md5(if(data.email regexp ^[a-zA-Z0-9_-][a-zA-Z0-9_-](\\.[a-zA-Z0-9_-])$,data.email, null)) email,data.user_level,data.birthday,data.gender,data.create_time,data.operate_time,data.status,row_number() over (partition by data.id order by ts desc) rnfrom edu2077.ods_user_info_incwhere dt 2022-02-22) t1where rn 1) t2) t3; P048 8.10 数据装载脚本 8.10.1 首日装载脚本 8.10.2 每日装载脚本 #vim ods_to_dim_init.sh#!/bin/bash if [ -n $2 ] ;thendo_date$2 elseecho 请传入日期参数exit fiAPPedudim_chapter_full insert overwrite table ${APP}.dim_chapter_fullpartition (dt $do_date) select id,chapter_name,course_id,video_id,publisher_id,is_free,create_time,update_time from ${APP}.ods_chapter_info_full where deleted 0and dt $do_date;dim_course_full with a as(select id, category_namefrom ${APP}.ods_base_category_info_fullwhere deleted 0and dt $do_date),b as(select id, subject_name, category_idfrom ${APP}.ods_base_subject_info_fullwhere deleted 0and dt $do_date),c as(select id,course_name,subject_id,teacher,publisher_id,chapter_num,origin_price,reduce_amount,actual_price,create_time,update_timefrom ${APP}.ods_course_info_fullwhere deleted 0and dt $do_date),d as(select course_id,collect_set(named_struct(chapter_id, id, chapter_name, chapter_name, video_id, video_id, is_free, is_free)) chaptersfrom ${APP}.ods_chapter_info_fullwhere deleted 0and dt $do_dategroup by course_id) insert overwrite table ${APP}.dim_course_full partition(dt $do_date) select c.id,course_name,subject_id,subject_name,category_id,category_name,teacher,publisher_id,chapter_num,origin_price,reduce_amount,actual_price,create_time,update_time,chapters from cleft join bon c.subject_id b.idleft join aon b.category_id a.idleft join don c.id d.course_id;dim_video_full insert overwrite table ${APP}.dim_video_full partition (dt $do_date) select vt.id,video_name,during_sec,video_status,video_size,version_id,chapter_id,chapter_name,is_free,course_id,publisher_id,create_time,update_time from (select id,video_name,during_sec,video_status,video_size,version_id,chapter_id,course_id,publisher_id,create_time,update_timefrom ${APP}.ods_video_info_fullwhere dt $do_date and deleted 0) vtjoin(select id,chapter_name,is_freefrom ${APP}.ods_chapter_info_fullwhere dt $do_date) chton vt.chapter_id cht.id;dim_paper_full insert overwrite table ${APP}.dim_paper_full partition (dt $do_date) select t1.id,paper_title,course_id,create_time,update_time,publisher_id,questions from ${APP}.ods_test_paper_full t1left join(select paper_id,collect_set(named_struct(question_id, question_id, score, score)) questionsfrom ${APP}.ods_test_paper_question_fullwhere deleted 0 and dt $do_dategroup by paper_id) t2on t1.id t2.paper_id where t1.deleted 0 and t1.dt $do_date;dim_source_full insert overwrite table ${APP}.dim_source_full partition (dt $do_date) select id,source_site from ${APP}.ods_base_source_full obsf where dt $do_date;dim_question_full insert overwrite table ${APP}.dim_question_fullpartition (dt $do_date) select id,chapter_id,course_id,question_type,create_time,update_time,publisher_id from ${APP}.ods_test_question_info_full where deleted 0and dt $do_date;dim_province_full insert overwrite table ${APP}.dim_province_full partition (dt $do_date) select id,name,region_id,area_code,iso_code,iso_3166_2 from ${APP}.ods_base_province_full where dt $do_date;dim_user_zip insert overwrite table ${APP}.dim_user_zippartition (dt 9999-12-31) select data.id,data.login_name,data.nick_name,md5(data.real_name),md5(if(data.phone_num regexp ^(13[0-9]|14[01456879]|15[0-35-9]|16[2567]|17[0-8]|18[0-9]|19[0-35-9])\\d{8}$,data.phone_num,null)),md5(if(data.email regexp ^[a-zA-Z0-9_-][a-zA-Z0-9_-](\\.[a-zA-Z0-9_-])$,data.email,null)),data.user_level,data.birthday,data.gender,data.create_time,data.operate_time,data.status,$do_date start_date,9999-12-31 end_date from ${APP}.ods_user_info_inc where dt $do_dateand type bootstrap-insert;case $1 indim_chapter_full|dim_course_full|dim_video_full|dim_paper_full|dim_source_full|dim_question_full|dim_province_full|dim_user_zip)eval hive -e \\$$1\;;all )hive -e ${dim_chapter_full}${dim_course_full}${dim_video_full}${dim_paper_full}${dim_source_full}${dim_question_full}${dim_province_full}${dim_user_zip};; esac #vim ods_to_dim.sh#!/bin/bash if [ -n $2 ] ;thendo_date$2 elsedo_datedate -d -1 day %F fiAPPedudim_chapter_full insert overwrite table ${APP}.dim_chapter_fullpartition (dt $do_date) select id,chapter_name,course_id,video_id,publisher_id,is_free,create_time,update_time from ${APP}.ods_chapter_info_full where deleted 0and dt $do_date;dim_course_full with a as(select id, category_namefrom ${APP}.ods_base_category_info_fullwhere deleted 0and dt $do_date),b as(select id, subject_name, category_idfrom ${APP}.ods_base_subject_info_fullwhere deleted 0and dt $do_date),c as(select id,course_name,subject_id,teacher,publisher_id,chapter_num,origin_price,reduce_amount,actual_price,create_time,update_timefrom ${APP}.ods_course_info_fullwhere deleted 0and dt $do_date),d as(select course_id,collect_set(named_struct(chapter_id, id, chapter_name, chapter_name, video_id, video_id, is_free, is_free)) chaptersfrom ${APP}.ods_chapter_info_fullwhere deleted 0and dt $do_dategroup by course_id) insert overwrite table ${APP}.dim_course_full partition(dt $do_date) select c.id,course_name,subject_id,subject_name,category_id,category_name,teacher,publisher_id,chapter_num,origin_price,reduce_amount,actual_price,create_time,update_time,chapters from cleft join bon c.subject_id b.idleft join aon b.category_id a.idleft join don c.id d.course_id;dim_video_full insert overwrite table ${APP}.dim_video_full partition (dt $do_date) select vt.id,video_name,during_sec,video_status,video_size,version_id,chapter_id,chapter_name,is_free,course_id,publisher_id,create_time,update_time from (select id,video_name,during_sec,video_status,video_size,version_id,chapter_id,course_id,publisher_id,create_time,update_timefrom ${APP}.ods_video_info_fullwhere dt $do_date and deleted 0) vtjoin(select id,chapter_name,is_freefrom ${APP}.ods_chapter_info_fullwhere dt $do_date) chton vt.chapter_id cht.id;dim_paper_full insert overwrite table ${APP}.dim_paper_full partition (dt $do_date) select t1.id,paper_title,course_id,create_time,update_time,publisher_id,questions from ${APP}.ods_test_paper_full t1left join(select paper_id,collect_set(named_struct(question_id, question_id, score, score)) questionsfrom ${APP}.ods_test_paper_question_fullwhere deleted 0 and dt $do_dategroup by paper_id) t2on t1.id t2.paper_id where t1.deleted 0 and t1.dt $do_date;dim_source_full insert overwrite table ${APP}.dim_source_full partition (dt $do_date) select id,source_site from ${APP}.ods_base_source_full obsf where dt $do_date;dim_question_full insert overwrite table ${APP}.dim_question_fullpartition (dt $do_date) select id,chapter_id,course_id,question_type,create_time,update_time,publisher_id from ${APP}.ods_test_question_info_full where deleted 0and dt $do_date;dim_province_full insert overwrite table ${APP}.dim_province_full partition (dt $do_date) select id,name,region_id,area_code,iso_code,iso_3166_2 from ${APP}.ods_base_province_full where dt $do_date;dim_user_zip set hive.exec.dynamic.partition.modenonstrict; insert overwrite table ${APP}.dim_user_zip partition(dt) selectid,login_name,nick_name,real_name,phone_num,email,user_level,birthday,gender,create_time,operate_time,status,start_date,if(rn1,9999-12-31,date_sub($do_date,1)) end_date,if(rn1,9999-12-31,date_sub($do_date,1)) dt from (selectid,login_name,nick_name,real_name,phone_num,email,user_level,birthday,gender,create_time,operate_time,status,start_date,end_date,row_number() over (partition by id order by start_date desc) rnfrom(selectid,login_name,nick_name,real_name,phone_num,email,user_level,birthday,gender,create_time,operate_time,status,start_date,end_datefrom ${APP}.dim_user_zipwhere dt9999-12-31unionselectid,login_name,nick_name,real_name,phone_num,email,user_level,birthday,gender,create_time,operate_time,status,2020-02-22 start_date,9999-12-31 end_datefrom(selectdata.id,data.login_name,data.nick_name,md5(data.real_name) real_name,md5(if(data.phone_num regexp ^(13[0-9]|14[01456879]|15[0-35-9]|16[2567]|17[0-8]|18[0-9]|19[0-35-9])\\d{8}$,data.phone_num,null)) phone_num,md5(if(data.email regexp ^[a-zA-Z0-9_-][a-zA-Z0-9_-](\\.[a-zA-Z0-9_-])$,data.email,null)) email,data.user_level,data.birthday,data.gender,data.create_time,data.operate_time,data.status,row_number() over (partition by data.id order by ts desc) rnfrom ${APP}.ods_user_info_incwhere dt$do_date)t1where rn1)t2 )t3;case $1 indim_chapter_full|dim_course_full|dim_video_full|dim_paper_full|dim_source_full|dim_question_full|dim_province_full|dim_user_zip)eval hive -e \\$$1\;;all )hive -e ${dim_chapter_full}${dim_course_full}${dim_video_full}${dim_paper_full}${dim_source_full}${dim_question_full}${dim_province_full}${dim_user_zip};; esac
http://www.dnsts.com.cn/news/216182.html

相关文章:

  • 图书网站怎么做保定网络关键词排名
  • 如何做网站地图txt湖北省网站备案
  • 网站开发设计的阶段打游戏一天赚200元
  • 如何创建自己的公司网站手机网站怎么开发
  • 鹿泉企业网站建设什么网站做3d模型能赚钱
  • 怎么推广网站平台中企动力做的网站怎么登陆
  • 做网站的模板广告设计公司怎么找业务
  • 石家庄做网站推广网站设计包括哪些内容
  • 天津网站排名方案怎么修改网站标题
  • 景安网站备案查询众筹网站开发成本
  • 福州市工程建设质量管理网站php网站开发用什么php
  • 做公司集团网站我的免费网
  • 网站限定域名四川住房和城乡建设厅网站电话
  • 网站中的作用网站建设费计入那个科目
  • 长沙公司网站建设网站点击量查询
  • 一个虚拟主机多个网站wordpress动态背景
  • 中小企业网站建设与推广分析无锡室内设计公司
  • 试卷网站在线做做食品的采购员常用网站
  • 这几年做那个网站致富松江手机网站建设
  • 网站开发专业前景wordpress添加备案号插件
  • 深圳集团网站建设海报设计图
  • 网站用ps做还是aiwordpress 摘要长度
  • 一元夺宝网站建设2017wordpress简洁博客主题
  • 建设银行网站首页下载北京 好的网站制作
  • 怎么申请订阅号沈阳seo收费
  • 乐云seo网站建设公司设计网站要多少钱
  • 可以做盗版漫画网站吗设计制作活动主题
  • 外贸网站模板设计军事最新消息今天
  • 推广自身网站深圳市东企网络技术有限公司
  • 辽宁海星建设集团有限公司网站网站设计怎么写