数据分析指标
| 1. 基于时间维度(①每月用户的访问指标 ②每天用户的访问指标 ③每小时用户的访问指标) 重写数据 |
| 2. 基于用户维度(不同年龄段用户的访问量指标) 重写数据 |
| 3. 基于地理维度(每个分区下不同省份用户的访问指标) 追加数据 |
创建时间维度表及导入数据
| |
| |
| |
| |
| |
| create table if not exists month_pvs( |
| visit_year string, |
| visit_month string, |
| pvs int |
| ) row format delimited |
| fields terminated by ','; |
| |
| |
| |
| insert overwrite table month_pvs |
| select visit_month, visit_year, count(*) as pvs |
| from web_detail |
| group by visit_month, visit_year; |
| |
| |
| |
| create table if not exists day_pvs( |
| visit_year string, |
| visit_month string, |
| visit_day string, |
| pvs int |
| ) row format delimited |
| fields terminated by ','; |
| |
| |
| insert overwrite table day_pvs |
| select visit_year, visit_month, visit_day, count(*) as pvs |
| from web_detail |
| group by visit_year, visit_month, visit_day; |
| |
| |
| |
| |
| |
| |
| create table if not exists hour_pvs( |
| visit_year string, |
| visit_month string, |
| visit_day string, |
| visit_hour string, |
| pvs int |
| ) row format delimited |
| fields terminated by ','; |
| |
| |
| |
| insert overwrite table hour_pvs |
| select visit_year, visit_month, visit_day, visit_hour, count(*) as pvs |
| from web_detail |
| group by visit_year, visit_month, visit_day, visit_hour; |
创建用户维度表及导入数据
| |
| |
| |
| |
| |
| |
| |
| |
| create table if not exists age_pvs( |
| age_range string, |
| pvs int |
| ) row format delimited fields terminated by ","; |
| |
| insert overwrite table age_pvs |
| select tmp.ageDuan age_range, count(*) pvs |
| from |
| ( |
| select |
| case |
| when (age between 0 and 18) then "少年人" |
| when (age between 18 and 40) then "青年人" |
| when (age between 40 and 65) then "中年" |
| else "老年" |
| end as ageDuan |
| from web_detail |
| ) tmp |
| group by tmp.ageDuan; |
创建地理维度表及导入数据
| |
| |
| |
| |
| |
| create table if not exists area_pvs( |
| logdate string, |
| provice string, |
| latitude string, |
| longitude string, |
| pvs int |
| ) row format delimited fields terminated by ","; |
| |
| |
| -- 追加写 |
| insert into table area_pvs |
| select logdate, province, latitude, longitude, count(*) as pvs |
| from web_detail |
| where logdate ="${hiveconf:yesterday}" |
| -- where logdate ="20220808" |
| group by province, latitude, longitude, logdate; |
【推荐】国内首个AI IDE,深度理解中文开发场景,立即下载体验Trae
【推荐】编程新体验,更懂你的AI,立即体验豆包MarsCode编程助手
【推荐】抖音旗下AI助手豆包,你的智能百科全书,全免费不限次数
【推荐】轻量又高性能的 SSH 工具 IShell:AI 加持,快人一步
· TypeScript + Deepseek 打造卜卦网站:技术与玄学的结合
· Manus的开源复刻OpenManus初探
· AI 智能体引爆开源社区「GitHub 热点速览」
· 三行代码完成国际化适配,妙~啊~
· .NET Core 中如何实现缓存的预热?