Skip to content
项目
群组
代码片段
帮助
正在加载...
帮助
提交反馈
为 GitLab 提交贡献
登录
切换导航
L
label
项目
项目
详情
动态
版本
周期分析
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
统计图
成员
成员
收起侧边栏
Close sidebar
动态
分支图
统计图
提交
打开侧边栏
zhenxin.ma
label
提交
bb76e55c
提交
bb76e55c
编写于
9月 18, 2020
作者:
wuyunfeng
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
修改sessionpref表名
上级
5c56dda7
变更
3
隐藏空白字符变更
内嵌
并排
正在显示
3 个修改的文件
包含
7 行增加
和
6 行删除
+7
-6
MyConfigSession.scala
src/main/scala/com/config/MyConfigSession.scala
+1
-1
SessionProcessPref.scala
src/main/scala/com/session/SessionProcessPref.scala
+2
-1
SessionProcessTerm.scala
src/main/scala/com/session/SessionProcessTerm.scala
+4
-4
未找到文件。
src/main/scala/com/config/MyConfigSession.scala
浏览文件 @
bb76e55c
...
...
@@ -9,7 +9,7 @@ package com.config
*/
object
MyConfigSession
{
//Hive的DW层流量表
- final val HIVE_TABLE0: String = "pica_dw.dw_fact_log_session_pref"
+ final val HIVE_TABLE0: String = "pica_ods.ods_log_session_pref"
final
val
HIVE_TABLE1_TMP
:
String
=
"pica_dw.dw_fact_log_session_tmp"
final
val
HIVE_TABLE2_TMP
:
String
=
"pica_dw.dw_fact_log_session_path_tmp"
final
val
HIVE_TABLE1
:
String
=
"pica_dw.dw_fact_log_session"
...
...
src/main/scala/com/session/SessionProcessPref.scala
浏览文件 @
bb76e55c
...
...
@@ -54,6 +54,7 @@ object SessionProcessPref {
var
index
=
0
val
conditionGroup
=
List
(
"<='4' "
,
"between '5' and '9'"
,
">'9'"
)
for
(
condition
<-
conditionGroup
){
index
+=
1
val
slideDF
=
sourceDF
.
where
(
s
" SUBSTRING(pseudo_session,1,1) ${condition}"
).
repartition
(
100
)
println
(
s
"-----------------------------------compute refer columns,condition=${condition}-----------------------------------------"
)
//step2:抽取出当天pseudo_session对应的非空的device_token,doctor_id,mobile,补充到对应的pseudo_session下这几项为空的记录中
...
...
@@ -243,7 +244,7 @@ class SessionProcessPref extends java.io.Serializable {
if
(
index
!=
1
){
insertSql
=
"insert into"
}
- println(s"-----------------create view ${tmpTable} and load to dw_fact_log_session_pref--------------------")
+ println(s"-----------------create view ${tmpTable} and load to ${MyConfigSession.HIVE_TABLE0}--------------------")
dataFrame
.
repartition
(
10
).
createOrReplaceTempView
(
tmpTable
)
val
fields
=
List
(
"pseudo_session"
,
"user_id"
,
"COALESCE(cast(user_id as int),0) user_id_int"
,
"mobile"
,
"device_token"
,
"user_token"
,
"view_class"
,
"view_path"
,
"action"
,
"action_type"
,
"component_tag"
,
"menu_code"
,
"menu_code_new"
,
"action_code"
,
"position"
,
"label_value"
,
"label_class"
,
"module_class1"
,
"module_class2"
,
"app_version"
,
"device_type"
,
"device_brand"
,
...
...
src/main/scala/com/session/SessionProcessTerm.scala
浏览文件 @
bb76e55c
...
...
@@ -46,7 +46,7 @@ object SessionProcessTerm {
var
condition
=
" 1=1"
if
(
args
.
length
>=
1
)
{
scnData
=
args
(
0
)
- if (args.length > 1){
+ if (args.length > 1 && args(1)!=""){
condition
=
args
(
1
)
}
}
...
...
@@ -90,9 +90,9 @@ object SessionProcessTerm {
println
(
"selectDF.show========"
)
selectDF
.
printSchema
()
println
(
"selectDF.count========="
,
selectDF
.
count
())
- // val conditionGroup = List("<='4' ","between '5' and '9'",">'9'")
- val conditionGroup = List("='0'","='1'","='2'","='3'","='4'","='5'","='6'","='7'","='8'","='9'",
-   "='a'","='b'","='c'","='d'","='e'","='f'")
+ val conditionGroup = List("<='4' ","between '5' and '9'",">'9'")
+ // val conditionGroup = List("='0'","='1'","='2'","='3'","='4'","='5'","='6'","='7'","='8'","='9'",
+ //   "='a'","='b'","='c'","='d'","='e'","='f'")
var
dataCount
=
0
var
index
=
0
selectDF
.
persist
(
StorageLevel
.
MEMORY_AND_DISK_SER
)
...
...
写
预览
Markdown
格式
0%
请重试
or
附加一个文件
附加文件
取消
您添加了
0
人
到此讨论。请谨慎行事。
先完成此消息的编辑!
取消
想要评论请
注册
或
登录