1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
import os
import sys
sys.path.append(os.path.dirname(sys.path[0]))
from utils.ssh_util import SSHUtil
from utils.common_util import CommonUtil, DateTypes
from utils.db_util import DBUtil
if __name__ == '__main__':
    # Export the Hive table dwt_aba_last_change_rate into a PostgreSQL table.
    #
    # Positional command-line arguments:
    #   1: site_name  - used as the prefix of the target table name
    #   2: date_type  - a DateTypes member name (e.g. last30day, last365day)
    #   3: date_info  - the date value of the partition being exported
    #   last: pass 'test' to export into the test database instead of production
    site_name = CommonUtil.get_sys_arg(1, None)
    date_type = CommonUtil.get_sys_arg(2, None)
    date_info = CommonUtil.get_sys_arg(3, None)
    # Read the last argument to decide whether to export to the test environment.
    test_flag = CommonUtil.get_sys_arg(len(sys.argv) - 1, None)
    print(f"执行参数为{sys.argv}")

    if test_flag == 'test':
        db_type = 'postgresql_test'
        print("导出到PG测试库中")
    else:
        db_type = "postgresql"
        print("导出到PG正式库中")

    # Obtain the database connection.
    engine = DBUtil.get_db_engine(db_type, site_name)
    # Base name of the export table.
    export_base_tb = f"{site_name}_aba_last_change_rate"

    # last30day / last365day data is loaded into a "_copy" table first and
    # exchanged with the real table after the export; every other date type is
    # written straight into a partition of the base table.
    swap_via_copy = date_type in (DateTypes.last30day.name, DateTypes.last365day.name)

    if swap_via_copy:
        export_tb_target = f"{export_base_tb}_{date_type}"  # us_aba_last_change_rate_last30day / _last365day
        export_tb_copy = f"{export_tb_target}_copy"
        export_tb = export_tb_copy
        # Create the copy table if it does not exist yet, then empty it.
        sql = f"""
create table if not exists {export_tb_copy}
(
like {export_tb_target} including indexes including comments
);
truncate table {export_tb_copy};
"""
        DBUtil.engine_exec_sql(engine, sql)
    else:
        # Export for date types such as day, week and month.
        date_partition = str(date_info).replace("-", "_")
        export_tb = f"{site_name}_aba_last_change_rate_{date_type}_{date_partition}"
        next_val = CommonUtil.get_next_val(date_type, date_info)
        # Create the partition (if missing) and empty it before exporting.
        sql = f"""
create table if not exists {export_tb} partition of {export_base_tb} for values from ('{date_type}', '{date_info}') to ('{date_type}', '{next_val}');
truncate table {export_tb};
"""
        DBUtil.engine_exec_sql(engine, sql)

    # Build the export command for the chosen target table.
    # NOTE(review): presumably a shell command string, since it is handed to
    # SSHUtil.exec_command_async below - confirm against CommonUtil.
    sh = CommonUtil.build_export_sh(
        site_name=site_name,
        db_type=db_type,
        hive_tb="dwt_aba_last_change_rate",
        export_tb=export_tb,
        col=[
            "search_term",
            "search_term_id",
            "date_type",
            "date_info",
            "rank_change_rate",
            "bsr_orders_change_rate",
            "cn_seller_change_rate",
            "fbm_change_rate",
            "amazon_change_rate",
            "rank_rate_of_change",
            "bsr_orders_rate_of_change",
            "cn_seller_rate_of_change",
            "fbm_rate_of_change",
            "amazon_rate_of_change",
            "created_time",
            "updated_time"
        ],
        partition_dict={
            "site_name": site_name,
            "date_type": date_type,
            "date_info": date_info
        }
    )

    client = SSHUtil.get_ssh_client()
    try:
        SSHUtil.exec_command_async(client, sh, ignore_err=False)
    finally:
        # Always release the SSH connection, including when the export command
        # raises; an exception still propagates, so the table exchange below
        # is skipped on failure exactly as before.
        client.close()

    if swap_via_copy:
        # The data has to be replaced by exchanging the copy table with the
        # target table.
        DBUtil.exchange_tb(engine, export_tb_copy, export_tb_target, cp_index_flag=False)