Skip to content
Projects
Groups
Snippets
Help
This project
Loading...
Sign in / Register
Toggle navigation
A
Amazon-Selection-Data
Overview
Overview
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
abel_cjy
Amazon-Selection-Data
Commits
d9e2d8b9
Commit
d9e2d8b9
authored
May 28, 2026
by
fangxingjun
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
no message
parent
1777e202
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
0 additions
and
70 deletions
+0
-70
export_dwt_asin_sync.py
Pyspark_job/sqoop_export/export_dwt_asin_sync.py
+0
-70
No files found.
Pyspark_job/sqoop_export/export_dwt_asin_sync.py
View file @
d9e2d8b9
...
...
@@ -10,76 +10,6 @@ sys.path.append(os.path.dirname(sys.path[0]))
from
utils.secure_db_client
import
get_remote_engine
# def update_workflow_manager(site_name, date_type, date_info):
# print(f"当前执行的参数: {site_name, date_type, date_info}")
# if date_type == "month":
# while True:
# try:
# site_name_pri_dict = {
# "us": 2,
# "uk": 4,
# "de": 6,
# }
# engine_mysql = get_remote_engine(
# site_name='us',
# db_type='mysql'
# )
# spider_script = f'ansible dabing_all -f 10 -m shell -a "nohup /usr/local/bin/python3 /mnt/py_spider/threading_spider/Poll_site_spider_month.py {site_name} {date_type} {date_info} >/dev/null 2>&1 &";'
# priority = site_name_pri_dict[site_name]
# update_sql_workflow_spider = f"""
# INSERT INTO selection.workflow_manager
# (
# workflow_name,
# site_name,
# date_type,
# date_info,
# priority,
# spider_name,
# spider_script,
# spider_is_ready,
# spider_state,
# bg_name,
# bg_dol_name,
# bg_dol_state,
# finished_count
# )
# VALUES
# (
# '月全流程',
# '{site_name}',
# 'month',
# '{date_info}',
# {priority},
# '{site_name}_spider_asin',
# '{spider_script}',
# 'yes',
# 1,
# '{site_name}_all_cal',
# 'ALL-月流程-ABA+反查+流量选品',
# 1,
# 0
# )
# ON DUPLICATE KEY UPDATE
# spider_is_ready = VALUES(spider_is_ready),
# spider_script = VALUES(spider_script),
# spider_state = VALUES(spider_state),
# bg_dol_name = VALUES(bg_dol_name);
# """
# print(f"workflow_manager进度表---重置爬虫的asin抓取进度: {update_sql_workflow_spider}")
# engine_mysql.execute(update_sql_workflow_spider)
#
# update_sql_workflow_bg = f"""update selection.workflow_manager
# set bg_dol_state=3, finished_count=COALESCE(finished_count, 0) + 1
# WHERE workflow_name='月全流程' and site_name='{site_name}' and date_type='{date_type}' and date_info='{date_info}' and priority={priority}"""
# print(f"workflow_manager进度表---更新asin导出进度和完成次数: {update_sql_workflow_bg}")
# engine_mysql.execute(update_sql_workflow_bg)
# break
# except Exception as e:
# print(f"失败:workflow_manager进度表---重置爬虫的asin抓取进度: {update_sql_workflow_spider}, {e}, 报错信息: {traceback.format_exc()}")
# time.sleep(300)
# continue
def
export_data
(
site_name
,
date_type
,
date_info
):
engine
=
get_remote_engine
(
site_name
=
site_name
,
# -> database "selection"
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment