Commit 05c13cdd by fangxingjun

no message

parent 1d3a545e
......@@ -21,55 +21,53 @@ def update_workflow_manager(site_name, date_type, date_info):
site_name='us',
db_type='mysql'
)
with engine_mysql.begin() as conn:
spider_script = f'ansible dabing_all -f 10 -m shell -a "nohup /usr/local/bin/python3 /mnt/py_spider/threading_spider/Poll_site_spider_month.py {site_name} {date_type} {date_info} >/dev/null 2>&1 &";'
priority = site_name_pri_dict[site_name]
update_sql_workflow_spider = f"""
INSERT INTO selection.workflow_manager
(
workflow_name,
site_name,
date_type,
date_info,
priority,
spider_name,
spider_script,
spider_is_ready,
spider_state,
bg_name,
bg_dol_state,
finished_count
)
VALUES
(
'月全流程',
'{site_name}',
'month',
'{date_info}',
{priority},
'{site_name}_spider_asin',
'{spider_script}',
'yes',
1,
'{site_name}_all_cal',
3,
0
)
ON DUPLICATE KEY UPDATE
spider_is_ready = VALUES(spider_is_ready),
spider_script = VALUES(spider_script),
spider_state = VALUES(spider_state),
bg_dol_state = VALUES(bg_dol_state);
"""
print(f"workflow_manager进度表---重置爬虫的asin抓取进度: {update_sql_workflow_spider}")
conn.execute(update_sql_workflow_spider)
spider_script = f'ansible dabing_all -f 10 -m shell -a "nohup /usr/local/bin/python3 /mnt/py_spider/threading_spider/Poll_site_spider_month.py {site_name} {date_type} {date_info} >/dev/null 2>&1 &";'
priority = site_name_pri_dict[site_name]
update_sql_workflow_spider = f"""
INSERT INTO selection.workflow_manager
(
workflow_name,
site_name,
date_type,
date_info,
priority,
spider_name,
spider_script,
spider_is_ready,
spider_state,
bg_name,
bg_dol_state,
finished_count
)
VALUES
(
'月全流程',
'{site_name}',
'month',
'{date_info}',
{priority},
'{site_name}_spider_asin',
'{spider_script}',
'yes',
1,
'{site_name}_all_cal',
1,
0
)
ON DUPLICATE KEY UPDATE
spider_is_ready = VALUES(spider_is_ready),
spider_script = VALUES(spider_script),
spider_state = VALUES(spider_state);
"""
print(f"workflow_manager进度表---重置爬虫的asin抓取进度: {update_sql_workflow_spider}")
engine_mysql.execute(update_sql_workflow_spider)
update_sql_workflow_bg = f"""update selection.workflow_manager
set bg_dol_state=3, finished_count=COALESCE(finished_count, 0) + 1
WHERE workflow_name='月全流程' and site_name='{site_name}' and date_type='{date_type}' and date_info='{date_info}' and priority={priority}"""
print(f"workflow_manager进度表---更新asin导出进度和完成次数: {update_sql_workflow_bg}")
conn.execute(update_sql_workflow_bg)
break
update_sql_workflow_bg = f"""update selection.workflow_manager
set bg_dol_state=3, finished_count=COALESCE(finished_count, 0) + 1
WHERE workflow_name='月全流程' and site_name='{site_name}' and date_type='{date_type}' and date_info='{date_info}' and priority={priority}"""
print(f"workflow_manager进度表---更新asin导出进度和完成次数: {update_sql_workflow_bg}")
engine_mysql.execute(update_sql_workflow_bg)
break
except Exception as e:
print(f"失败:workflow_manager进度表---重置爬虫的asin抓取进度: {update_sql_workflow_spider}, {e}, 报错信息: {traceback.format_exc()}")
time.sleep(300)
......@@ -112,6 +110,6 @@ if __name__ == '__main__':
site_name = sys.argv[1] # 参数1:站点
date_type = sys.argv[2] # 参数2:类型:week/4_week/month/quarter/day
date_info = sys.argv[3] # 参数3:年-周/年-月/年-季/年-月-日, 比如: 2022-1
export_data(site_name, date_type, date_info)
# export_data(site_name, date_type, date_info)
if site_name in ["us", "uk", "de"] and date_type == "month":
update_workflow_manager(site_name, date_type, date_info)
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment