Commit d9e2d8b9 by fangxingjun

no message

parent 1777e202
......@@ -10,76 +10,6 @@ sys.path.append(os.path.dirname(sys.path[0]))
from utils.secure_db_client import get_remote_engine
# def update_workflow_manager(site_name, date_type, date_info):
# print(f"当前执行的参数: {site_name, date_type, date_info}")
# if date_type == "month":
# while True:
# try:
# site_name_pri_dict = {
# "us": 2,
# "uk": 4,
# "de": 6,
# }
# engine_mysql = get_remote_engine(
# site_name='us',
# db_type='mysql'
# )
# spider_script = f'ansible dabing_all -f 10 -m shell -a "nohup /usr/local/bin/python3 /mnt/py_spider/threading_spider/Poll_site_spider_month.py {site_name} {date_type} {date_info} >/dev/null 2>&1 &";'
# priority = site_name_pri_dict[site_name]
# update_sql_workflow_spider = f"""
# INSERT INTO selection.workflow_manager
# (
# workflow_name,
# site_name,
# date_type,
# date_info,
# priority,
# spider_name,
# spider_script,
# spider_is_ready,
# spider_state,
# bg_name,
# bg_dol_name,
# bg_dol_state,
# finished_count
# )
# VALUES
# (
# '月全流程',
# '{site_name}',
# 'month',
# '{date_info}',
# {priority},
# '{site_name}_spider_asin',
# '{spider_script}',
# 'yes',
# 1,
# '{site_name}_all_cal',
# 'ALL-月流程-ABA+反查+流量选品',
# 1,
# 0
# )
# ON DUPLICATE KEY UPDATE
# spider_is_ready = VALUES(spider_is_ready),
# spider_script = VALUES(spider_script),
# spider_state = VALUES(spider_state),
# bg_dol_name = VALUES(bg_dol_name);
# """
# print(f"workflow_manager进度表---重置爬虫的asin抓取进度: {update_sql_workflow_spider}")
# engine_mysql.execute(update_sql_workflow_spider)
#
# update_sql_workflow_bg = f"""update selection.workflow_manager
# set bg_dol_state=3, finished_count=COALESCE(finished_count, 0) + 1
# WHERE workflow_name='月全流程' and site_name='{site_name}' and date_type='{date_type}' and date_info='{date_info}' and priority={priority}"""
# print(f"workflow_manager进度表---更新asin导出进度和完成次数: {update_sql_workflow_bg}")
# engine_mysql.execute(update_sql_workflow_bg)
# break
# except Exception as e:
# print(f"失败:workflow_manager进度表---重置爬虫的asin抓取进度: {update_sql_workflow_spider}, {e}, 报错信息: {traceback.format_exc()}")
# time.sleep(300)
# continue
def export_data(site_name, date_type, date_info):
engine = get_remote_engine(
site_name=site_name, # -> database "selection"
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment