@@ -59,19 +55,19 @@ class CalculateMean(BaseUtils):
...
@@ -59,19 +55,19 @@ class CalculateMean(BaseUtils):
sql_6=f"""
sql_6=f"""
SELECT * from {self.site_name}_one_category WHERE id in ( select max(id) from {self.site_name}_one_category where `year_month`='2025_5' and orders=0 and rank>50000 GROUP BY `name`)
SELECT * from {self.site_name}_one_category WHERE id in ( select max(id) from {self.site_name}_one_category where `year_month`='2025_5' and orders=0 and rank>50000 GROUP BY `name`)
UNION
UNION
select * from {self.site_name}_one_category where `year_month`='2025_6' and rank<=50000
select * from {self.site_name}_one_category where `year_month`='2025_8' and rank<=50000
"""
"""
print('查询原始表6:',sql_6)
print('查询原始表6:',sql_6)
self.df_sum_6=pd.read_sql(sql_6,con=self.engine)
self.df_sum_6=self.engine.read_sql(sql_6)
# ---- 7 月份 ----
# ---- 7 月份 ----
sql_7=f"""
sql_7=f"""
SELECT * from {self.site_name}_one_category WHERE id in ( select max(id) from {self.site_name}_one_category where `year_month`='2025_5' and orders=0 and rank>50000 GROUP BY `name`)
SELECT * from {self.site_name}_one_category WHERE id in ( select max(id) from {self.site_name}_one_category where `year_month`='2025_5' and orders=0 and rank>50000 GROUP BY `name`)
UNION
UNION
select * from {self.site_name}_one_category where `year_month`='2025_7' and rank<=50000
select * from {self.site_name}_one_category where `year_month`='2025_9' and rank<=50000
update_workflow_progress=f"update workflow_progress set status_val=3,status='抓取结束' where page='ASIN销量' and date_info='2025-{week}' and site_name='{site_name}' and date_type='week'"
update_workflow_progress=f"update workflow_progress set status_val=3,status='抓取结束' where page='ASIN销量' and date_info='2025-{week}' and site_name='{site_name}' and date_type='week'"
dele_sql=f"DELETE from {site}_aba_profit_category_insights where category='{i[0]}' and product_type='{i[1]}' and item_type_keyword='{i[2]}' and year_week='{self.y_w}'"
# dele_sql = f"DELETE from {site}_aba_profit_category_insights where category='{i[0]}' and product_type='{i[1]}' and item_type_keyword='{i[2]}' and year_week='{self.y_w}'"
dele_sql=f"DELETE from {site}_aba_profit_category_insights where category='{i[0]}' and product_type='{i[1]}' and item_type_keyword='{i[2]}' and year_week='{self.y_w}'"
dele_sql=f"DELETE from {site}_aba_profit_category_insights where category='{i[0]}' and product_type='{i[1]}' and item_type_keyword='{i[2]}' and year_week='{self.y_w}'"
...
@@ -437,9 +441,18 @@ class dow_category_Product():
...
@@ -437,9 +441,18 @@ class dow_category_Product():
SET variation_family='{data_json}', status='{spider_value}', update_time='{update_time}' ,parent_asin='{parent_asin}',variation_asin={var_asin_list}
WHERE id={id} AND site_name='{site_name}'
"""
print('成功',sql)
eliferror=='账号电脑退出登录':
sql=f"""
UPDATE asin_variation_family_log SET status='未开始' WHERE id={id} AND site_name='{site_name}'
"""
else:
sql=f"""
UPDATE asin_variation_family_log
SET variation_family='{data_json}', status='{spider_value}', update_time='{update_time}' ,parent_asin='{parent_asin}',variation_asin={var_asin_list},err_msg='{error}'
# category_name_sql_select = f"select distinct `name` , orders,category_first_id from {db_base}_one_category where rank=1 and `year_month` ='{year_month}'"
# print(category_name_sql_select)
# cursor.execute(category_name_sql_select)
# category_name_list = cursor.fetchall()
# print(category_name_list,'3444444444')
# update_sql_state1 = f"""UPDATE {db_base}_one_category SET STATE= 1"""
@@ -408,32 +408,35 @@ class async_account_name_products(BaseUtils):
...
@@ -408,32 +408,35 @@ class async_account_name_products(BaseUtils):
try:
try:
withself.engine_pg6.begin()asconn:
withself.engine_pg6.begin()asconn:
# 查詢收藏asin
# 查詢收藏asin
sql_read_asin=f'SELECT id, data_id, end_time FROM {self.db_user_collection_syn} WHERE now() >= crawling_time and now() <= end_time and state = 1 and data_type = 1 ORDER BY id FETCH FIRST {self.read_size} ROWS ONLY FOR UPDATE;'
sql_read_asin=f'SELECT id, data_id, end_time FROM {self.db_user_collection_syn} WHERE now() >= crawling_time and now() <= end_time and state = 1 and data_type = 1 ORDER BY id FOR UPDATE'
sql_read=f'SELECT id, product_url,data_id,end_time FROM {self.db_user_collection_syn} WHERE now() >= crawling_time and now() <= end_time and state = 1 and data_type = 2 ORDER BY id FETCH FIRST {self.read_size} ROWS ONLY FOR UPDATE;'
sql_read=f'SELECT id, product_url,data_id,end_time FROM {self.db_user_collection_syn} WHERE now() >= crawling_time and now() <= end_time and state = 1 and data_type = 2 ORDER BY id FETCH FIRST {self.read_size} ROWS ONLY FOR UPDATE;'
sql_delete=f"DELETE FROM adv_low_competition_phrase WHERE site = '{site_url}' AND sku = '{self.sku}' ;"
sql_delete=f"""delete from adv_low_competition_phrase where site = '{site_url}' and sku='{self.sku}' and keyword_phrase in ("{tuple(new_df.keyword_phrase)[0]}");"""
sql=f"SELECT elem->>'boyris' AS asin,task_id,site_name FROM ai_asin_analyze_log,LATERAL json_array_elements(input_params) elem WHERE module='{module}' and spider_status='未开始' for update;"
else:
sql=f"""SELECT elem->>'asin' AS asin,task_id,site_name FROM ai_asin_analyze_log,LATERAL json_array_elements(input_params) elem WHERE module = '{module}' and spider_status='未开始' for update;"""
# sql = f"""SELECT elem->>'asin' AS asin,task_id,site_name FROM ai_asin_analyze_log,LATERAL json_array_elements(input_params) elem WHERE module = '{module}' and task_id=39 for update;"""
select_sql=f"""select id, site_name, task_id, unique_key as asin,sub_step from ai_asin_analyze_spider where sub_step = 'AsinInfoRepository:详情' and status = '未开始' and site_name='{site}' order by task_id"""