"is_amazon_new",# Derived: 1 if badge_text contains "new on amazon"
"is_movie_label",# Derived: whether the item is a movie/media category (0/1)
"is_brand_label",# Derived: whether a brand is present (0/1)
"multi_color_flag",# Derived: multi-color flag (0 = not multi-color / 1 = multi-color by attribute / 2 = title fallback)
...
...
@@ -866,15 +873,21 @@ class KafkaFlowAsinDetail(Templates):
.persist(StorageLevel.DISK_ONLY)
# df_seller_info has finished its derivation step; release its cache promptly
self.df_seller_info.unpersist()
print("3. 读取asin_label信息")
print("3. 读取asin_label信息(含 badge_text)")
sql=f"""
select asin, label from
(select asin, lower(label) as label, created_time,row_number() over(partition by asin,label order by updated_time desc) as crank
from ods_other_search_term_data where site_name='{self.site_name}' and date_type='30day' and trim(label) not in ('null','') and label is not null) t where t.crank=1
select asin, lower(label) as label, lower(badge_text) as badge_text
from ods_other_search_term_data
where site_name = '{self.site_name}' and date_type = '30day'