es_isrepost 赋值修改为 1

This commit is contained in:
DELL 2026-01-21 10:04:57 +08:00
parent 8c84df0fdc
commit 073f4325d0

View File

@@ -185,13 +185,13 @@ class TwitterSpider(scrapy.Spider):
item['es_urltime'] = get_time_stamp( item['es_urltime'] = get_time_stamp(
str(created_at)) + 8 * 3600 * 1000 # TW默认使用的是零时区转换为北京时间 str(created_at)) + 8 * 3600 * 1000 # TW默认使用的是零时区转换为北京时间
if 'quoted_status_result' in result: if 'quoted_status_result' in result:
item['es_isrepost'] = 'yes' item['es_isrepost'] = 1
item['es_urltitle'] = author_full_text item['es_urltitle'] = author_full_text
item['es_catalog1'] = author_full_text item['es_catalog1'] = author_full_text
legacy = result['quoted_status_result']['result']['legacy'] legacy = result['quoted_status_result']['result']['legacy']
self.logger.info('采集引用推文原文信息') self.logger.info('采集引用推文原文信息')
elif 'retweeted_status_result' in legacy: elif 'retweeted_status_result' in legacy:
item['es_isrepost'] = 'yes' item['es_isrepost'] = 1
legacy = legacy['retweeted_status_result']['result']['legacy'] legacy = legacy['retweeted_status_result']['result']['legacy']
self.logger.info('采集转发推文原文信息') self.logger.info('采集转发推文原文信息')
item['es_content'] = legacy['full_text'] item['es_content'] = legacy['full_text']