diff --git a/spiders/MediaSpiders/MediaSpiders/spiders/TwitterUserSpider.py b/spiders/MediaSpiders/MediaSpiders/spiders/TwitterUserSpider.py index 3a62562..2449034 100644 --- a/spiders/MediaSpiders/MediaSpiders/spiders/TwitterUserSpider.py +++ b/spiders/MediaSpiders/MediaSpiders/spiders/TwitterUserSpider.py @@ -185,13 +185,13 @@ class TwitterSpider(scrapy.Spider): item['es_urltime'] = get_time_stamp( str(created_at)) + 8 * 3600 * 1000 # TW默认使用的是零时区,转换为北京时间 if 'quoted_status_result' in result: - item['es_isrepost'] = 'yes' + item['es_isrepost'] = 1 item['es_urltitle'] = author_full_text item['es_catalog1'] = author_full_text legacy = result['quoted_status_result']['result']['legacy'] self.logger.info('采集引用推文原文信息') elif 'retweeted_status_result' in legacy: - item['es_isrepost'] = 'yes' + item['es_isrepost'] = 1 legacy = legacy['retweeted_status_result']['result']['legacy'] self.logger.info('采集转发推文原文信息') item['es_content'] = legacy['full_text']