From ee9473a6c3dc62e5765148bfac3c88459ac8f988 Mon Sep 17 00:00:00 2001 From: yuxin-pc Date: Tue, 20 Jan 2026 11:07:54 +0800 Subject: [PATCH] =?UTF-8?q?=E5=8C=B9=E9=85=8D=E5=8E=9F=E6=96=87?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- research/pdf_downloader/set_raw_title_kcna.py | 3 ++- research/pdf_downloader/set_raw_title_rodong.py | 6 ++++-- 2 files changed, 6 insertions(+), 3 deletions(-) diff --git a/research/pdf_downloader/set_raw_title_kcna.py b/research/pdf_downloader/set_raw_title_kcna.py index 2925987..bb2deb4 100644 --- a/research/pdf_downloader/set_raw_title_kcna.py +++ b/research/pdf_downloader/set_raw_title_kcna.py @@ -75,7 +75,8 @@ def main(): FROM indeximos WHERE es_srcname IN ({placeholders}) AND es_urlname IS NOT NULL - AND es_urlname != '' + AND es_urlname != '' + AND es_loadtime > '2026-01-16 10:40:00' """ cursor.execute(query, TARGET_SRCNAMES) records = cursor.fetchall() diff --git a/research/pdf_downloader/set_raw_title_rodong.py b/research/pdf_downloader/set_raw_title_rodong.py index 0aaba06..eeac4d8 100644 --- a/research/pdf_downloader/set_raw_title_rodong.py +++ b/research/pdf_downloader/set_raw_title_rodong.py @@ -63,6 +63,7 @@ def get_chinese_records(cursor) -> List[Tuple]: WHERE es_srcname IN ({placeholders}) AND es_urltitle IS NOT NULL AND TRIM(es_urltitle) != '' AND es_urltime IS NOT NULL + AND es_loadtime > '2026-01-16 10:40:00' """ cursor.execute(query, TARGET_SRCNAMES) return cursor.fetchall() @@ -73,11 +74,12 @@ def get_foreign_candidates_by_time(cursor, pub_time) -> List[Tuple]: 获取同一发布时间的所有外文候选记录(要求 es_abstract 不为空) """ query = """ - SELECT es_sid, es_abstract, es_urltitle, es_urlcontent + SELECT es_sid, es_title, es_urltitle, es_urlcontent FROM indeximos WHERE es_urltime = %s - AND es_abstract IS NOT NULL AND TRIM(es_abstract) != '' + AND es_title IS NOT NULL AND TRIM(es_title) != '' AND es_urlcontent IS NOT NULL + AND es_loadtime > '2026-01-16 10:40:00' """ cursor.execute(query, (pub_time,)) return cursor.fetchall()