From f1ed839f4c61d5f637ab77c162bf8403ad107aa4 Mon Sep 17 00:00:00 2001 From: Roberta Takenaka Date: Wed, 24 Nov 2021 20:31:56 -0300 Subject: [PATCH] =?UTF-8?q?Como=20h=C3=A1=20casos=20em=20que=20o=20doi=20p?= =?UTF-8?q?ode=20estar=20errado=20(o=20mesmo=20doi=20atribu=C3=ADdo=20para?= =?UTF-8?q?=20artigos=20diferentes),=20deve-se=20comparar=20mais=20dados?= =?UTF-8?q?=20para=20garantir=20que=20=C3=A9=20uma=20repeti=C3=A7?= =?UTF-8?q?=C3=A3o?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- airflow/dags/operations/sync_kernel_to_website_operations.py | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/airflow/dags/operations/sync_kernel_to_website_operations.py b/airflow/dags/operations/sync_kernel_to_website_operations.py index a98fa26d..bc331c2c 100644 --- a/airflow/dags/operations/sync_kernel_to_website_operations.py +++ b/airflow/dags/operations/sync_kernel_to_website_operations.py @@ -667,6 +667,11 @@ def _unpublish_repeated_documents(document_id, doi): for doc in docs: if doc._id == document_id: continue + if doc.title != new_doc.title: + continue + if doc.issue != new_doc.issue and not doc.issue.endswith("aop"): + continue + logging.info("Repeated document %s / %s / %s / %s" % (doc._id, doc.pid, doc.aop_pid, str(doc.scielo_pids))) # obtém os pids