From ae522b79b79c364725c8e71b5f6e7d8171035004 Mon Sep 17 00:00:00 2001 From: Fuhu Xia Date: Tue, 25 Jun 2024 08:58:39 -0400 Subject: [PATCH] raise error and return None for ParentNotHarvestedException --- ckanext/datajson/datajson.py | 15 ++++++--------- 1 file changed, 6 insertions(+), 9 deletions(-) diff --git a/ckanext/datajson/datajson.py b/ckanext/datajson/datajson.py index b37b3d1b..d68e190d 100644 --- a/ckanext/datajson/datajson.py +++ b/ckanext/datajson/datajson.py @@ -458,14 +458,7 @@ def is_part_of_to_package_id(self, ipo, harvest_object): # we have 0 o bad results msg = 'Parent identifier not found: "{}"'.format(ipo) log.error(msg) - try: - harvest_object_error = HarvestObjectError(message=msg, object=harvest_object) - harvest_object_error.save() - harvest_object.state = "ERROR" - harvest_object.save() - except Exception: - pass - raise ParentNotHarvestedException('Unable to find parent dataset. Raising error to allow re-run later') + raise ParentNotHarvestedException('Unable to find parent dataset.') def import_stage(self, harvest_object): # The import stage actually creates the dataset. @@ -501,7 +494,11 @@ def import_stage(self, harvest_object): # check if parent is already harvested parent_identifier = parent_pkg_id.replace('IPO:', '') - parent = self.is_part_of_to_package_id(parent_identifier, harvest_object) + try: + parent = self.is_part_of_to_package_id(parent_identifier, harvest_object) + except ParentNotHarvestedException as e: + self._save_object_error(str(e), harvest_object, 'Import') + return None parent_pkg_id = parent['id'] if extra.key.startswith('catalog_'):