move detecting unchanged datasets to ckanharvester and queue.py

This commit is contained in:
Jari Voutilainen 2015-03-10 14:48:41 +02:00
parent 1e0376cff6
commit 859133fe36
3 changed files with 15 additions and 4 deletions

View File

@ -178,8 +178,6 @@ class HarvesterBase(SingletonPlugin):
else: else:
log.info('Package with GUID %s not updated, skipping...' % harvest_object.guid) log.info('Package with GUID %s not updated, skipping...' % harvest_object.guid)
harvest_object.report_status = 'not modified'
harvest_object.save()
return return
# Flag the other objects linking to this package as not current anymore # Flag the other objects linking to this package as not current anymore

View File

@ -378,6 +378,17 @@ class CKANHarvester(HarvesterBase):
for resource in package_dict.get('resources', []): for resource in package_dict.get('resources', []):
resource.pop('url_type', None) resource.pop('url_type', None)
# Check if package exists
data_dict = {}
data_dict['id'] = package_dict['id']
try:
existing_package_dict = get_action('package_show')(context, data_dict)
if 'metadata_modified' in package_dict and \
package_dict['metadata_modified'] <= existing_package_dict.get('metadata_modified'):
return "unchanged"
except NotFound:
pass
result = self._create_or_update_package(package_dict,harvest_object) result = self._create_or_update_package(package_dict,harvest_object)
if result and self.config.get('read_only',False) == True: if result and self.config.get('read_only',False) == True:

View File

@ -312,14 +312,16 @@ def fetch_and_import_stages(harvester, obj):
obj.import_finished = datetime.datetime.utcnow() obj.import_finished = datetime.datetime.utcnow()
if success_import: if success_import:
obj.state = "COMPLETE" obj.state = "COMPLETE"
if success_import is 'unchanged':
obj.report_status = 'not modified'
obj.save()
return
else: else:
obj.state = "ERROR" obj.state = "ERROR"
obj.save() obj.save()
else: else:
obj.state = "ERROR" obj.state = "ERROR"
obj.save() obj.save()
if obj.report_status == 'not modified':
return
if obj.state == 'ERROR': if obj.state == 'ERROR':
obj.report_status = 'errored' obj.report_status = 'errored'
elif obj.current == False: elif obj.current == False: