#noticket Tests added to clarify license URL extraction.

This commit is contained in:
David Read 2013-01-31 14:32:19 +00:00 committed by amercader
parent e20080e69d
commit 9daff6a5b2
1 changed files with 31 additions and 2 deletions

View File

@ -13,7 +13,8 @@ from ckanext.harvest.model import (setup as harvest_model_setup,
HarvestSource, HarvestJob, HarvestObject) HarvestSource, HarvestJob, HarvestObject)
from ckanext.spatial.validation import Validators, SchematronValidator from ckanext.spatial.validation import Validators, SchematronValidator
from ckanext.spatial.harvesters import (GeminiCswHarvester, GeminiDocHarvester, from ckanext.spatial.harvesters import (GeminiCswHarvester, GeminiDocHarvester,
GeminiWafHarvester, SpatialHarvester) GeminiWafHarvester, SpatialHarvester,
GeminiHarvester)
from ckanext.spatial.model.package_extent import setup as spatial_db_setup from ckanext.spatial.model.package_extent import setup as spatial_db_setup
from ckanext.spatial.tests.base import SpatialTestBase from ckanext.spatial.tests.base import SpatialTestBase
@ -165,7 +166,7 @@ class TestHarvest(HarvestFixtureBase):
pkgs = Session.query(Package).all() pkgs = Session.query(Package).all()
assert len(pkgs) == 2 assert_equal(len(pkgs), 2)
pkg_ids = [pkg.id for pkg in pkgs] pkg_ids = [pkg.id for pkg in pkgs]
@ -801,6 +802,34 @@ class TestHarvest(HarvestFixtureBase):
source_dict = get_action('harvest_source_show')(self.context,{'id':source.id}) source_dict = get_action('harvest_source_show')(self.context,{'id':source.id})
assert len(source_dict['status']['packages']) == 1 assert len(source_dict['status']['packages']) == 1
class TestImportStageTools:
def test_licence_url_normal(self):
assert_equal(GeminiHarvester._extract_first_licence_url(
['Reference and PSMA Only',
'http://www.test.gov.uk/licenseurl']),
'http://www.test.gov.uk/licenseurl')
def test_licence_url_multiple_urls(self):
# only the first URL is extracted
assert_equal(GeminiHarvester._extract_first_licence_url(
['Reference and PSMA Only',
'http://www.test.gov.uk/licenseurl',
'http://www.test.gov.uk/2nd_licenseurl']),
'http://www.test.gov.uk/licenseurl')
def test_licence_url_embedded(self):
# URL is embedded within the text field and not extracted
assert_equal(GeminiHarvester._extract_first_licence_url(
['Reference and PSMA Only http://www.test.gov.uk/licenseurl']),
None)
def test_licence_url_embedded_at_start(self):
# URL is embedded at the start of the text field and the
# whole field is returned. Noting this unusual behaviour
assert_equal(GeminiHarvester._extract_first_licence_url(
['http://www.test.gov.uk/licenseurl Reference and PSMA Only']),
'http://www.test.gov.uk/licenseurl Reference and PSMA Only')
class TestValidation(HarvestFixtureBase): class TestValidation(HarvestFixtureBase):