2012-10-17 17:59:02 +02:00
|
|
|
"""
|
|
|
|
Some very thin wrapper classes around those in OWSLib
|
|
|
|
for convenience.
|
|
|
|
"""
|
|
|
|
|
2019-12-11 13:23:03 +01:00
|
|
|
from past.builtins import basestring
|
|
|
|
from builtins import object
|
2012-10-17 17:59:02 +02:00
|
|
|
import logging
|
|
|
|
|
|
|
|
from owslib.etree import etree
|
2015-12-25 20:09:37 +01:00
|
|
|
from owslib.fes import PropertyIsEqualTo, SortBy, SortProperty
|
2012-10-17 17:59:02 +02:00
|
|
|
|
|
|
|
# Module-level logger, named after this module; used to trace outgoing
# CSW requests.
log = logging.getLogger(__name__)
|
|
|
|
|
|
|
|
class CswError(Exception):
    """Raised when a CSW request comes back with an exception report."""
|
|
|
|
|
|
|
|
class OwsService(object):
    """Base class for thin wrappers around an OWSLib service client.

    Subclasses supply the client class through the ``_Implementation``
    class attribute.  The client is created once per instance, on first
    use, and cached on the instance as ``__ows_obj__``.
    """

    def __init__(self, endpoint=None):
        """Optionally create the underlying client straight away.

        :param endpoint: service endpoint handed to ``_Implementation``.
            When ``None`` no client is created here; it has to be supplied
            later through the ``endpoint`` keyword of an operation.
        """
        if endpoint is not None:
            self._ows(endpoint)

    def __call__(self, args):
        """Run the operation named by ``args.operation``.

        The public attributes of ``args`` are flattened with ``_xmd`` and
        passed to the operation as keyword arguments (this includes
        ``operation`` itself, which the operations absorb via ``**kw``).

        :returns: whatever the selected operation returns.
        """
        return getattr(self, args.operation)(**self._xmd(args))

    @classmethod
    def _operations(cls):
        """Return the names of all public attributes of the class."""
        return [x for x in dir(cls) if not x.startswith("_")]

    def _xmd(self, obj):
        """Flatten the public attributes of ``obj`` into a plain dict.

        Falsy values and callables are skipped.  Strings, numbers
        (``int``, which also covers ``bool``, and ``float``) and lists are
        copied as they are; any other value is flattened recursively.

        :param obj: object whose public attributes are extracted.
        :returns: dict mapping attribute name to value or nested dict.
        """
        md = {}
        for attr in dir(obj):
            if attr.startswith("_"):
                continue
            val = getattr(obj, attr)
            if not val or callable(val):
                continue
            # ``float`` must be treated as a leaf: a float's ``real``
            # attribute is the same float again, so recursing into it
            # would never terminate.
            if isinstance(val, (basestring, int, float, list)):
                md[attr] = val
            else:
                md[attr] = self._xmd(val)
        return md

    def _ows(self, endpoint=None, **kw):
        """Return the cached service client, creating it on first use.

        :param endpoint: service endpoint; only needed for the call that
            creates the client.
        :param kw: accepted and ignored, so callers can forward their own
            keyword arguments unchanged.
        :raises NotImplementedError: if the class defines no
            ``_Implementation``.
        :raises ValueError: if no client exists yet and ``endpoint`` is
            ``None``.
        """
        if not hasattr(self, "_Implementation"):
            raise NotImplementedError("Needs an Implementation")
        if not hasattr(self, "__ows_obj__"):
            if endpoint is None:
                raise ValueError("Must specify a service endpoint")
            self.__ows_obj__ = self._Implementation(endpoint)
        return self.__ows_obj__

    def getcapabilities(self, debug=False, **kw):
        """Return the service client's public attributes as a dict.

        :param debug: when false (the default) the ``request``,
            ``response`` and ``owscommon`` entries are removed from the
            result.
        :param kw: forwarded to ``_ows`` (e.g. ``endpoint``).
        :returns: dict produced by ``_xmd`` for the service client.
        """
        ows = self._ows(**kw)
        caps = self._xmd(ows)
        if not debug:
            for key in ("request", "response", "owscommon"):
                caps.pop(key, None)
        return caps
|
|
|
|
|
|
|
|
class CswService(OwsService):
    """
    Perform various operations on a CSW service
    """
    # Imported inside the class body so that the client class becomes the
    # ``_Implementation`` class attribute instantiated by ``_ows``.
    from owslib.csw import CatalogueServiceWeb as _Implementation

    def __init__(self, endpoint=None):
        """Create the wrapper and set the default sort order.

        :param endpoint: CSW endpoint, forwarded to the base class.
        """
        super(CswService, self).__init__(endpoint)
        # Sent with every getrecords2 request made by this class.
        self.sortby = SortBy([SortProperty('dc:identifier')])

    @staticmethod
    def _type_constraints(qtype):
        """Return the filter constraints restricting ``dc:type`` to ``qtype``."""
        if qtype is None:
            return []
        return [PropertyIsEqualTo("dc:type", qtype)]

    @staticmethod
    def _raise_on_exception(csw, action):
        """Raise ``CswError`` if the last request left an exception report."""
        if csw.exceptionreport:
            raise CswError('Error getting %s: %r' %
                           (action, csw.exceptionreport.exceptions))

    def getrecords(self, qtype=None, keywords=None,
                   typenames="csw:Record", esn="brief",
                   skip=0, count=10, outputschema="gmd", **kw):
        """Fetch one page of records and return them as plain dicts.

        :param qtype: when given, only records whose ``dc:type`` equals
            this value are requested.
        :param keywords: accepted for compatibility; not used.
        :param typenames: passed to ``getrecords2`` as ``typenames``.
        :param esn: passed to ``getrecords2`` as ``esn``.
        :param skip: passed to ``getrecords2`` as ``startposition``.
        :param count: passed to ``getrecords2`` as ``maxrecords``.
        :param outputschema: key into ``owslib.csw.namespaces``.
        :param kw: forwarded to ``_ows`` (e.g. ``endpoint``).
        :returns: list with one ``_xmd`` dict per returned record.
        :raises CswError: if the service answered with an exception report.
        """
        from owslib.csw import namespaces

        csw = self._ows(**kw)
        kwa = {
            "constraints": self._type_constraints(qtype),
            "typenames": typenames,
            "esn": esn,
            "startposition": skip,
            "maxrecords": count,
            "outputschema": namespaces[outputschema],
            "sortby": self.sortby,
        }
        log.info('Making CSW request: getrecords2 %r', kwa)
        csw.getrecords2(**kwa)
        self._raise_on_exception(csw, 'records')
        return [self._xmd(r) for r in csw.records.values()]

    def getidentifiers(self, qtype=None, typenames="csw:Record", esn="brief",
                       keywords=None, limit=None, page=10, outputschema="gmd",
                       startposition=0, cql=None, **kw):
        """Yield record identifiers, requesting them page by page.

        :param qtype: when given, only records whose ``dc:type`` equals
            this value are requested.
        :param typenames: passed to ``getrecords2`` as ``typenames``.
        :param esn: passed to ``getrecords2`` as ``esn``.
        :param keywords: accepted for compatibility; not used.
        :param limit: upper bound on the record position; each page is
            truncated to ``limit - startposition`` identifiers and paging
            stops once that bound is reached.  ``None`` means no bound.
        :param page: page size, passed as ``maxrecords``; also the step by
            which ``startposition`` advances.
        :param outputschema: key into ``owslib.csw.namespaces``.
        :param startposition: position of the first requested record.
        :param cql: passed to ``getrecords2`` as ``cql``.
        :param kw: forwarded to ``_ows`` (e.g. ``endpoint``).
        :raises CswError: if the service answered with an exception report.
        """
        from owslib.csw import namespaces

        csw = self._ows(**kw)
        kwa = {
            "constraints": self._type_constraints(qtype),
            "typenames": typenames,
            "esn": esn,
            "startposition": startposition,
            "maxrecords": page,
            "outputschema": namespaces[outputschema],
            "cql": cql,
            "sortby": self.sortby,
        }
        yielded = 0
        matches = 0
        while True:
            log.info('Making CSW request: getrecords2 %r', kwa)
            csw.getrecords2(**kwa)
            self._raise_on_exception(csw, 'identifiers')

            if matches == 0:
                matches = csw.results['matches']

            identifiers = list(csw.records.keys())
            if limit is not None:
                # Clamp at zero: a negative bound would slice from the end
                # of the page and hand out identifiers past the limit.
                identifiers = identifiers[:max(limit - startposition, 0)]
            for ident in identifiers:
                yield ident

            if not identifiers:
                break

            yielded += len(identifiers)
            startposition += page
            # Stop as soon as the limit is reached instead of requesting a
            # further page that could only be thrown away.
            if limit is not None and (yielded >= limit or
                                      startposition >= limit):
                break
            if startposition >= (matches + 1):
                break

            kwa["startposition"] = startposition

    def getrecordbyid(self, ids=None, esn="full", outputschema="gmd", **kw):
        """Fetch a record by id and return it with its serialised XML.

        :param ids: identifiers passed to the client's ``getrecordbyid``;
            defaults to an empty list.
        :param esn: passed to the client as ``esn``.
        :param outputschema: key into ``owslib.csw.namespaces``.
        :param kw: forwarded to ``_ows`` (e.g. ``endpoint``).
        :returns: ``None`` when no record came back; otherwise the ``_xmd``
            dict of the first record, extended with ``"xml"`` (the
            ``gmd:MD_Metadata`` element as text, with an XML declaration
            prepended) and ``"tree"`` (the element wrapped in an
            ``ElementTree``).
        :raises CswError: if the service answered with an exception report.
        """
        from owslib.csw import namespaces

        if ids is None:
            ids = []
        csw = self._ows(**kw)
        kwa = {
            "esn": esn,
            "outputschema": namespaces[outputschema],
        }
        log.info('Making CSW request: getrecordbyid %r %r', ids, kwa)
        csw.getrecordbyid(ids, **kwa)
        self._raise_on_exception(csw, 'record by id')
        if not csw.records:
            return None
        record = self._xmd(next(iter(csw.records.values())))

        # Strip off the enclosing results container, we only want the
        # metadata.  The namespace URI is spelled out in the path rather
        # than passed through a ``namespaces`` argument to find().
        md = csw._exml.find("/{http://www.isotc211.org/2005/gmd}MD_Metadata")
        mdtree = etree.ElementTree(md)
        try:
            xml = etree.tostring(mdtree, pretty_print=True, encoding=str)
        except TypeError:
            # API incompatibilities between different flavours of
            # elementtree: the standard library's tostring() has no
            # ``pretty_print`` argument, takes the element itself and
            # spells text output as encoding="unicode".
            xml = etree.tostring(md, encoding="unicode")

        record["xml"] = '<?xml version="1.0" encoding="UTF-8"?>\n' + xml
        record["tree"] = mdtree
        return record
|