# harvester-d4science/ckanext/harvest/controllers/view.py
# (175 lines, 6.1 KiB, Python)

from ckan.lib.helpers import json
# 2011-03-10 10:45:16 +01:00
import urllib2
import ckan.lib.helpers as h
from ckan.lib.base import BaseController, c, g, request, \
response, session, render, config, abort, redirect
from ckan.model import Package
class ViewController(BaseController):
    """Web pages for managing harvest sources via the CKAN HTTP APIs.

    Every action talks to the CKAN instance configured in ``ckan.api_url``
    over HTTP (REST API for reads and harvesting jobs, form API for
    create/edit/delete) and authenticates with ``ckan.harvesting.api_key``.
    """

    # REST API root, e.g. http://localhost:5000/api/2/rest
    api_url = config.get('ckan.api_url', 'http://localhost:5000').rstrip('/')+'/api/2/rest'
    # Form API root, e.g. http://localhost:5000/api/2/form
    form_api_url = config.get('ckan.api_url', 'http://localhost:5000').rstrip('/')+'/api/2/form'
    # Sent verbatim as the ``Authorization`` header of every API request.
    api_key = config.get('ckan.harvesting.api_key')

    def _do_request(self, url, data=None):
        """Open ``url`` with the harvesting API key and return the response.

        :param url: absolute URL to request.
        :param data: optional request body; only attached when truthy
            (urllib2 sends a POST instead of a GET when data is present).
        :returns: the file-like object returned by ``urllib2.urlopen``.
            The caller is responsible for closing it.
        :raises urllib2.HTTPError: on an HTTP error status.
        :raises urllib2.URLError: when the server cannot be reached.
        """
        http_request = urllib2.Request(
            url=url,
            headers={'Authorization': self.api_key},
        )
        if data:
            http_request.add_data(data)
        return urllib2.urlopen(http_request)

    def _fetch(self, url, data=None):
        """Request ``url`` and return its body, always closing the response."""
        http_response = self._do_request(url, data)
        try:
            return http_response.read()
        finally:
            http_response.close()

    def _http_error_message(self, error):
        """Build the flash message shown for a ``urllib2.HTTPError``."""
        return 'An error occurred: [%s %s]' % (str(error.getcode()), error.msg)

    def _url_error_message(self, error):
        """Build the flash message for a non-HTTP ``urllib2.URLError``."""
        return 'An error occurred: [%s]' % error.reason

    def index(self):
        """List all harvest sources.

        Fetches the list of source ids, then the details of each source,
        and stores them in ``c.sources``. On an HTTP error a flash message
        is shown and ``c.sources`` is left unset.
        """
        # Request all harvesting sources
        sources_url = self.api_url + '/harvestsource'
        try:
            sources_ids = json.loads(self._fetch(sources_url))

            # For each source, request its details
            source_url = sources_url + '/%s'
            c.sources = [json.loads(self._fetch(source_url % source_id))
                         for source_id in sources_ids]
        except urllib2.HTTPError as e:
            h.flash_error(self._http_error_message(e))

        return render('ckanext/harvest/index.html')

    def create(self):
        """Show the creation form (GET) or submit a new source (POST).

        A POST always ends in a redirect to the index page, with a flash
        message reporting success or failure. Other HTTP methods fall
        through and return ``None``.
        """
        # This is the DGU form API, so we don't use self.api_url
        form_url = self.form_api_url + '/harvestsource/create'
        if request.method == 'GET':
            # Request the fields
            c.form = self._fetch(form_url)
            c.mode = 'create'
            return render('ckanext/harvest/create.html')
        if request.method == 'POST':
            # Build an object like the one expected by the DGU form API
            data = json.dumps({
                'form_data': {
                    'HarvestSource--url': request.POST['HarvestSource--url'],
                    'HarvestSource--description': request.POST['HarvestSource--description'],
                },
                'user_ref': '',
                'publisher_ref': '',
            })
            try:
                self._do_request(form_url, data).close()
            except urllib2.HTTPError as e:
                msg = self._http_error_message(e)
                # The form API returns just a 500, so we are not exactly
                # sure of what happened, but most probably it was a
                # duplicate entry
                if e.getcode() == 500:
                    msg = msg + ' Does the source already exist?'
                h.flash_error(msg)
            except urllib2.URLError as e:
                h.flash_error(self._url_error_message(e))
            else:
                h.flash_success('Harvesting source added successfully')
            # redirect() works by raising, so it must not sit in a
            # ``finally`` clause: there it would silently replace any
            # unexpected exception still propagating.
            redirect(h.url_for(controller='harvest', action='index'))

    def show(self, id):
        """Render the details page of the harvest source ``id``.

        HTTP errors from the API are not handled here and propagate.
        """
        sources_url = self.api_url + '/harvestsource/%s' % id
        c.source = json.loads(self._fetch(sources_url))

        return render('ckanext/harvest/show.html')

    def delete(self, id):
        """Delete the harvest source ``id`` and redirect to the index.

        A flash message reports success or the error returned by the API.
        """
        form_url = self.form_api_url + '/harvestsource/delete/%s' % id
        try:
            self._do_request(form_url).close()
        except urllib2.HTTPError as e:
            h.flash_error(self._http_error_message(e))
        except urllib2.URLError as e:
            h.flash_error(self._url_error_message(e))
        else:
            h.flash_success('Harvesting source deleted successfully')
        redirect(h.url_for(controller='harvest', action='index', id=None))

    def edit(self, id):
        """Show the edit form (GET) or submit changes (POST) for ``id``.

        A POST always ends in a redirect to the index page, with a flash
        message reporting success or failure. Other HTTP methods fall
        through and return ``None``.
        """
        form_url = self.form_api_url + '/harvestsource/edit/%s' % id
        if request.method == 'GET':
            # Request the fields
            c.form = self._fetch(form_url)
            c.mode = 'edit'
            return render('ckanext/harvest/create.html')
        if request.method == 'POST':
            # Field names of the edit form embed the source id
            url_field = 'HarvestSource-%s-url' % id
            description_field = 'HarvestSource-%s-description' % id
            # Build an object like the one expected by the DGU form API
            data = json.dumps({
                'form_data': {
                    url_field: request.POST[url_field],
                    description_field: request.POST[description_field],
                },
                'user_ref': '',
                'publisher_ref': '',
            })
            try:
                self._do_request(form_url, data).close()
            except urllib2.HTTPError as e:
                h.flash_error(self._http_error_message(e))
            except urllib2.URLError as e:
                h.flash_error(self._url_error_message(e))
            else:
                h.flash_success('Harvesting source edited successfully')
            # Kept outside ``finally`` so unexpected exceptions are not
            # masked by the exception redirect() raises.
            redirect(h.url_for(controller='harvest', action='index', id=None))

    def create_harvesting_job(self, id):
        """Request a new harvesting job for source ``id``, then redirect.

        On a 400 response the body returned by the API is appended to the
        flash error message.
        """
        form_url = self.api_url + '/harvestingjob'
        data = json.dumps({
            'source_id': id,
            'user_ref': '',
        })
        try:
            self._do_request(form_url, data).close()
        except urllib2.HTTPError as e:
            msg = self._http_error_message(e)
            if e.getcode() == 400:
                msg = msg + ' ' + e.read()
            h.flash_error(msg)
        except urllib2.URLError as e:
            h.flash_error(self._url_error_message(e))
        else:
            h.flash_success('Refresh requested, harvesting will take place within 15 minutes.')
        # Kept outside ``finally`` so unexpected exceptions are not masked
        # by the exception redirect() raises.
        redirect(h.url_for(controller='harvest', action='index', id=None))

    def map_view(self, id):
        """Render the map page for package ``id``; 404 if it is unknown."""
        # check if package exists
        pkg = Package.get(id)
        if pkg is None:
            abort(404, 'Package not found')

        c.url = pkg.url

        return render('ckanext/harvest/map.html')

    def proxy(self):
        """Fetch the URL given in the ``url`` parameter and relay its body.

        Responds with 400 when ``url`` is missing or is not an http(s)
        URL. The upstream ``Content-Type`` is copied to the response when
        present. On an upstream HTTP error only its status code is
        relayed, with no body.
        """
        if 'url' not in request.params:
            abort(400)

        url = request.params['url']
        # SECURITY: the URL is user supplied and urllib2's default opener
        # also handles file: and ftp: URLs, which would expose local
        # files. Only plain web URLs are allowed through.
        # NOTE(review): this is still an open HTTP proxy and can reach
        # hosts on the internal network - consider a host whitelist.
        if not url.lower().startswith(('http://', 'https://')):
            abort(400)

        try:
            server_response = urllib2.urlopen(url)
        except urllib2.HTTPError as e:
            response.status_int = e.getcode()
            return

        try:
            content_type = server_response.info().get('Content-Type')
            if content_type:
                response.content_type = content_type
            return server_response.read()
        finally:
            server_response.close()