TPDL2020-context-propagation/es_connector.py

48 lines
1.5 KiB
Python
Raw Normal View History

2020-06-11 16:40:40 +02:00
from elasticsearch import Elasticsearch
from elasticsearch_dsl import *
import logging
log = logging.getLogger("ES connector")
log.setLevel(logging.INFO)
ES_HOST = "ip-90-147-167-25.ct1.garrservices.it"
class ESObject(object):
def __init__(self, id, pid, type, title, abstract, propagated_abstract):
self.id = id
self.pid = pid
self.type = type
self.title = title
self.abstract = abstract
self.propagated_abstract = propagated_abstract
class ESResponse(object):
def __init__(self, count=0, hits=[]):
self.count = count
self.hits = hits
class ESConnector(object):
def __init__(self):
self.index_host = ES_HOST
self.client = Elasticsearch(hosts=self.index_host, timeout=600000)
def query_after(self, query_string=None, start=0, i='propagation-after'):
s = Search(using=self.client, index=i)
if query_string is not None:
q = Q('query_string', query=query_string)
s = s.query(q)
s = s[start:start+10]
response = s.execute()
hits = []
for hit in response.hits:
hits.append(ESObject(hit.id,
hit.pid,
hit.type,
hit.title,
hit.abstract if 'abstract' in hit else '',
hit.propagated_abstract if 'propagated_abstract' in hit else ''))
return ESResponse(hits=hits, count=response.hits.total)