Added cache that keeps hashtags for scope with a TTL of 5 minutes

git-svn-id: http://svn.research-infrastructures.eu/public/d4science/gcube/trunk/portlets/user/top-topics@128785 82a268e6-3cf1-43bd-a215-b396298e98cf
This commit is contained in:
Costantino Perciante 2016-05-23 15:43:44 +00:00
parent 9b7db56867
commit bf90c6723f
5 changed files with 291 additions and 100 deletions

View File

@ -21,6 +21,7 @@ import org.gcube.portal.databook.server.DBCassandraAstyanaxImpl;
import org.gcube.portal.databook.server.DatabookStore; import org.gcube.portal.databook.server.DatabookStore;
import org.gcube.portal.databook.shared.Feed; import org.gcube.portal.databook.shared.Feed;
import org.gcube.portlets.user.topics.client.TopicService; import org.gcube.portlets.user.topics.client.TopicService;
import org.gcube.portlets.user.topics.server.cache.TopicsCacheImpl;
import org.gcube.portlets.user.topics.shared.HashTagAndOccurrence; import org.gcube.portlets.user.topics.shared.HashTagAndOccurrence;
import org.gcube.portlets.user.topics.shared.HashtagsWrapper; import org.gcube.portlets.user.topics.shared.HashtagsWrapper;
import org.gcube.vomanagement.usermanagement.GroupManager; import org.gcube.vomanagement.usermanagement.GroupManager;
@ -43,7 +44,7 @@ public class TopicServiceImpl extends RemoteServiceServlet implements TopicServi
public static final String TEST_USER = "test.user"; public static final String TEST_USER = "test.user";
private static final int WINDOW_SIZE_IN_MONTHS = 6; // it must not exceed 12 private static final int WINDOW_SIZE_IN_MONTHS = 6; // it must not exceed 12
/** /**
* The Cassandra store interface * The Cassandra store interface
*/ */
@ -87,130 +88,151 @@ public class TopicServiceImpl extends RemoteServiceServlet implements TopicServi
*/ */
@Override @Override
public HashtagsWrapper getHashtags() { public HashtagsWrapper getHashtags() {
ArrayList<String> hashtagsChart = new ArrayList<>(); ArrayList<String> hashtagsChart;
ASLSession session = getASLSession(); ASLSession session = getASLSession();
long timestampStart = System.currentTimeMillis();
// get the reference time
Calendar referenceTime = Calendar.getInstance();
int currentMonth = referenceTime.get(Calendar.MONTH); // jan = 0, ..... dec = 11
referenceTime.set(Calendar.MONTH, currentMonth - WINDOW_SIZE_IN_MONTHS); // the year is automatically decreased if needed
// print it
SimpleDateFormat format = new SimpleDateFormat("yyyy-MM-dd");
_log.debug("Reference time for trending topics is " + format.format(referenceTime.getTime()));
String userName = session.getUsername(); String userName = session.getUsername();
boolean isInfrastructure = isInfrastructureScope(); boolean isInfrastructure = isInfrastructureScope();
String currentScope = session.getScope();
try {
//in case the portal is restarted and you have the social home open it will get test.user (no callback to set session info)
//this check just return nothing if that happens
if (userName.compareTo("test.user") == 0) {
_log.debug("Found " + userName + " returning nothing");
return null;
}
ArrayList<HashTagAndOccurrence> toSort = new ArrayList<HashTagAndOccurrence>();
if (isInfrastructure) {
_log.debug("****** retrieving hashtags for user VREs");
// different vres could have a same hashtag, we need to merge them long timestampStart = System.currentTimeMillis();
Map<String, Integer> hashtags = new HashMap<String, Integer>();
// get cache reference
TopicsCacheImpl topicsCache = TopicsCacheImpl.getCacheInstance();
hashtagsChart = topicsCache.get(currentScope);
if(hashtagsChart != null){
// we need a map for the couple <hashtag, vre in which it is present> _log.debug("TopTopics for scope " + currentScope + " retrieved from the cache");
// it is needed because later we need to retrieve the most recent feed among the ones
// containing the hashtag itself }
Map<String, List<String>> hashtagsInVres = new HashMap<String, List<String>>(); else{
GroupManager gm = new LiferayGroupManager(); _log.debug("TopTopics for scope " + currentScope + " are not in the cache, evaluating them...");
UserManager um = new LiferayUserManager();
GCubeUser user = um.getUserByUsername(userName); // create array
hashtagsChart = new ArrayList<String>();
// get the reference time
Calendar referenceTime = Calendar.getInstance();
int currentMonth = referenceTime.get(Calendar.MONTH); // jan = 0, ..... dec = 11
referenceTime.set(Calendar.MONTH, currentMonth - WINDOW_SIZE_IN_MONTHS); // the year is automatically decreased if needed
List<GCubeGroup> groups = gm.listGroupsByUser(user.getUserId()); // print it
for (GCubeGroup group : groups) { SimpleDateFormat format = new SimpleDateFormat("yyyy-MM-dd");
if (gm.isVRE(group.getGroupId())) { _log.debug("Reference time for trending topics is " + format.format(referenceTime.getTime()));
String vreid = gm.getInfrastructureScope(group.getGroupId()); //get the scope
Map<String, Integer> map = store.getVREHashtagsWithOccurrenceFilteredByTime(vreid, referenceTime.getTimeInMillis());
// merge the values if needed try {
for (String hashtag : map.keySet()) { //in case the portal is restarted and you have the social home open it will get test.user (no callback to set session info)
//this check just return nothing if that happens
if (userName.compareTo("test.user") == 0) {
_log.debug("Found " + userName + " returning nothing");
return null;
}
ArrayList<HashTagAndOccurrence> toSort = new ArrayList<HashTagAndOccurrence>();
if (isInfrastructure) {
_log.debug("****** retrieving hashtags for user VREs");
if(hashtags.containsKey(hashtag)){ // different vres could have a same hashtag, we need to merge them
Map<String, Integer> hashtags = new HashMap<String, Integer>();
int currentValue = hashtags.get(hashtag); // we need a map for the couple <hashtag, vre in which it is present>
int newValue = currentValue + map.get(hashtag); // it is needed because later we need to retrieve the most recent feed among the ones
// containing the hashtag itself
// remove and re-add Map<String, List<String>> hashtagsInVres = new HashMap<String, List<String>>();
hashtags.remove(hashtag);
hashtags.put(hashtag, newValue);
// get the current list of vres in which the hashtag is present and add this new one GroupManager gm = new LiferayGroupManager();
List<String> vres = hashtagsInVres.get(hashtag); UserManager um = new LiferayUserManager();
vres.add(vreid); GCubeUser user = um.getUserByUsername(userName);
hashtagsInVres.remove(hashtag);
hashtagsInVres.put(hashtag, vres);
}else{ List<GCubeGroup> groups = gm.listGroupsByUser(user.getUserId());
for (GCubeGroup group : groups) {
if (gm.isVRE(group.getGroupId())) {
String vreid = gm.getInfrastructureScope(group.getGroupId()); //get the scope
Map<String, Integer> map = store.getVREHashtagsWithOccurrenceFilteredByTime(vreid, referenceTime.getTimeInMillis());
hashtags.put(hashtag, map.get(hashtag)); // merge the values if needed
for (String hashtag : map.keySet()) {
// put in the hashmap hashtagsInVres too if(hashtags.containsKey(hashtag)){
List<String> vres = new ArrayList<String>();
vres.add(vreid); int currentValue = hashtags.get(hashtag);
hashtagsInVres.put(hashtag, vres); int newValue = currentValue + map.get(hashtag);
// remove and re-add
hashtags.remove(hashtag);
hashtags.put(hashtag, newValue);
// get the current list of vres in which the hashtag is present and add this new one
List<String> vres = hashtagsInVres.get(hashtag);
vres.add(vreid);
hashtagsInVres.remove(hashtag);
hashtagsInVres.put(hashtag, vres);
}else{
hashtags.put(hashtag, map.get(hashtag));
// put in the hashmap hashtagsInVres too
List<String> vres = new ArrayList<String>();
vres.add(vreid);
hashtagsInVres.put(hashtag, vres);
}
} }
} }
} }
// now we need to evaluate score for each element
Map<String, Double> weights = evaluateWeight(hashtags, WINDOW_SIZE_IN_MONTHS, currentMonth, referenceTime, null, hashtagsInVres);
// at the end build the list
for (String hashtag : hashtags.keySet()) {
toSort.add(new HashTagAndOccurrence(hashtag, hashtags.get(hashtag), weights.get(hashtag)));
}
}
//else must be in a VRE scope
else {
String scope = session.getScope();
_log.debug("****** retrieving hashtags for scope " + scope);
Map<String, Integer> hashtags = store.getVREHashtagsWithOccurrenceFilteredByTime(scope, referenceTime.getTimeInMillis());
// now we need to evaluate the wiehgt for each element
Map<String, Double> weights = evaluateWeight(hashtags, WINDOW_SIZE_IN_MONTHS, currentMonth, referenceTime, scope, null);
for (String hashtag : hashtags.keySet()) {
toSort.add(new HashTagAndOccurrence(hashtag, hashtags.get(hashtag), weights.get(hashtag)));
}
} }
// now we need to evaluate score for each element _log.debug("Number of topics retrieved is " + toSort.size());
Map<String, Double> weights = evaluateWeight(hashtags, WINDOW_SIZE_IN_MONTHS, currentMonth, referenceTime, null, hashtagsInVres);
// at the end build the list Collections.sort(toSort); // sort for weight
for (String hashtag : hashtags.keySet()) {
toSort.add(new HashTagAndOccurrence(hashtag, hashtags.get(hashtag), weights.get(hashtag))); for (HashTagAndOccurrence wrapper : toSort) {
_log.debug("Entry is " + wrapper.toString() + " with weight " + wrapper.getWeight());
String hashtag = wrapper.getHashtag();
String href="\"?"+
new String(Base64.encodeBase64(GCubeSocialNetworking.HASHTAG_OID.getBytes()))+"="+
new String(Base64.encodeBase64(hashtag.getBytes()))+"\"";
String hashtagLink = "<a class=\"topiclink\" href=" + href + ">"+hashtag+"</a>";
hashtagsChart.add(hashtagLink);
} }
// update the cache
topicsCache.insert(currentScope, hashtagsChart);
} }
//else must be in a VRE scope catch (Exception e) {
else { e.printStackTrace();
String scope = session.getScope(); return null;
_log.debug("****** retrieving hashtags for scope " + scope);
Map<String, Integer> hashtags = store.getVREHashtagsWithOccurrenceFilteredByTime(scope, referenceTime.getTimeInMillis());
// now we need to evaluate the wiehgt for each element
Map<String, Double> weights = evaluateWeight(hashtags, WINDOW_SIZE_IN_MONTHS, currentMonth, referenceTime, scope, null);
for (String hashtag : hashtags.keySet()) {
toSort.add(new HashTagAndOccurrence(hashtag, hashtags.get(hashtag), weights.get(hashtag)));
}
}
_log.debug("Number of topics retrieved is " + toSort.size());
Collections.sort(toSort); // sort for weight
for (HashTagAndOccurrence wrapper : toSort) {
_log.debug("Entry is " + wrapper.toString() + " with weight " + wrapper.getWeight());
String hashtag = wrapper.getHashtag();
String href="\"?"+
new String(Base64.encodeBase64(GCubeSocialNetworking.HASHTAG_OID.getBytes()))+"="+
new String(Base64.encodeBase64(hashtag.getBytes()))+"\"";
String hashtagLink = "<a class=\"topiclink\" href=" + href + ">"+hashtag+"</a>";
hashtagsChart.add(hashtagLink);
} }
} }
catch (Exception e) {
e.printStackTrace();
return null;
}
long timestampEnd = System.currentTimeMillis() - timestampStart; long timestampEnd = System.currentTimeMillis() - timestampStart;
_log.debug("Overall time to retrieve hastags is " + timestampEnd); _log.debug("Overall time to retrieve hastags is " + timestampEnd + "ms");
return new HashtagsWrapper(isInfrastructure, hashtagsChart); return new HashtagsWrapper(isInfrastructure, hashtagsChart);
} }

View File

@ -0,0 +1,26 @@
package org.gcube.portlets.user.topics.server.cache;
/**
* Cache interface
* @author Costantino Perciante at ISTI-CNR (costantino.perciante@isti.cnr.it)
* @param <K> the key type
* @param <V> the value type
*/
public interface CacheInterface <K,V>{
/**
* Retrieve a value V from the cache
* @param key
* @return
*/
public V get(K key);
/**
* Insert an object V with key K into the cache
* @param key
* @param value
* @return
*/
public boolean insert(K key, V value);
}

View File

@ -0,0 +1,26 @@
package org.gcube.portlets.user.topics.server.cache;
/**
* Utility functions for caches
* @author Costantino Perciante at ISTI-CNR
* (costantino.perciante@isti.cnr.it)
*
*/
public class CacheUtilities {
/**
* Check if the bean expired
* @param beanTimestamp
* @param ttl
* @return <true> if expired, <false> otherwise
*/
public static boolean expired(long beanTimestamp, long ttl){
long currentTime = System.currentTimeMillis();
if((beanTimestamp + ttl) <= currentTime)
return true;
else
return false;
}
}

View File

@ -0,0 +1,40 @@
package org.gcube.portlets.user.topics.server.cache;
/**
* A bean object to be used as value within caches. It contains a TTL value too.
* @author Costantino Perciante at ISTI-CNR
* (costantino.perciante@isti.cnr.it)
*
* @param <V> the value type
*/
public class CacheValueBean <V>{
private V value;
private long TTL;
/**
* @param value
* @param tTL
*/
public CacheValueBean(V value, long ttl) {
super();
this.value = value;
this.TTL = ttl;
}
public V getValue() {
return value;
}
public void setValue(V value) {
this.value = value;
}
public long getTTL() {
return TTL;
}
public void setTTL(long ttl) {
this.TTL = ttl;
}
@Override
public String toString() {
return "CacheValueBean [value=" + value + ", TTL=" + TTL + "]";
}
}

View File

@ -0,0 +1,77 @@
package org.gcube.portlets.user.topics.server.cache;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.Map;
import org.slf4j.LoggerFactory;
/**
* TopTopics cache: the key of each value is the scope
* @author Costantino Perciante at ISTI-CNR
* (costantino.perciante@isti.cnr.it)
*/
public class TopicsCacheImpl implements CacheInterface<String, ArrayList<String>> {
private static final org.slf4j.Logger logger = LoggerFactory.getLogger(TopicsCacheImpl.class);
private static TopicsCacheImpl instance = new TopicsCacheImpl();
/**
* The hashmap
*/
private Map<String, CacheValueBean<ArrayList<String>>> cacheMap;
/**
* Cache entry expires after EXPIRED_AFTER ms
*/
private static final long EXPIRED_AFTER = 1000 * 60 * 2;
/**
* private constructor
*/
private TopicsCacheImpl(){
this.cacheMap = new HashMap<String, CacheValueBean<ArrayList<String>>>();
}
/**
* Retrieve the current cache instance object
* @return
*/
public static TopicsCacheImpl getCacheInstance(){
return instance;
}
@Override
public ArrayList<String> get(String key) {
if(cacheMap.containsKey(key)){
CacheValueBean<ArrayList<String>> bean = cacheMap.get(key);
if(CacheUtilities.expired(bean.getTTL(), EXPIRED_AFTER)){
cacheMap.remove(key);
logger.debug("TopTopics for scope " + key + "expired, return null");
}
else
return bean.getValue();
}
return null;
}
@Override
public boolean insert(String key, ArrayList<String> value) {
CacheValueBean<ArrayList<String>> newBean = new CacheValueBean<ArrayList<String>>(value, System.currentTimeMillis());
if(cacheMap.containsKey(key))
cacheMap.remove(key);
cacheMap.put(key, newBean);
return true;
}
}