Added logic to exclude harvesting in some cases
git-svn-id: https://svn.d4science.research-infrastructures.eu/gcube/trunk/accounting/accounting-dashboard-harvester-se-plugin@169212 82a268e6-3cf1-43bd-a215-b396298e98cf
This commit is contained in:
parent
248bb98b88
commit
13c74dc4f9
|
@ -3,6 +3,7 @@ package org.gcube.dataharvest;
|
||||||
import java.io.IOException;
|
import java.io.IOException;
|
||||||
import java.io.InputStream;
|
import java.io.InputStream;
|
||||||
import java.util.ArrayList;
|
import java.util.ArrayList;
|
||||||
|
import java.util.Calendar;
|
||||||
import java.util.Date;
|
import java.util.Date;
|
||||||
import java.util.List;
|
import java.util.List;
|
||||||
import java.util.Map;
|
import java.util.Map;
|
||||||
|
@ -45,6 +46,7 @@ public class AccountingDataHarvesterPlugin extends Plugin<DataHarvestPluginDecla
|
||||||
public static final String GET_VRE_USERS_INPUT_PARAMETER = "getVREUsers";
|
public static final String GET_VRE_USERS_INPUT_PARAMETER = "getVREUsers";
|
||||||
public static final String DRY_RUN_INPUT_PARAMETER = "dryRun";
|
public static final String DRY_RUN_INPUT_PARAMETER = "dryRun";
|
||||||
|
|
||||||
|
public static final String SO_BIG_DATA_VO = "/d4science.research-infrastructures.eu/SoBigData";
|
||||||
public static final String SO_BIG_DATA_CATALOGUE_CONTEXT = "/d4science.research-infrastructures.eu/SoBigData/ResourceCatalogue";
|
public static final String SO_BIG_DATA_CATALOGUE_CONTEXT = "/d4science.research-infrastructures.eu/SoBigData/ResourceCatalogue";
|
||||||
public static final String TAGME_CONTEXT = "/d4science.research-infrastructures.eu/SoBigData/TagMe";
|
public static final String TAGME_CONTEXT = "/d4science.research-infrastructures.eu/SoBigData/TagMe";
|
||||||
|
|
||||||
|
@ -184,9 +186,13 @@ public class AccountingDataHarvesterPlugin extends Plugin<DataHarvestPluginDecla
|
||||||
|
|
||||||
|
|
||||||
try {
|
try {
|
||||||
|
if(context.startsWith(SO_BIG_DATA_VO) && start.before(DateUtils.getStartCalendar(2018, Calendar.APRIL, 1).getTime())) {
|
||||||
|
logger.info("Not Harvesting VREs Accesses for {} from {} to {}", context, DateUtils.format(start), DateUtils.format(end));
|
||||||
|
} else {
|
||||||
// Collecting Google Analytics Data for VREs Accesses
|
// Collecting Google Analytics Data for VREs Accesses
|
||||||
List<HarvestedData> harvested = vreAccessesHarvester.getData();
|
List<HarvestedData> harvested = vreAccessesHarvester.getData();
|
||||||
data.addAll(harvested);
|
data.addAll(harvested);
|
||||||
|
}
|
||||||
} catch(Exception e) {
|
} catch(Exception e) {
|
||||||
logger.error("Error harvesting Social Interactions for {}", context, e);
|
logger.error("Error harvesting Social Interactions for {}", context, e);
|
||||||
}
|
}
|
||||||
|
@ -205,7 +211,8 @@ public class AccountingDataHarvesterPlugin extends Plugin<DataHarvestPluginDecla
|
||||||
// Collecting info on VRE users
|
// Collecting info on VRE users
|
||||||
if(getVREUsers) {
|
if(getVREUsers) {
|
||||||
// Harvesting Users only for VREs (not for VO and ROOT which is the sum of the children contexts)
|
// Harvesting Users only for VREs (not for VO and ROOT which is the sum of the children contexts)
|
||||||
if(scopeBean.is(Type.VRE)) {
|
// The VREUsers can be only Harvested for the lst month
|
||||||
|
if(scopeBean.is(Type.VRE) && start.equals(DateUtils.getPreviousPeriod(measureType).getTime())) {
|
||||||
VREUsersHarvester vreUsersHarvester = new VREUsersHarvester(start, end);
|
VREUsersHarvester vreUsersHarvester = new VREUsersHarvester(start, end);
|
||||||
List<HarvestedData> harvested = vreUsersHarvester.getData();
|
List<HarvestedData> harvested = vreUsersHarvester.getData();
|
||||||
data.addAll(harvested);
|
data.addAll(harvested);
|
||||||
|
|
|
@ -99,11 +99,10 @@ public class VREAccessesHarvester extends BasicHarvester {
|
||||||
String pagePath = row.getPagePath();
|
String pagePath = row.getPagePath();
|
||||||
if(!pagePath.contains("_redirect=/group")) {
|
if(!pagePath.contains("_redirect=/group")) {
|
||||||
if(pagePath.endsWith(lowerCasedContext)) {
|
if(pagePath.endsWith(lowerCasedContext)) {
|
||||||
System.out.println("match end->"+pagePath);
|
logger.trace("Matched endsWith({}) : {}", lowerCasedContext, pagePath);
|
||||||
measure++;
|
measure++;
|
||||||
}
|
} else if(pagePath.contains(case1) || pagePath.contains(case2)) {
|
||||||
else if (pagePath.contains(case1) || pagePath.contains(case2) ) {
|
logger.trace("Matched contains({}) || contains({}) : {}", case1, case2, pagePath);
|
||||||
System.out.println("match compare->"+pagePath);
|
|
||||||
measure++;
|
measure++;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -127,23 +126,23 @@ public class VREAccessesHarvester extends BasicHarvester {
|
||||||
*/
|
*/
|
||||||
private static List<VREAccessesReportRow> getAllAccesses(Date start, Date end) throws Exception {
|
private static List<VREAccessesReportRow> getAllAccesses(Date start, Date end) throws Exception {
|
||||||
DateRange dateRange = getDateRangeForAnalytics(start, end);
|
DateRange dateRange = getDateRangeForAnalytics(start, end);
|
||||||
System.out.println("getting accesses in this time range: " + dateRange.toPrettyString());
|
logger.trace("Getting accesses in this time range {}", dateRange.toPrettyString());
|
||||||
|
|
||||||
AnalyticsReportCredentials credentialsFromD4S = getAuthorisedApplicationInfoFromIs();
|
AnalyticsReportCredentials credentialsFromD4S = getAuthorisedApplicationInfoFromIs();
|
||||||
AnalyticsReporting service = initializeAnalyticsReporting(credentialsFromD4S);
|
AnalyticsReporting service = initializeAnalyticsReporting(credentialsFromD4S);
|
||||||
HashMap<String, GetReportsResponse> responses = getReportResponses(service, credentialsFromD4S.getViewIds(), dateRange);
|
HashMap<String,GetReportsResponse> responses = getReportResponses(service, credentialsFromD4S.getViewIds(),
|
||||||
|
dateRange);
|
||||||
List<VREAccessesReportRow> totalAccesses = new ArrayList<>();
|
List<VREAccessesReportRow> totalAccesses = new ArrayList<>();
|
||||||
|
|
||||||
for(String view : responses.keySet()) {
|
for(String view : responses.keySet()) {
|
||||||
List<VREAccessesReportRow> viewReport = parseResponse(view, responses.get(view));
|
List<VREAccessesReportRow> viewReport = parseResponse(view, responses.get(view));
|
||||||
System.out.println("got " + viewReport.size() + " entries from view id= "+view);
|
logger.trace("Got {} entries from view id={}", viewReport.size(), view);
|
||||||
totalAccesses.addAll(viewReport);
|
totalAccesses.addAll(viewReport);
|
||||||
}
|
}
|
||||||
System.out.println("Merged in " + totalAccesses.size() + " toal entries from all views");
|
logger.trace("Merged in {} total entries from all views", totalAccesses.size());
|
||||||
return totalAccesses;
|
return totalAccesses;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* Initializes an Analytics Reporting API V4 service object.
|
* Initializes an Analytics Reporting API V4 service object.
|
||||||
*
|
*
|
||||||
|
@ -151,7 +150,8 @@ public class VREAccessesHarvester extends BasicHarvester {
|
||||||
* @throws IOException
|
* @throws IOException
|
||||||
* @throws GeneralSecurityException
|
* @throws GeneralSecurityException
|
||||||
*/
|
*/
|
||||||
private static AnalyticsReporting initializeAnalyticsReporting(AnalyticsReportCredentials cred) throws GeneralSecurityException, IOException {
|
private static AnalyticsReporting initializeAnalyticsReporting(AnalyticsReportCredentials cred)
|
||||||
|
throws GeneralSecurityException, IOException {
|
||||||
HttpTransport httpTransport = GoogleNetHttpTransport.newTrustedTransport();
|
HttpTransport httpTransport = GoogleNetHttpTransport.newTrustedTransport();
|
||||||
GoogleCredential credential = fromD4SServiceEndpoint(cred).createScoped(AnalyticsReportingScopes.all());
|
GoogleCredential credential = fromD4SServiceEndpoint(cred).createScoped(AnalyticsReportingScopes.all());
|
||||||
|
|
||||||
|
@ -167,31 +167,26 @@ public class VREAccessesHarvester extends BasicHarvester {
|
||||||
* @return GetReportResponse The Analytics Reporting API V4 response.
|
* @return GetReportResponse The Analytics Reporting API V4 response.
|
||||||
* @throws IOException
|
* @throws IOException
|
||||||
*/
|
*/
|
||||||
private static HashMap<String, GetReportsResponse> getReportResponses(AnalyticsReporting service, List<String> viewIDs, DateRange dateRange) throws IOException {
|
private static HashMap<String,GetReportsResponse> getReportResponses(AnalyticsReporting service,
|
||||||
|
List<String> viewIDs, DateRange dateRange) throws IOException {
|
||||||
|
|
||||||
HashMap<String,GetReportsResponse> reports = new HashMap<>();
|
HashMap<String,GetReportsResponse> reports = new HashMap<>();
|
||||||
|
|
||||||
// Create the Metrics object.
|
// Create the Metrics object.
|
||||||
Metric sessions = new Metric()
|
Metric sessions = new Metric().setExpression("ga:pageviews").setAlias("pages");
|
||||||
.setExpression("ga:pageviews")
|
|
||||||
.setAlias("pages");
|
|
||||||
Dimension pageTitle = new Dimension().setName("ga:pagePath");
|
Dimension pageTitle = new Dimension().setName("ga:pagePath");
|
||||||
|
|
||||||
for(String view : viewIDs) {
|
for(String view : viewIDs) {
|
||||||
logger.info("Getting data from Google Analytics for viewid: " + view);
|
logger.info("Getting data from Google Analytics for viewid: " + view);
|
||||||
// Create the ReportRequest object.
|
// Create the ReportRequest object.
|
||||||
ReportRequest request = new ReportRequest()
|
ReportRequest request = new ReportRequest().setViewId(view).setDateRanges(Arrays.asList(dateRange))
|
||||||
.setViewId(view)
|
.setMetrics(Arrays.asList(sessions)).setDimensions(Arrays.asList(pageTitle));
|
||||||
.setDateRanges(Arrays.asList(dateRange))
|
|
||||||
.setMetrics(Arrays.asList(sessions))
|
|
||||||
.setDimensions(Arrays.asList(pageTitle));
|
|
||||||
|
|
||||||
ArrayList<ReportRequest> requests = new ArrayList<ReportRequest>();
|
ArrayList<ReportRequest> requests = new ArrayList<ReportRequest>();
|
||||||
requests.add(request);
|
requests.add(request);
|
||||||
|
|
||||||
// Create the GetReportsRequest object.
|
// Create the GetReportsRequest object.
|
||||||
GetReportsRequest getReport = new GetReportsRequest()
|
GetReportsRequest getReport = new GetReportsRequest().setReportRequests(requests);
|
||||||
.setReportRequests(requests);
|
|
||||||
|
|
||||||
// Call the batchGet method.
|
// Call the batchGet method.
|
||||||
GetReportsResponse response = service.reports().batchGet(getReport).execute();
|
GetReportsResponse response = service.reports().batchGet(getReport).execute();
|
||||||
|
@ -207,7 +202,7 @@ public class VREAccessesHarvester extends BasicHarvester {
|
||||||
* @param response An Analytics Reporting API V4 response.
|
* @param response An Analytics Reporting API V4 response.
|
||||||
*/
|
*/
|
||||||
private static List<VREAccessesReportRow> parseResponse(String viewId, GetReportsResponse response) {
|
private static List<VREAccessesReportRow> parseResponse(String viewId, GetReportsResponse response) {
|
||||||
System.out.println("\n*** parsing Response for " + viewId);
|
logger.trace("\n*** parsing Response for {}", viewId);
|
||||||
|
|
||||||
List<VREAccessesReportRow> toReturn = new ArrayList<>();
|
List<VREAccessesReportRow> toReturn = new ArrayList<>();
|
||||||
|
|
||||||
|
@ -219,8 +214,7 @@ public class VREAccessesHarvester extends BasicHarvester {
|
||||||
|
|
||||||
if(rows == null) {
|
if(rows == null) {
|
||||||
logger.warn("No data found for " + viewId);
|
logger.warn("No data found for " + viewId);
|
||||||
}
|
} else
|
||||||
else
|
|
||||||
for(ReportRow row : rows) {
|
for(ReportRow row : rows) {
|
||||||
List<String> dimensions = row.getDimensions();
|
List<String> dimensions = row.getDimensions();
|
||||||
List<DateRangeValues> metrics = row.getMetrics();
|
List<DateRangeValues> metrics = row.getMetrics();
|
||||||
|
@ -228,7 +222,7 @@ public class VREAccessesHarvester extends BasicHarvester {
|
||||||
VREAccessesReportRow var = new VREAccessesReportRow();
|
VREAccessesReportRow var = new VREAccessesReportRow();
|
||||||
boolean validEntry = false;
|
boolean validEntry = false;
|
||||||
for(int i = 0; i < dimensionHeaders.size() && i < dimensions.size(); i++) {
|
for(int i = 0; i < dimensionHeaders.size() && i < dimensions.size(); i++) {
|
||||||
//System.out.println(dimensionHeaders.get(i) + ": " + dimensions.get(i));
|
//logger.trace("{} : {}", dimensionHeaders.get(i), dimensions.get(i));
|
||||||
String pagePath = dimensions.get(i);
|
String pagePath = dimensions.get(i);
|
||||||
if(pagePath.startsWith("/group") || pagePath.startsWith("/web")) {
|
if(pagePath.startsWith("/group") || pagePath.startsWith("/web")) {
|
||||||
var.setPagePath(dimensions.get(i));
|
var.setPagePath(dimensions.get(i));
|
||||||
|
@ -249,6 +243,7 @@ public class VREAccessesHarvester extends BasicHarvester {
|
||||||
}
|
}
|
||||||
return toReturn;
|
return toReturn;
|
||||||
}
|
}
|
||||||
|
|
||||||
private static GoogleCredential fromD4SServiceEndpoint(AnalyticsReportCredentials cred) throws IOException {
|
private static GoogleCredential fromD4SServiceEndpoint(AnalyticsReportCredentials cred) throws IOException {
|
||||||
|
|
||||||
String clientId = cred.getClientId();
|
String clientId = cred.getClientId();
|
||||||
|
@ -258,8 +253,7 @@ public class VREAccessesHarvester extends BasicHarvester {
|
||||||
String tokenUri = cred.getTokenUri();
|
String tokenUri = cred.getTokenUri();
|
||||||
String projectId = cred.getProjectId();
|
String projectId = cred.getProjectId();
|
||||||
|
|
||||||
if (clientId == null || clientEmail == null || privateKeyPem == null
|
if(clientId == null || clientEmail == null || privateKeyPem == null || privateKeyId == null) {
|
||||||
|| privateKeyId == null) {
|
|
||||||
throw new IOException("Error reading service account credential from stream, "
|
throw new IOException("Error reading service account credential from stream, "
|
||||||
+ "expecting 'client_id', 'client_email', 'private_key' and 'private_key_id'.");
|
+ "expecting 'client_id', 'client_email', 'private_key' and 'private_key_id'.");
|
||||||
}
|
}
|
||||||
|
@ -268,12 +262,9 @@ public class VREAccessesHarvester extends BasicHarvester {
|
||||||
|
|
||||||
Collection<String> emptyScopes = Collections.emptyList();
|
Collection<String> emptyScopes = Collections.emptyList();
|
||||||
|
|
||||||
Builder credentialBuilder = new GoogleCredential.Builder()
|
Builder credentialBuilder = new GoogleCredential.Builder().setTransport(Utils.getDefaultTransport())
|
||||||
.setTransport( Utils.getDefaultTransport())
|
.setJsonFactory(Utils.getDefaultJsonFactory()).setServiceAccountId(clientEmail)
|
||||||
.setJsonFactory(Utils.getDefaultJsonFactory())
|
.setServiceAccountScopes(emptyScopes).setServiceAccountPrivateKey(privateKey)
|
||||||
.setServiceAccountId(clientEmail)
|
|
||||||
.setServiceAccountScopes(emptyScopes)
|
|
||||||
.setServiceAccountPrivateKey(privateKey)
|
|
||||||
.setServiceAccountPrivateKeyId(privateKeyId);
|
.setServiceAccountPrivateKeyId(privateKeyId);
|
||||||
|
|
||||||
if(tokenUri != null) {
|
if(tokenUri != null) {
|
||||||
|
@ -309,7 +300,8 @@ public class VREAccessesHarvester extends BasicHarvester {
|
||||||
throw new IOException("Unexpected exception reading PKCS data", unexpectedException);
|
throw new IOException("Unexpected exception reading PKCS data", unexpectedException);
|
||||||
}
|
}
|
||||||
|
|
||||||
private static List<ServiceEndpoint> getAnalyticsReportingConfigurationFromIS(String infrastructureScope) throws Exception {
|
private static List<ServiceEndpoint> getAnalyticsReportingConfigurationFromIS(String infrastructureScope)
|
||||||
|
throws Exception {
|
||||||
String scope = infrastructureScope;
|
String scope = infrastructureScope;
|
||||||
String currScope = ScopeProvider.instance.get();
|
String currScope = ScopeProvider.instance.get();
|
||||||
ScopeProvider.instance.set(scope);
|
ScopeProvider.instance.set(scope);
|
||||||
|
@ -321,6 +313,7 @@ public class VREAccessesHarvester extends BasicHarvester {
|
||||||
ScopeProvider.instance.set(currScope);
|
ScopeProvider.instance.set(currScope);
|
||||||
return toReturn;
|
return toReturn;
|
||||||
}
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* l
|
* l
|
||||||
* @throws Exception
|
* @throws Exception
|
||||||
|
@ -332,12 +325,12 @@ public class VREAccessesHarvester extends BasicHarvester {
|
||||||
try {
|
try {
|
||||||
List<ServiceEndpoint> list = getAnalyticsReportingConfigurationFromIS(context);
|
List<ServiceEndpoint> list = getAnalyticsReportingConfigurationFromIS(context);
|
||||||
if(list.size() > 1) {
|
if(list.size() > 1) {
|
||||||
logger.error("Too many Service Endpoints having name " + SERVICE_ENDPOINT_NAME +" in this scope having Category " + SERVICE_ENDPOINT_CATEGORY);
|
logger.error("Too many Service Endpoints having name " + SERVICE_ENDPOINT_NAME
|
||||||
}
|
+ " in this scope having Category " + SERVICE_ENDPOINT_CATEGORY);
|
||||||
else if (list.size() == 0){
|
} else if(list.size() == 0) {
|
||||||
logger.warn("There is no Service Endpoint having name " + SERVICE_ENDPOINT_NAME +" and Category " + SERVICE_ENDPOINT_CATEGORY + " in this context: " + context);
|
logger.warn("There is no Service Endpoint having name " + SERVICE_ENDPOINT_NAME + " and Category "
|
||||||
}
|
+ SERVICE_ENDPOINT_CATEGORY + " in this context: " + context);
|
||||||
else {
|
} else {
|
||||||
|
|
||||||
for(ServiceEndpoint res : list) {
|
for(ServiceEndpoint res : list) {
|
||||||
reportCredentials.setTokenUri(res.profile().runtime().hostedOn());
|
reportCredentials.setTokenUri(res.profile().runtime().hostedOn());
|
||||||
|
@ -370,9 +363,11 @@ public class VREAccessesHarvester extends BasicHarvester {
|
||||||
}
|
}
|
||||||
return reportCredentials;
|
return reportCredentials;
|
||||||
}
|
}
|
||||||
|
|
||||||
private static LocalDate asLocalDate(Date date) {
|
private static LocalDate asLocalDate(Date date) {
|
||||||
return Instant.ofEpochMilli(date.getTime()).atZone(ZoneId.systemDefault()).toLocalDate();
|
return Instant.ofEpochMilli(date.getTime()).atZone(ZoneId.systemDefault()).toLocalDate();
|
||||||
}
|
}
|
||||||
|
|
||||||
private static DateRange getDateRangeForAnalytics(Date start, Date end) {
|
private static DateRange getDateRangeForAnalytics(Date start, Date end) {
|
||||||
DateTimeFormatter formatter = DateTimeFormatter.ofPattern("yyyy-MM-dd"); //required by Analytics
|
DateTimeFormatter formatter = DateTimeFormatter.ofPattern("yyyy-MM-dd"); //required by Analytics
|
||||||
String startDate = asLocalDate(start).format(formatter);
|
String startDate = asLocalDate(start).format(formatter);
|
||||||
|
|
|
@ -1,6 +1,7 @@
|
||||||
package org.gcube.dataharvest;
|
package org.gcube.dataharvest;
|
||||||
|
|
||||||
import java.util.ArrayList;
|
import java.util.ArrayList;
|
||||||
|
import java.util.Calendar;
|
||||||
import java.util.Date;
|
import java.util.Date;
|
||||||
import java.util.HashMap;
|
import java.util.HashMap;
|
||||||
import java.util.LinkedHashMap;
|
import java.util.LinkedHashMap;
|
||||||
|
@ -85,10 +86,11 @@ public class AccountingDataHarvesterPluginTest extends ContextTest {
|
||||||
|
|
||||||
@Test
|
@Test
|
||||||
public void testScopeBean() throws Exception {
|
public void testScopeBean() throws Exception {
|
||||||
|
org.gcube.dataharvest.utils.Utils.setContext(ROOT);
|
||||||
SortedSet<String> contexts = getContexts();
|
SortedSet<String> contexts = getContexts();
|
||||||
for(String context : contexts) {
|
for(String context : contexts) {
|
||||||
ScopeBean scopeBean = new ScopeBean(context);
|
ScopeBean scopeBean = new ScopeBean(context);
|
||||||
logger.debug("Name {}, FullName {}", scopeBean.name(), scopeBean.toString());
|
logger.debug("FullName {} - Name {}", scopeBean.toString(), scopeBean.name());
|
||||||
}
|
}
|
||||||
|
|
||||||
}
|
}
|
||||||
|
@ -147,9 +149,13 @@ public class AccountingDataHarvesterPluginTest extends ContextTest {
|
||||||
}
|
}
|
||||||
|
|
||||||
try {
|
try {
|
||||||
|
if(context.startsWith(AccountingDataHarvesterPlugin.SO_BIG_DATA_VO) && start.before(DateUtils.getStartCalendar(2018, Calendar.APRIL, 1).getTime())) {
|
||||||
|
logger.info("Not Harvesting VREs Accesses for {} from {} to {}", context, DateUtils.format(start), DateUtils.format(end));
|
||||||
|
} else {
|
||||||
// Collecting Google Analytics Data for VREs Accesses
|
// Collecting Google Analytics Data for VREs Accesses
|
||||||
List<HarvestedData> harvested = vreAccessesHarvester.getData();
|
List<HarvestedData> harvested = vreAccessesHarvester.getData();
|
||||||
data.addAll(harvested);
|
data.addAll(harvested);
|
||||||
|
}
|
||||||
} catch(Exception e) {
|
} catch(Exception e) {
|
||||||
logger.error("Error harvesting Social Interactions for {}", context, e);
|
logger.error("Error harvesting Social Interactions for {}", context, e);
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in New Issue