Master branch updates from beta September 2023 #337
|
@ -112,7 +112,7 @@ public class CreateActionSetSparkJob implements Serializable {
|
|||
final String cited = ID_PREFIX
|
||||
+ IdentifierFactory.md5(CleaningFunctions.normalizePidValue("doi", value.getCited()));
|
||||
|
||||
if(!citing.equals(cited)){
|
||||
if (!citing.equals(cited)) {
|
||||
relationList
|
||||
.addAll(
|
||||
getRelations(
|
||||
|
@ -123,7 +123,8 @@ public class CreateActionSetSparkJob implements Serializable {
|
|||
citing = ID_PREFIX + IdentifierFactory
|
||||
.md5(
|
||||
CleaningFunctions
|
||||
.normalizePidValue("doi", value.getCiting().substring(0, value.getCiting().indexOf(".refs"))));
|
||||
.normalizePidValue(
|
||||
"doi", value.getCiting().substring(0, value.getCiting().indexOf(".refs"))));
|
||||
relationList.addAll(getRelations(citing, cited));
|
||||
}
|
||||
}
|
||||
|
|
|
@ -72,7 +72,7 @@ public class ReadCOCI implements Serializable {
|
|||
String outputPath,
|
||||
String delimiter) throws IOException {
|
||||
|
||||
for(String inputFile : inputFiles){
|
||||
for (String inputFile : inputFiles) {
|
||||
String p_string = workingPath + "/" + inputFile + ".gz";
|
||||
|
||||
Dataset<Row> cociData = spark
|
||||
|
|
|
@ -12,7 +12,6 @@ public class COCI implements Serializable {
|
|||
|
||||
private String cited;
|
||||
|
||||
|
||||
public String getOci() {
|
||||
return oci;
|
||||
}
|
||||
|
@ -37,5 +36,4 @@ public class COCI implements Serializable {
|
|||
this.cited = cited;
|
||||
}
|
||||
|
||||
|
||||
}
|
||||
|
|
|
@ -122,8 +122,6 @@ public class ReadCOCITest {
|
|||
"-inputFile", "input1;input2;input3;input4;input5"
|
||||
});
|
||||
|
||||
|
||||
|
||||
final JavaSparkContext sc = JavaSparkContext.fromSparkContext(spark.sparkContext());
|
||||
|
||||
JavaRDD<COCI> tmp = sc
|
||||
|
|
Loading…
Reference in New Issue