From 0043e4051f46c7ada1dc4a2ab757989c7e84e365 Mon Sep 17 00:00:00 2001 From: Miriam Baglioni Date: Thu, 5 Dec 2024 18:44:06 +0100 Subject: [PATCH] [oalex] renaming --- strings.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/strings.py b/strings.py index 250d659..dea9c43 100644 --- a/strings.py +++ b/strings.py @@ -69,7 +69,7 @@ exploded = spark.read.json(folder_path) \ col("rors").alias("OAlex"), explode(col("raw_aff_string")).alias("affiliation") #this allows to split all the raw_aff_string and to parallelize better ) -affs = explode \ +affs = exploded \ .select("affiliation") \ .distinct() \ .withColumn("Matchings", oalex_affro_udf(col("affiliation")))