diff --git a/data/beginners_kit.ipynb b/data/beginners_kit.ipynb index ea108ce..2fb7ef2 100644 --- a/data/beginners_kit.ipynb +++ b/data/beginners_kit.ipynb @@ -34,20 +34,20 @@ }, "outputs": [], "source": [ - "!rm -rf data\n", - "!mkdir data\n", + "# !rm -rf data\n", + "# !mkdir data\n", "\n", - "import os\n", - "base_url = \"https://zenodo.org/record/7490192/files/\"\n", + "# import os\n", + "# base_url = \"https://zenodo.org/record/7490192/files/\"\n", "\n", "\n", - "items =[\"communities_infrastructures.tar\",\"dataset.tar\",\"datasource.tar\",\"organization.tar\",\"otherresearchproduct.tar\",\"project.tar\",\"publication.tar\",\"relation.tar\", \"software.tar\"]\n", + "# items =[\"communities_infrastructures.tar\",\"dataset.tar\",\"datasource.tar\",\"organization.tar\",\"otherresearchproduct.tar\",\"project.tar\",\"publication.tar\",\"relation.tar\", \"software.tar\"]\n", "\n", - "for item in items: \n", - " print(f\"Downloading {item}\")\n", - " os.system(f'wget {base_url}{item}?download=1 -O data/{item}')\n", - " print(f\"Extracting {item}\")\n", - " os.system(f'tar -xf data/{item} -C data/; rm data/{item}')" + "# for item in items: \n", + "# print(f\"Downloading {item}\")\n", + "# os.system(f'wget {base_url}{item}?download=1 -O data/{item}')\n", + "# print(f\"Extracting {item}\")\n", + "# os.system(f'tar -xf data/{item} -C data/; rm data/{item}')" ] }, { @@ -55,7 +55,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "## Have a look at the input data" + "## Load the datasets" ] }, { @@ -279,7 +279,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "All the exercises follow the following template.\n", + "All the exercises follow the template below.\n", "```python\n", "query = \"\"\"\n", "SELECT \n", @@ -295,7 +295,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "### **Task**: Split relations based on their semantics and compute their numbers; sort results in descending order, limit to the first 20. " + "### **Task**: Split relations based on their semantics and count them; sort results in descending order, limit to the first 20. " ] }, { @@ -323,7 +323,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "### **Task:** Show the most occurring publication subject term; sort results in descending order; limit to the first 20" + "### **Task:** Show the most occurring publication subjects; sort results in descending order; limit to the first 20" ] }, { @@ -356,7 +356,7 @@ "tags": [] }, "source": [ - "### **Task:** Show the most co-occurring publication subjects from controlled vocabularies (i.e. scheme != 'keyword') avoiding repetition; limit to the first 20" + "### **Task:** Show the most co-occurring publication subjects from controlled vocabularies (i.e., scheme != 'keyword') avoiding repetition; limit to the first 20" ] }, {