diff --git a/notebooks/Classification_BertFineTuning.ipynb b/notebooks/Classification_BertFineTuning.ipynb
index 90aad20383f161edfcea6e00d84d5c9275220aa3..6860b3dc97d812063b900cfe1d15562e97d71fd8 100644
--- a/notebooks/Classification_BertFineTuning.ipynb
+++ b/notebooks/Classification_BertFineTuning.ipynb
@@ -227,6 +227,16 @@
     "!wget https://geode.liris.cnrs.fr/EDdA-Classification/datasets/test_set.tsv"
    ]
   },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "!wget https://geode.liris.cnrs.fr/EDdA-Classification/datasets/training_set_superdomains.tsv\n",
+    "!wget https://geode.liris.cnrs.fr/EDdA-Classification/datasets/test_set_superdomains.tsv"
+   ]
+  },
   {
    "cell_type": "markdown",
    "metadata": {
@@ -244,8 +254,11 @@
    },
    "outputs": [],
    "source": [
-    "train_path = '../data/training_set.tsv'\n",
-    "test_path = '../data/test_set.tsv'"
+    "#train_path = '../data/training_set.tsv'\n",
+    "#test_path = '../data/test_set.tsv'\n",
+    "\n",
+    "train_path = '../data/training_set_superdomains.tsv'\n",
+    "test_path = '../data/test_set_superdomains.tsv'"
    ]
   },
   {
@@ -298,7 +311,8 @@
    "outputs": [],
    "source": [
     "columnText = 'contentWithoutClass'\n",
-    "columnClass = 'ensemble_domaine_enccre'\n",
+    "#columnClass = 'ensemble_domaine_enccre'\n",
+    "columnClass = 'super_domain'\n",
     "\n",
     "maxOfInstancePerClass = 10000\n",
     "\n",