diff --git a/0-TECHNIQUE/greekLemmatization/lemmatisationAp.ipynb b/0-TECHNIQUE/greekLemmatization/lemmatisationAp.ipynb index 178b27adf9390219f9905a4b026f68dda82b0b8e..194dea88e600370915ea35a5a560b7c4ba341137 100644 --- a/0-TECHNIQUE/greekLemmatization/lemmatisationAp.ipynb +++ b/0-TECHNIQUE/greekLemmatization/lemmatisationAp.ipynb @@ -141,23 +141,145 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 23, "id": "6af10a3c-fff0-4537-8f15-3a82d9a2a3d0", "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/html": [ + "<div>\n", + "<style scoped>\n", + " .dataframe tbody tr th:only-of-type {\n", + " vertical-align: middle;\n", + " }\n", + "\n", + " .dataframe tbody tr th {\n", + " vertical-align: top;\n", + " }\n", + "\n", + " .dataframe thead th {\n", + " text-align: right;\n", + " }\n", + "</style>\n", + "<table border=\"1\" class=\"dataframe\">\n", + " <thead>\n", + " <tr style=\"text-align: right;\">\n", + " <th></th>\n", + " <th>book</th>\n", + " <th>fragment</th>\n", + " <th>author</th>\n", + " <th>text</th>\n", + " <th>keyword_code</th>\n", + " <th>text_lemmatized</th>\n", + " </tr>\n", + " </thead>\n", + " <tbody>\n", + " <tr>\n", + " <th>0</th>\n", + " <td>1</td>\n", + " <td>1</td>\n", + " <td>anonymous</td>\n", + " <td>\\n ἃς οἱ πλάνοι καθεῖλον ...</td>\n", + " <td>['https://anthologiagraeca.org/api/keywords/11...</td>\n", + " <td>á½…Ï‚ ὠπλάσσω καθαιÏÎω ἔνθατος εἰκών ἄναξ στηλόω...</td>\n", + " </tr>\n", + " <tr>\n", + " <th>1</th>\n", + " <td>1</td>\n", + " <td>2</td>\n", + " <td>anonymous</td>\n", + " <td>\\n θεῖος Ἰουστῖνος, Σοφίη...</td>\n", + " <td>['https://anthologiagraeca.org/api/keywords/11...</td>\n", + " <td>θεῖος Ἰουστῖνος , Σοφίης πόσις , á½…Ï‚ πόÏω ΧÏιστ...</td>\n", + " </tr>\n", + " <tr>\n", + " <th>2</th>\n", + " <td>1</td>\n", + " <td>3</td>\n", + " <td>anonymous</td>\n", + " <td>\\n ὠπÏὶν Ἰουστῖνος πεÏικα...</td>\n", + " <td>['https://anthologiagraeca.org/api/keywords/11...</td>\n", + " <td>ὠπÏίν Ἰουστῖνος πεÏικαλλής δÎομαι ναός οὗτος ...</td>\n", + " </tr>\n", + " <tr>\n", + " <th>3</th>\n", + " <td>1</td>\n", + " <td>4</td>\n", + " <td>anonymous</td>\n", + " <td>\\n τοῦτον Ἰωάννῃ, ΧÏιστοῦ...</td>\n", + " <td>['https://anthologiagraeca.org/api/keywords/11...</td>\n", + " <td>οὗτος ἸωννεÏÏ‚ , ΧÏιστός μÎγας θεÏάπων , ΣτοÏδι...</td>\n", + " </tr>\n", + " <tr>\n", + " <th>4</th>\n", + " <td>1</td>\n", + " <td>5</td>\n", + " <td>anonymous</td>\n", + " <td>\\n τόνδε Θεῷ κάμες οἶκον, ...</td>\n", + " <td>['https://anthologiagraeca.org/api/keywords/11...</td>\n", + " <td>ὅδε Θεός κάμνω οἶκος , Ἀμάντιος , μεσσόθι πόντ...</td>\n", + " </tr>\n", + " </tbody>\n", + "</table>\n", + "</div>" + ], + "text/plain": [ + " book fragment author \\\n", + "0 1 1 anonymous \n", + "1 1 2 anonymous \n", + "2 1 3 anonymous \n", + "3 1 4 anonymous \n", + "4 1 5 anonymous \n", + "\n", + " text \\\n", + "0 \\n ἃς οἱ πλάνοι καθεῖλον ... \n", + "1 \\n θεῖος Ἰουστῖνος, Σοφίη... \n", + "2 \\n ὠπÏὶν Ἰουστῖνος πεÏικα... \n", + "3 \\n τοῦτον Ἰωάννῃ, ΧÏιστοῦ... \n", + "4 \\n τόνδε Θεῷ κάμες οἶκον, ... \n", + "\n", + " keyword_code \\\n", + "0 ['https://anthologiagraeca.org/api/keywords/11... \n", + "1 ['https://anthologiagraeca.org/api/keywords/11... \n", + "2 ['https://anthologiagraeca.org/api/keywords/11... \n", + "3 ['https://anthologiagraeca.org/api/keywords/11... \n", + "4 ['https://anthologiagraeca.org/api/keywords/11... \n", + "\n", + " text_lemmatized \n", + "0 á½…Ï‚ ὠπλάσσω καθαιÏÎω ἔνθατος εἰκών ἄναξ στηλόω... \n", + "1 θεῖος Ἰουστῖνος , Σοφίης πόσις , á½…Ï‚ πόÏω ΧÏιστ... \n", + "2 ὠπÏίν Ἰουστῖνος πεÏικαλλής δÎομαι ναός οὗτος ... \n", + "3 οὗτος ἸωννεÏÏ‚ , ΧÏιστός μÎγας θεÏάπων , ΣτοÏδι... \n", + "4 ὅδε Θεός κάμνω οἶκος , Ἀμάντιος , μεσσόθι πόντ... " + ] + }, + "execution_count": 23, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "df.head()" ] }, { "cell_type": "code", - "execution_count": null, + "execution_count": 24, "id": "9d7e049d-9bf1-44cc-b528-421deeec48cc", "metadata": {}, "outputs": [], "source": [ "df.to_csv('../../DONNEES/DataIn/corpus_grc_tokenized.csv')" ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "ffb2013a-ac98-48c2-8cee-8c0de8f87ccf", + "metadata": {}, + "outputs": [], + "source": [] } ], "metadata": {