diff --git a/Spacy_Neo4j_Gutenberg_Book/Spacy NER with Neo4j Clustering on Gutenberg book.ipynb b/Spacy_Neo4j_Gutenberg_Book/Spacy NER with Neo4j Clustering on Gutenberg book.ipynb index c290eeb..940a20a 100644 --- a/Spacy_Neo4j_Gutenberg_Book/Spacy NER with Neo4j Clustering on Gutenberg book.ipynb +++ b/Spacy_Neo4j_Gutenberg_Book/Spacy NER with Neo4j Clustering on Gutenberg book.ipynb @@ -42,12 +42,12 @@ "source": [ "# import spacy and load an NLP model\n", "import spacy\n", - "nlp = spacy.load(\"en_core_web_lg\")\n" + "nlp = spacy.load(\"en_core_web_lg\", disable=[\"tagger\", \"parser\"])\n" ] }, { "cell_type": "code", - "execution_count": 3, + "execution_count": 4, "metadata": {}, "outputs": [], "source": [ @@ -71,13 +71,14 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": 5, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ + "Elphbergs Rudolf\n", "Rudolf Rose\n", "Robert Ancestry\n", "Ancestry Rose\n", @@ -86,18 +87,18 @@ "Rudolf Robert\n", "Robert Rudolf\n", "Ruritania Burlesdon\n", - "Burlesdon George II\n", + "Lady Burlesdon George II\n", "George II King\n", - "Rudolf the Third Ruritania \n", + "Rudolf the Third Ruritania\n", "Burlesdon Amelia\n", "James Burlesdon\n", "Burlesdon a Knight of the Garter\n", "a Knight of the Garter Rudolf\n", - "a Knight of the Garter Ruritania \n", - "Rudolf Ruritania \n", + "a Knight of the Garter Ruritania\n", + "Rudolf Ruritania\n", "Jacob Jacob\n", "Jacob Rudolf\n", - "Elphberg Elphberg\n", + "Elphbergs Elphberg\n", "Elphberg Rudolf\n", "Bob Rose\n" ] @@ -155,7 +156,7 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": 6, "metadata": {}, "outputs": [], "source": [ @@ -180,7 +181,7 @@ }, { "cell_type": "code", - "execution_count": 11, + "execution_count": 7, "metadata": {}, "outputs": [], "source": [ @@ -265,7 +266,7 @@ }, { "cell_type": "code", - "execution_count": 12, + "execution_count": 8, "metadata": { "scrolled": true }, @@ -277,17 +278,17 @@ " \n", " " ], "text/plain": [ - "" + "" ] }, - "execution_count": 12, + "execution_count": 8, "metadata": {}, "output_type": "execute_result" } @@ -316,7 +317,7 @@ }, { "cell_type": "code", - "execution_count": 13, + "execution_count": 9, "metadata": {}, "outputs": [ {