From b6a26a444925c49d1e140bd9654fec3b23732de2 Mon Sep 17 00:00:00 2001 From: Lili Gasser <gasserli@ethz.ch> Date: Wed, 16 Jan 2019 10:42:09 +0000 Subject: [PATCH] add french files contd --- notebooks/NER_read-training-data.ipynb | 25 +++++++++++++++---------- 1 file changed, 15 insertions(+), 10 deletions(-) diff --git a/notebooks/NER_read-training-data.ipynb b/notebooks/NER_read-training-data.ipynb index 52824eda..d8dd9c8b 100644 --- a/notebooks/NER_read-training-data.ipynb +++ b/notebooks/NER_read-training-data.ipynb @@ -9,7 +9,7 @@ }, { "cell_type": "code", - "execution_count": 2, + "execution_count": 1, "metadata": {}, "outputs": [], "source": [ @@ -52,7 +52,7 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": 2, "metadata": {}, "outputs": [], "source": [ @@ -80,7 +80,7 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": 3, "metadata": {}, "outputs": [ { @@ -1089,7 +1089,7 @@ " ...]" ] }, - "execution_count": 5, + "execution_count": 3, "metadata": {}, "output_type": "execute_result" } @@ -1109,7 +1109,7 @@ }, { "cell_type": "code", - "execution_count": 21, + "execution_count": 4, "metadata": { "scrolled": true }, @@ -19179,7 +19179,7 @@ }, { "cell_type": "code", - "execution_count": 23, + "execution_count": 6, "metadata": {}, "outputs": [ { @@ -23820,10 +23820,15 @@ " - values: text as string, entities as list, title as string (also contains year and document number)\n", " \n", "each entity is a dictionary with start and end character (as integer) and the label (as string). The four possible entries for labels (so far) are:\n", - "- ORGANIZATION\n", - "- PERSON\n", - "- LOCATION\n", - "- MISC" + "- german:\n", + " - ORGANIZATION\n", + " - PERSON\n", + " - LOCATION\n", + " - MISC\n", + "- french:\n", + " - I-ORG\n", + " - I-PERS\n", + " - I-LIEU" ] }, { -- GitLab