Spaces:

Az-r-ow
/

TravelNER

Sleeping

App Files Files Community

Az-r-ow committed on Jan 11

Commit

dcd93f5

1 Parent(s): 74d5c55

feat(ihm): semi-functional interface, minor things to add

Browse files

Files changed (18) hide show

.gitignore +0 -10
app/app.py +229 -150
app/travel_resolver/libs/nlp/ner/models.py +13 -24
app/travel_resolver/libs/nlp/ner/models_definitions/__init__.py +0 -0
app/travel_resolver/libs/nlp/ner/models_definitions/bilstm/__init__.py +0 -0
app/travel_resolver/libs/nlp/ner/models_definitions/bilstm/architecture.py +21 -0
app/travel_resolver/libs/nlp/ner/models_definitions/bilstm/bilstm.weights.h5 +3 -0
app/travel_resolver/libs/nlp/ner/{models → models_definitions}/bilstm/model.keras +0 -0
app/travel_resolver/libs/nlp/ner/{models → models_definitions}/bilstm/tf_version.txt +0 -0
app/travel_resolver/libs/nlp/ner/models_definitions/lstm_with_pos/__init__.py +0 -0
app/travel_resolver/libs/nlp/ner/models_definitions/lstm_with_pos/architecture.py +37 -0
app/travel_resolver/libs/nlp/ner/models_definitions/lstm_with_pos/lstm_with_pos.weights.h5 +3 -0
app/travel_resolver/libs/nlp/ner/{models → models_definitions}/lstm_with_pos/model.keras +0 -0
app/travel_resolver/libs/nlp/ner/{models → models_definitions}/lstm_with_pos/tf_version.txt +0 -0
app/travel_resolver/tests/data_processing_test.py +1 -1
test.py +10 -0
test.txt +1 -0
test2.txt +2 -0

.gitignore CHANGED Viewed

@@ -167,15 +167,5 @@ cython_debug/
 # Remove test ouptuts
 output.*
-# Remove vscode settings
-.vscode
-# Remove macos ds store
 # Macos generated files
-.DS_Store
-# Remove vscode settings
-.vscode
-# Remove macos ds store
 .DS_Store

 # Remove test ouptuts
 output.*
 # Macos generated files
 .DS_Store

app/app.py CHANGED Viewed

@@ -3,17 +3,107 @@ from transformers import pipeline
 import numpy as np
 import pandas as pd
 from travel_resolver.libs.nlp.ner.models import BiLSTM_NER, LSTM_NER, CamemBERT_NER
-import torch
 from travel_resolver.libs.nlp.ner.data_processing import process_sentence
 from travel_resolver.libs.pathfinder.CSVTravelGraph import CSVTravelGraph
 from travel_resolver.libs.pathfinder.graph import Graph
-import os
 transcriber = pipeline(
     "automatic-speech-recognition", model="openai/whisper-base", device="cpu"
 )
-models = {"LSTM": None, "BiLSTM": None, "CamemBERT": CamemBERT_NER()}
 def transcribe(audio):
@@ -81,162 +171,151 @@ def getStationsByCityName(city: str):
     return stations
-def getDepartureAndArrivalFromText(text: str, model: str):
-    entities = models[model].get_entities(text)
-    tokenized_sentence = process_sentence(text, return_tokens=True)
-    dep_idx = entities.index(1)
-    arr_idx = entities.index(2)
-    return tokenized_sentence[dep_idx].upper(), tokenized_sentence[arr_idx].upper()
-def handle_audio(audio):
-    promptAudio = transcribe(audio)
-    # todo : replace with the model selected by the user
-    dep, arr = getDepartureAndArrivalFromText(promptAudio, "CamemBERT")
-    return (
-        gr.update(visible=True),
-        gr.update(visible=False),
-        gr.update(value=promptAudio),
-        gr.update(value=dep),
-        gr.update(value=arr),
-    )
-def handle_file(file):
-    loading_screen.update(visible=True)
     dep = None
     arr = None
-    if file is not None:
-        with open(file.name, "r") as f:
-            file_content = f.read()
-            row = file_content.split("\n")
-            if len(row) > 1:
-                return
-            else:
-                dep, arr = getDepartureAndArrivalFromText(file_content, "CamemBERT")
-    else:
-        file_content = "Aucun fichier uploadé."
-    loading_screen.update(visible=False)
-    return (
-        gr.update(visible=True),
-        gr.update(visible=False),
-        gr.update(value=file_content),
-        gr.update(value=dep),
-        gr.update(value=arr),
-    )
-def handle_back():
-    audio.clear()
-    file.clear()
-    return (gr.update(visible=False), gr.update(visible=True))
-def handleCityChange(city):
-    stations = getStationsByCityName(city)
-    return gr.update(choices=stations, value=stations[0], interactive=True)
-def handleStationChange(departureStation, destinationStation):
-    if departureStation and destinationStation:
-        dijkstraPath, dijkstraCost = getDijkstraResult(
-            departureStation, destinationStation
-        )
-        dijkstraPathFormatted = "\n".join(
-            [f"{i + 1}. {elem}" for i, elem in enumerate(dijkstraPath)]
-        )
-        AStarPath, AStarCost = getAStarResult(departureStation, destinationStation)
-        AStarPathFormatted = "\n".join(
-            [f"{i + 1}. {elem}" for i, elem in enumerate(AStarPath)]
-        )
-        return (
-            gr.update(value=dijkstraCost),
-            gr.update(value=dijkstraPathFormatted, lines=len(dijkstraPath)),
-            gr.update(value=AStarCost),
-            gr.update(value=AStarPathFormatted, lines=len(AStarPath)),
-        )
-    return (
-        gr.HTML("<p>Aucun prompt renseigné</p>"),
-        gr.update(value=""),
-        gr.HTML("<p>Aucun prompt renseigné</p>"),
-        gr.update(value=""),
-    )
-with gr.Blocks(css="#back-button {width: fit-content}") as demo:
-    with gr.Row(visible=False) as loading_screen:
-        gr.Text("Chargement ...", elem_id="loading")
-    with gr.Column() as promptChooser:
-        with gr.Row():
-            audio = gr.Audio(label="Fichier audio")
-            file = gr.File(
-                label="Fichier texte", file_types=["text"], file_count="single"
-            )
-    with gr.Column(visible=False) as content:
-        backButton = gr.Button("← Back", elem_id="back-button")
-        with gr.Row():
-            with gr.Column(scale=1, min_width=300) as parameters:
-                prompt = gr.Textbox(label="Prompt")
-                departureCity = gr.Textbox(label="Ville de départ")
-                destinationCity = gr.Textbox(label="Ville de de destination")
-            with gr.Column(scale=2, min_width=300) as result:
                 with gr.Row():
-                    departureStation = gr.Dropdown(label="Gare de départ")
-                    destinationStation = gr.Dropdown(label="Gare d'arrivée")
-                with gr.Tab("Dijkstra"):
-                    timeDijkstra = gr.HTML("<p>Aucun prompt renseigné</p>")
-                    dijkstraPath = gr.Textbox(label="Chemin emprunté")
-                with gr.Tab("AStar"):
-                    timeAStar = gr.HTML("<p>Aucun prompt renseigné</p>")
-                    AstarPath = gr.Textbox(label="Chemin emprunté")
-    audio.change(
-        handle_audio,
-        inputs=[audio],
-        outputs=[
-            content,
-            promptChooser,
-            prompt,
-            departureCity,
-            destinationCity,
-        ],  # On rend la section "content" visible
-        show_progress="full",
-    )
-    file.upload(
-        handle_file,
-        inputs=[file],
-        outputs=[
-            content,
-            promptChooser,
-            prompt,
-            departureCity,
-            destinationCity,
-        ],  # On rend la section "content" visible
-        show_progress="full",
-    )
-    backButton.click(handle_back, inputs=[], outputs=[content, promptChooser])
-    departureCity.change(
-        handleCityChange, inputs=[departureCity], outputs=[departureStation]
-    )
-    destinationCity.change(
-        handleCityChange, inputs=[destinationCity], outputs=[destinationStation]
-    )
-    departureStation.change(
-        handleStationChange,
-        inputs=[departureStation, destinationStation],
-        outputs=[timeDijkstra, dijkstraPath, timeAStar, AstarPath],
-    )
-    destinationStation.change(
-        handleStationChange,
-        inputs=[departureStation, destinationStation],
-        outputs=[timeDijkstra, dijkstraPath, timeAStar, AstarPath],
-    )
 if __name__ == "__main__":
     demo.launch()

 import numpy as np
 import pandas as pd
 from travel_resolver.libs.nlp.ner.models import BiLSTM_NER, LSTM_NER, CamemBERT_NER
+# import torch
 from travel_resolver.libs.nlp.ner.data_processing import process_sentence
 from travel_resolver.libs.pathfinder.CSVTravelGraph import CSVTravelGraph
 from travel_resolver.libs.pathfinder.graph import Graph
+import time
 transcriber = pipeline(
     "automatic-speech-recognition", model="openai/whisper-base", device="cpu"
 )
+models = {"LSTM": LSTM_NER(), "BiLSTM": BiLSTM_NER(), "CamemBERT": CamemBERT_NER()}
+entities_label_mapping = {1: "LOC-DEP", 2: "LOC-ARR"}
def _read_sentences(path):
    """Return the non-blank lines of the UTF-8 text file at ``path``."""
    # Explicit encoding: the prompts are French text with accented characters.
    with open(path, "r", encoding="utf-8") as f:
        return [row for row in f.read().split("\n") if row.strip()]


# Top-level UI: an input chooser (audio or text file) plus a NER model selector.
# The three render handlers below rebuild the result tabs whenever the model,
# the audio or the uploaded file changes.
with gr.Blocks(css="#back-button {width: fit-content}") as demo:
    with gr.Column() as promptChooser:
        with gr.Row():
            audio = gr.Audio(label="Fichier audio")
            file = gr.File(
                label="Fichier texte", file_types=["text"], file_count="single"
            )
        model = gr.Dropdown(
            label="Modèle NER", choices=list(models), value="CamemBERT"
        )

    @gr.render(inputs=[audio, file, model], triggers=[model.change])
    def handle_model_change(audio, file, model, progress=gr.Progress()):
        """Re-run the analysis on the current input with the newly chosen model."""
        if audio:
            render_tabs([transcribe(audio)], model, progress)
        elif file:
            # Same blank-line filtering as handle_file, so a trailing newline
            # does not produce an empty "sentence" tab.
            render_tabs(_read_sentences(file.name), model, progress)

    @gr.render(inputs=[audio, model], triggers=[audio.change])
    def handle_audio(audio, model, progress=gr.Progress()):
        """Transcribe the audio prompt and render one result tab for it."""
        # NOTE(review): the change event presumably also fires when the audio
        # is cleared; there is nothing to transcribe in that case.
        if audio is None:
            return
        progress(0, "Analyzing audio...")
        promptAudio = transcribe(audio)
        time.sleep(1)
        render_tabs([promptAudio], model, progress)

    @gr.render(
        inputs=[file, model],
        triggers=[file.upload],
    )
    def handle_file(file, model, progress=gr.Progress()):
        """Render one result tab per non-blank line of the uploaded file."""
        progress(0, desc="Analyzing file...")
        time.sleep(1)
        if file is None:
            return
        progress(0.33, desc="Reading file...")
        render_tabs(_read_sentences(file.name), model, progress)
+def handle_back():
+    audio.clear()
+    file.clear()
+    return (gr.update(visible=False), gr.update(visible=True))
def handleCityChange(city):
    """Refresh a station dropdown after its city textbox changed.

    Looks up the stations for ``city`` and returns a Gradio update that sets
    them as the dropdown choices, pre-selecting the first one. When no station
    matches (for example while the user is still typing the city name), the
    dropdown is emptied instead of raising ``IndexError``.
    """
    stations = getStationsByCityName(city)
    if not stations:
        return gr.update(choices=[], value=None, interactive=True)
    return gr.update(choices=stations, value=stations[0], interactive=True)
def formatPath(path):
    """Render ``path`` as a numbered list, one step per line, starting at 1."""
    numbered_steps = []
    for position, step in enumerate(path, start=1):
        numbered_steps.append(f"{position}. {step}")
    return "\n".join(numbered_steps)
def handleStationChange(departureStation, destinationStation):
    """Recompute both itineraries after a station dropdown changed.

    Returns four values, in order: Dijkstra cost, Dijkstra path, A* cost and
    A* path. When either station is missing, placeholder values are returned
    instead.
    """
    # Guard clause: without both stations there is nothing to compute.
    if not (departureStation and destinationStation):
        return (
            gr.HTML("<p>Aucun prompt renseigné</p>"),
            gr.update(value=""),
            gr.HTML("<p>Aucun prompt renseigné</p>"),
            gr.update(value=""),
        )

    dijkstra_steps, dijkstra_cost = getDijkstraResult(
        departureStation, destinationStation
    )
    astar_steps, astar_cost = getAStarResult(departureStation, destinationStation)

    # Each path textbox is sized to the number of steps it displays.
    return (
        gr.update(value=dijkstra_cost),
        gr.update(value=formatPath(dijkstra_steps), lines=len(dijkstra_steps)),
        gr.update(value=astar_cost),
        gr.update(value=formatPath(astar_steps), lines=len(astar_steps)),
    )
 def transcribe(audio):
     return stations
def getEntitiesPositions(text, entity):
    """Return the ``(start, end)`` character span of ``entity`` inside ``text``.

    The first exact occurrence is used. If there is none, a case-insensitive
    search is tried, since the token may have been normalised before being
    passed in. When ``entity`` cannot be found at all, the empty span
    ``(0, 0)`` is returned so that ``text[start:end]`` is ``""``; the previous
    behaviour leaked ``str.find``'s ``-1`` into a span that slices the text
    wrongly.
    """
    start_idx = text.find(entity)
    if start_idx == -1:
        lowered_text = text.lower()
        # Only trust offsets from the lowered text when lowering kept every
        # character at the same position (not guaranteed for all of Unicode).
        if len(lowered_text) == len(text):
            start_idx = lowered_text.find(entity.lower())
    if start_idx == -1:
        return 0, 0
    return start_idx, start_idx + len(entity)
def getDepartureAndArrivalFromText(text: str, model: str):
    """Extract the departure and arrival entities that ``model`` finds in ``text``.

    Args:
        text: the sentence to analyse.
        model: key into the module-level ``models`` registry.

    Returns:
        A ``(dep, arr)`` tuple. Each item is ``None`` when the corresponding
        label was not predicted, otherwise a dict with the keys ``entity``
        (label name from ``entities_label_mapping``), ``word`` (the token),
        ``start`` and ``end`` (character offsets of the token in ``text``).

    Only the first token carrying each label is used.
    """
    entities = models[model].get_entities(text)
    if not isinstance(entities, list):
        entities = entities.tolist()
    tokenized_sentence = process_sentence(text, return_tokens=True)

    def build_entity(label_id):
        # Build the entity dict for the first token tagged with `label_id`.
        if label_id not in entities:
            return None
        token_idx = entities.index(label_id)
        # NOTE(review): the label sequence may be longer than the token list
        # (e.g. padded predictions) - confirm; skip instead of IndexError.
        if token_idx >= len(tokenized_sentence):
            return None
        word = tokenized_sentence[token_idx]
        start, end = getEntitiesPositions(text, word)
        if start < 0:
            # Token not found verbatim in the text: use an empty span rather
            # than a negative offset that would slice the sentence wrongly.
            start, end = 0, 0
        return {
            "entity": entities_label_mapping[label_id],
            "word": word,
            "start": start,
            "end": end,
        }

    # Label 1 is the departure, label 2 the arrival (see entities_label_mapping).
    return build_entity(1), build_entity(2)
def render_tabs(sentences: list[str], model: str, progress_bar: gr.Progress):
    """Build one result tab per sentence.

    For every sentence this runs the selected NER model, looks up the stations
    of the detected departure and arrival cities, computes the Dijkstra and A*
    itineraries between the first station of each city, and creates the Gradio
    components that show the result. It also wires the city and station
    components so that edits refresh the stations and the itineraries.

    Args:
        sentences: sentences to analyse, one tab each.
        model: key of the NER model to use.
        progress_bar: Gradio progress tracker used to iterate over the sentences.
    """
    with gr.Tabs():
        # enumerate keeps the original 0-based tab numbering.
        for idx, sentence in enumerate(
            progress_bar.tqdm(sentences, desc="Processing sentences...")
        ):
            with gr.Tab(f"Sentence {idx}"):
                dep, arr = getDepartureAndArrivalFromText(sentence, model)
                # Only the entities that were actually detected get highlighted.
                entities = [entity for entity in (dep, arr) if entity]

                # Format the classified entities
                departureCityValue = dep["word"].upper() if dep else ""
                arrivalCityValue = arr["word"].upper() if arr else ""

                # Get the available stations
                departureStations = getStationsByCityName(departureCityValue)
                departureStationValue = (
                    departureStations[0] if departureStations else ""
                )
                arrivalStations = getStationsByCityName(arrivalCityValue)
                arrivalStationValue = arrivalStations[0] if arrivalStations else ""

                # Placeholders shown when no itinerary can be computed.
                dijkstraPathValues = []
                AStarPathValues = []
                timeDijkstraValue = "<p>Aucun prompt renseigné</p>"
                timeAStarValue = "<p>Aucun prompt renseigné</p>"

                # Get the paths and time for the two algorithms
                if departureStationValue and arrivalStationValue:
                    dijkstraPathValues, timeDijkstraValue = getDijkstraResult(
                        departureStationValue, arrivalStationValue
                    )
                    AStarPathValues, timeAStarValue = getAStarResult(
                        departureStationValue, arrivalStationValue
                    )

                dijkstraPathFormatted = formatPath(dijkstraPathValues)
                AStarPathFormatted = formatPath(AStarPathValues)

                with gr.Row():
                    # Left column: the analysed sentence and the detected cities.
                    with gr.Column(scale=1, min_width=300):
                        gr.HighlightedText(
                            value={"text": sentence, "entities": entities}
                        )
                        departureCity = gr.Textbox(
                            label="Ville de départ",
                            value=departureCityValue,
                        )
                        arrivalCity = gr.Textbox(
                            label="Ville d'arrivée",
                            value=arrivalCityValue,
                        )
                    # Right column: station pickers and one tab per algorithm.
                    with gr.Column(scale=2, min_width=300):
                        with gr.Row():
                            departureStation = gr.Dropdown(
                                label="Gare de départ",
                                choices=departureStations,
                                value=departureStationValue,
                            )
                            arrivalStation = gr.Dropdown(
                                label="Gare d'arrivée",
                                choices=arrivalStations,
                                value=arrivalStationValue,
                            )
                        with gr.Tab("Dijkstra"):
                            timeDijkstra = gr.HTML(value=timeDijkstraValue)
                            dijkstraPath = gr.Textbox(
                                label="Chemin emprunté",
                                value=dijkstraPathFormatted,
                                lines=len(dijkstraPathValues),
                            )
                        with gr.Tab("AStar"):
                            timeAStar = gr.HTML(value=timeAStarValue)
                            AstarPath = gr.Textbox(
                                label="Chemin emprunté",
                                value=AStarPathFormatted,
                                lines=len(AStarPathValues),
                            )

                        # Editing a city refreshes the matching station list.
                        departureCity.change(
                            handleCityChange,
                            inputs=[departureCity],
                            outputs=[departureStation],
                        )
                        arrivalCity.change(
                            handleCityChange,
                            inputs=[arrivalCity],
                            outputs=[arrivalStation],
                        )
                        # Picking another station recomputes both itineraries.
                        departureStation.change(
                            handleStationChange,
                            inputs=[departureStation, arrivalStation],
                            outputs=[timeDijkstra, dijkstraPath, timeAStar, AstarPath],
                        )
                        arrivalStation.change(
                            handleStationChange,
                            inputs=[departureStation, arrivalStation],
                            outputs=[timeDijkstra, dijkstraPath, timeAStar, AstarPath],
                        )
 if __name__ == "__main__":
     demo.launch()

app/travel_resolver/libs/nlp/ner/models.py CHANGED Viewed

@@ -11,6 +11,8 @@ from .data_processing import (
 )
 from .metrics import masked_loss, masked_accuracy, entity_accuracy
 import stanza
 nlp = stanza.Pipeline("fr", processors="tokenize,pos")
@@ -37,18 +39,14 @@ class NERModel(ABC):
 class LSTM_NER(NERModel):
     def __init__(self):
-        self.model_path = os.path.join(
-            self.file_path, "models", "lstm_with_pos", "model.keras"
-        )
-        self.model = tf.keras.models.load_model(
-            self.model_path,
-            custom_objects={
-                "masked_loss": masked_loss,
-                "masked_accuracy": masked_accuracy,
-                "entity_accuracy": entity_accuracy,
-                "log_softmax_v2": tf.nn.log_softmax,
-            },
         )
     def encode_sentence(self, sentence: str):
         processed_sentence = process_sentence(
@@ -75,18 +73,11 @@ class LSTM_NER(NERModel):
 class BiLSTM_NER(NERModel):
     def __init__(self):
-        self.model_path = os.path.join(
-            self.file_path, "models", "bilstm", "model.keras"
-        )
-        self.model = tf.keras.models.load_model(
-            self.model_path,
-            custom_objects={
-                "masked_loss": masked_loss,
-                "masked_accuracy": masked_accuracy,
-                "entity_accuracy": entity_accuracy,
-                "log_softmax_v2": tf.nn.log_softmax,
-            },
         )
     def encode_sentence(self, sentence: str):
         processed_sentence = process_sentence(
@@ -167,8 +158,6 @@ class CamemBERT_NER(NERModel):
                     if current_word is not None:
                         sentence_labels.append(word_label)
-                    print(i)
-                    print(token_idx)
                     # Reset for the new word
                     current_word = word_idx
                     word_label = predictions[i][token_idx]

 )
 from .metrics import masked_loss, masked_accuracy, entity_accuracy
 import stanza
+from .models_definitions.bilstm.architecture import BiLSTM
+from .models_definitions.lstm_with_pos.architecture import LSTM
 nlp = stanza.Pipeline("fr", processors="tokenize,pos")
 class LSTM_NER(NERModel):
     def __init__(self):
+        self.model_weights_path = os.path.join(
+            self.file_path,
+            "models_definitions",
+            "lstm_with_pos",
+            "lstm_with_pos.weights.h5",
         )
+        self.model = LSTM(self.vocab, 3, self.pos_tags)
+        self.model.load_from_weights(self.model_weights_path)
     def encode_sentence(self, sentence: str):
         processed_sentence = process_sentence(
 class BiLSTM_NER(NERModel):
     def __init__(self):
+        self.model_weights_path = os.path.join(
+            self.file_path, "models_definitions", "bilstm", "bilstm.weights.h5"
         )
+        self.model = BiLSTM(self.vocab, 3)
+        self.model.load_from_weights(self.model_weights_path)
     def encode_sentence(self, sentence: str):
         processed_sentence = process_sentence(
                     if current_word is not None:
                         sentence_labels.append(word_label)
                     # Reset for the new word
                     current_word = word_idx
                     word_label = predictions[i][token_idx]

app/travel_resolver/libs/nlp/ner/models_definitions/__init__.py ADDED Viewed

File without changes

app/travel_resolver/libs/nlp/ner/models_definitions/bilstm/__init__.py ADDED Viewed

File without changes

app/travel_resolver/libs/nlp/ner/models_definitions/bilstm/architecture.py ADDED Viewed

	@@ -0,0 +1,21 @@

+import tensorflow as tf
class BiLSTM:
    """Bidirectional LSTM tagger: the Keras architecture plus weight loading.

    The layer stack is embedding -> bidirectional LSTM -> dropout -> dense
    layer with a log-softmax activation producing ``nb_labels`` scores per
    position.
    """

    def __init__(self, vocab, nb_labels, emb_dim=100):
        # Layers are created in the same order as they are stacked.
        embedding = tf.keras.layers.Embedding(len(vocab) + 1, emb_dim, mask_zero=True)
        recurrent = tf.keras.layers.Bidirectional(
            tf.keras.layers.LSTM(emb_dim, return_sequences=True)
        )
        dropout = tf.keras.layers.Dropout(0.3)
        classifier = tf.keras.layers.Dense(nb_labels, activation=tf.nn.log_softmax)
        self.model = tf.keras.models.Sequential(
            layers=[embedding, recurrent, dropout, classifier]
        )

    def load_from_weights(self, weights_path):
        """Load the weights stored at ``weights_path`` into the network."""
        self.model.load_weights(weights_path)

    def predict(self, x, verbose=0):
        """Return the wrapped Keras model's predictions for ``x``."""
        return self.model.predict(x, verbose=verbose)

app/travel_resolver/libs/nlp/ner/models_definitions/bilstm/bilstm.weights.h5 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5c4457e1c5249bef9062556a0f371f75bbe41f1c903ca485de55899d3a99c453
+size 7964368

app/travel_resolver/libs/nlp/ner/{models → models_definitions}/bilstm/model.keras RENAMED Viewed

File without changes

app/travel_resolver/libs/nlp/ner/{models → models_definitions}/bilstm/tf_version.txt RENAMED Viewed

File without changes

app/travel_resolver/libs/nlp/ner/models_definitions/lstm_with_pos/__init__.py ADDED Viewed

File without changes

app/travel_resolver/libs/nlp/ner/models_definitions/lstm_with_pos/architecture.py ADDED Viewed

	@@ -0,0 +1,37 @@

+import tensorflow as tf
class LSTM:
    """LSTM tagger fed with word ids and part-of-speech ids.

    Both inputs are embedded, concatenated, masked, passed through an LSTM and
    a dropout layer, then a dense layer with a log-softmax activation produces
    ``nb_labels`` scores per position.

    Note that ``emb_dim`` is used as the length of both input sequences, while
    ``emb_size`` is the embedding width and the number of LSTM units.
    """

    def __init__(self, vocab, nb_labels: int, pos_tags: list, emb_dim=100, emb_size=32):
        # Two parallel inputs of the same length: word ids and POS-tag ids.
        words_in = tf.keras.layers.Input(shape=(emb_dim,), name="word_input")
        pos_in = tf.keras.layers.Input(shape=(emb_dim,), name="pos_input")

        embedded_words = tf.keras.layers.Embedding(
            len(vocab), emb_size, name="word_embedding"
        )(words_in)
        embedded_pos = tf.keras.layers.Embedding(
            len(pos_tags), emb_size, name="pos_embedding"
        )(pos_in)

        merged = tf.keras.layers.Concatenate()([embedded_words, embedded_pos])
        masked = tf.keras.layers.Masking(mask_value=0)(merged)

        recurrent_out = tf.keras.layers.LSTM(
            emb_size, return_sequences=True, name="lstm_layer"
        )(masked)
        regularised = tf.keras.layers.Dropout(0.2)(recurrent_out)
        scores = tf.keras.layers.Dense(nb_labels, activation=tf.nn.log_softmax)(
            regularised
        )

        self.model = tf.keras.Model(inputs=[words_in, pos_in], outputs=scores)

    def load_from_weights(self, weights_path):
        """Load the weights stored at ``weights_path`` into the network."""
        self.model.load_weights(weights_path)

    def predict(self, x, verbose=0):
        """Return the wrapped Keras model's predictions for ``x``."""
        return self.model.predict(x, verbose=verbose)

app/travel_resolver/libs/nlp/ner/models_definitions/lstm_with_pos/lstm_with_pos.weights.h5 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bb5a1a558c9156caa7dc56a64576be9331b13991bc8c87886ae69546fdeb80ca
+size 2111328

app/travel_resolver/libs/nlp/ner/{models → models_definitions}/lstm_with_pos/model.keras RENAMED Viewed

File without changes

app/travel_resolver/libs/nlp/ner/{models → models_definitions}/lstm_with_pos/tf_version.txt RENAMED Viewed

File without changes

app/travel_resolver/tests/data_processing_test.py CHANGED Viewed

@@ -1,6 +1,6 @@
 import unittest
 from pathlib import Path
-from travel_resolver.libs.nlp.data_processing import (
     get_tagged_content,
     convert_tagged_sentence_to_bio,
     from_tagged_file_to_bio_file,

 import unittest
 from pathlib import Path
+from app.travel_resolver.libs.nlp.ner.data_processing import (
     get_tagged_content,
     convert_tagged_sentence_to_bio,
     from_tagged_file_to_bio_file,

test.py ADDED Viewed

	@@ -0,0 +1,10 @@

+from app.travel_resolver.libs.nlp.ner.models import LSTM_NER, BiLSTM_NER, CamemBERT_NER
+import tensorflow as tf
+print(tf.__version__)
+ner_model = LSTM_NER()
+sentence = "Je voudrais voyager de Nice à Clermont Ferrand."
+print(ner_model.get_entities(sentence))

test.txt ADDED Viewed

	@@ -0,0 +1 @@


1	+ Je veux partir de Montpellier à Clermont-Ferrand.

test2.txt ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ Je suis à Paris. Je veux prendre le train à Montpellier.
2	+ Je veux prendre le train de Lyon à Marseille.