Professional Documents
Culture Documents
SOURCE CODE :
import numpy as np
import pandas as pd
import re
import spacy
from spacy import displacy
# Load train.csv; a 'question1' column is read from this frame further down.
data = pd.read_csv('train.csv')
# Work on a random subset of at most 100 rows. DataFrame.sample raises
# ValueError when asked for more rows than exist (without replacement), so
# cap the request at the number of rows actually loaded.
data = data.sample(min(100, len(data)))
# spaCy pipeline shared by the functions below to find named entities.
NER = spacy.load("en_core_web_sm")
def NameEntTagger(data):
    """Print ``data`` followed by the named entities found in it.

    The text is first run through the module-level ``NER`` pipeline; then the
    input is echoed, a separator line is printed, and every entity is listed
    on its own line as ``<entity text> <entity label>``.
    """
    doc = NER(data)
    separator = "###########################################"
    print(data, separator, sep="\n")
    for entity in doc.ents:
        print(f"{entity.text} {entity.label_}")
# Tag every entry of the 'question1' column, one at a time.
# pandas reads missing cells as float NaN, which the spaCy pipeline rejects,
# so drop them (and coerce any remaining value to str) before tagging.
for sent in data['question1'].dropna().astype(str):
    # Optional normalisation, currently disabled:
    # sent = re.sub(r'[\W_]+', ' ', sent)
    NameEntTagger(sent)
    print("###########################################")
def NameEntDisplayer(data):
    """Render the named entities of ``data`` with displaCy.

    Runs the module-level ``NER`` pipeline over ``data`` and passes the
    resulting document to ``displacy.render`` with the ``"ent"`` style and
    ``jupyter=True``.
    """
    displacy.render(NER(data), style="ent", jupyter=True)
OUTPUT :