You are on page 1 of 3

DATASET :

SOURCE CODE :

import numpy as np
import pandas as pd
import re

import spacy
from spacy import displacy

# Load the training CSV and keep a random sample of 100 rows.
data = pd.read_csv('train.csv').sample(100)

# Load the spaCy pipeline used for named-entity recognition.
NER = spacy.load("en_core_web_sm")

def NameEntTagger(data: str) -> None:
    """Print *data* followed by every named entity spaCy finds in it.

    The text is run through the module-level ``NER`` pipeline. The raw
    text is printed first, then a separator line, then one line per
    entity in the form ``<entity text> <entity label>``.

    Args:
        data: The text to analyse. Note that inside this function the
            name refers to this string, not to the module-level
            DataFrame of the same name.
    """
    doc = NER(data)
    print(data)
    print("###########################################")
    for ent in doc.ents:
        print(ent.text, ent.label_)
# Tag every sampled question. Missing cells are read by pandas as NaN
# (a float), which the spaCy pipeline rejects, so they are skipped here.
for sent in data['question1'].dropna():
    # Optional clean-up step, currently disabled:
    # sent = re.sub(r'[\W_]+', ' ', sent)
    NameEntTagger(sent)
    print("###########################################")

def NameEntDisplayer(data: str) -> None:
    """Render the named entities of *data* with displaCy.

    The text is run through the module-level ``NER`` pipeline and the
    result is passed to ``displacy.render`` with ``style="ent"`` and
    ``jupyter=True``.

    Args:
        data: The text to analyse. Note that inside this function the
            name refers to this string, not to the module-level
            DataFrame of the same name.
    """
    doc = NER(data)
    displacy.render(doc, style="ent", jupyter=True)

# Render the entities of every sampled question. Missing cells are read by
# pandas as NaN (a float), which the spaCy pipeline rejects, so they are
# skipped here.
for sent in data['question1'].dropna():
    # Optional clean-up step, currently disabled:
    # sent = re.sub(r'[\W_]+', ' ', sent)
    NameEntDisplayer(sent)

OUTPUT :

You might also like