# Named_Entity_Recognition(LAbsheet-07).ipynb (20221CSE0413)- Colab
# Named_Entity_Recognition(LAbsheet-07).ipynb (20221CSE0413)- Colab
import spacy
#from spacy import displacy
from collections import Counter
# Load the spaCy pipeline named "en_core_web_sm"; `nlp` is the callable used
# below to turn raw text into a processed document.
nlp = spacy.load("en_core_web_sm")
# NOTE(review): the string literal on the next line is cut off in this export
# (there is no closing quote) — restore the full sentence from the original
# notebook before running.
sample = "European authorities fined Google a record $5.1 billion on Wednesday for abusing its power in the mobile phone market and order
# Run the pipeline over the sample sentence.
doc = nlp(sample)
def getTextFromFile(fileName: str) -> str:
    """Return the entire contents of the text file at ``fileName``.

    Args:
        fileName: Path of the file to read. It is opened in text mode
            (``'r'``) with the platform's default encoding.

    Returns:
        The file's full contents as a single string (empty string for an
        empty file).

    Raises:
        OSError: If the file cannot be opened, e.g. it does not exist.
    """
    # Plain ``with open(...) as fp`` rather than the parenthesised form:
    # it parses on every Python 3 version and closes the file on exit.
    with open(fileName, 'r') as fp:
        return fp.read()
# Read the input document from disk and run it through the pipeline.
# Note: this rebinds `doc`, replacing the document built from `sample`.
fileName = "File17.txt"
text = getTextFromFile(fileName)
#print(len(text.split(" ")))
doc = nlp(text)

# One line per recognised entity: "<text> - <label> - <label explanation>".
for entity in doc.ents:
    print(entity.text + " - " + entity.label_ + " - " + str(spacy.explain(entity.label_)))

# Total number of entity mentions (duplicates included); printed once,
# after the loop.
print(len(doc.ents))
# Output: 44
def findOutUniqueNamedEntities(doc):
    """Return the set of distinct named entities found in ``doc``.

    Each item of ``doc.ents`` is reduced to the string
    ``"<TEXT IN UPPER CASE> - <label>"``. Mentions that differ only in
    letter case therefore collapse into one entry, while the same text
    carrying different labels yields separate entries.

    Args:
        doc: Object exposing ``ents``, an iterable of items that each have
            string attributes ``text`` and ``label_``.

    Returns:
        A ``set`` of ``"TEXT - label"`` strings; empty when ``doc.ents``
        is empty.
    """
    return {
        entity.text.upper() + " - " + entity.label_
        for entity in doc.ents
    }
# Print how many distinct "TEXT - label" entries the entity set built from
# `doc` contains.
print(len(findOutUniqueNamedEntities(doc)))
# Output: 38