#!/usr/bin/env python # coding: utf-8 # In[1]: import spacy # In[2]: nlp = spacy.load("en_core_web_sm") text = "West Chestertenfieldville was referenced in Mr. Deeds." # In[3]: doc = nlp(text) # In[4]: for ent in doc.ents: print (ent.text, ent.label_) # In[5]: ruler = nlp.add_pipe("entity_ruler") # In[6]: patterns = [ {"label": "GPE", "pattern": "West Chestertenfieldville"} ] ruler.add_patterns(patterns) # In[7]: doc = nlp(text) for ent in doc.ents: print (ent.text, ent.label_) # In[8]: nlp.analyze_pipes() # In[9]: nlp = spacy.load("en_core_web_sm") # In[10]: ruler = nlp.add_pipe("entity_ruler", before="ner") patterns = [ {"label": "GPE", "pattern": "West Chestertenfieldville"} ] ruler.add_patterns(patterns) # In[11]: nlp.analyze_pipes() # In[12]: doc = nlp(text) # In[13]: for ent in doc.ents: print (ent.text, ent.label_) # In[14]: nlp3 = spacy.load("en_core_web_sm") # In[15]: ruler = nlp3.add_pipe("entity_ruler", before="ner") patterns = [ {"label": "GPE", "pattern": "West Chestertenfieldville"}, {"label": "FILM", "pattern": "Mr. Deeds"} ] ruler.add_patterns(patterns) # In[16]: doc = nlp3(text) # In[17]: for ent in doc.ents: print (ent.text, ent.label_) # In[18]: text = "This is a sample number (555) 555-5555." # In[19]: nlp = spacy.blank("en") ruler = nlp.add_pipe("entity_ruler") # In[23]: patterns = [ {"label": "PHONE_NUMBER", "pattern": [ {"ORTH": "("}, {"SHAPE": "ddd"}, {"ORTH": ")"}, {"SHAPE": "ddd"}, {"ORTH": "-", "OP": "?"}, {"SHAPE": "dddd"} ]} ] ruler.add_patterns(patterns) # In[24]: doc = nlp(text) for ent in doc.ents: print (ent.text, ent.label_) # In[ ]: