spacy de_core_news_sm change splitter code example
Example 1: spaCy tokenize stream
# Stream several texts through the tokenizer in batches of 50 instead of
# tokenizing them one call at a time.
# NOTE(review): `tokenizer` is not defined in this snippet - presumably a spaCy
# Tokenizer (e.g. `nlp.tokenizer`); confirm against the surrounding code.
texts = ["One document.", "...", "Lots of documents"]
for doc in tokenizer.pipe(texts, batch_size=50):
    pass  # placeholder: handle each yielded doc here
Example 2: spacy entity linking example
import spacy
# Load the pipeline and run it over a sample sentence.
# NOTE(review): "my_custom_el_model" presumably contains an entity-linking
# component that fills in the knowledge-base IDs read below - confirm.
nlp = spacy.load("my_custom_el_model")
doc = nlp("Ada Lovelace was born in London")

# Entity-level view: (text, label, knowledge-base ID) for every entity span.
ents = [
    (span.text, span.label_, span.kb_id_)
    for span in doc.ents
]
print(ents)

# Token-level view: [text, entity type, knowledge-base ID] for the tokens at
# positions 0, 1 and 5 of the doc.
ent_ada_0, ent_ada_1, ent_london_5 = (
    [tok.text, tok.ent_type_, tok.ent_kb_id_]
    for tok in (doc[0], doc[1], doc[5])
)
print(ent_ada_0, ent_ada_1, ent_london_5, sep="\n")