In [None]:
from pathlib import Path

import spacy

# Build the model location with pathlib instead of a backslash literal:
# 'models\model-best' only worked because '\m' is an invalid escape sequence
# that Python leaves untouched (and warns about), and a backslash separator
# does not resolve on non-Windows systems.
MODEL_DIR = Path("models") / "model-best"

# Load the pipeline stored in that directory; every later cell uses `nlp`.
nlp = spacy.load(MODEL_DIR)

In [None]:
# Show the pipeline twice: first only the component names, then the full
# list of (name, component) tuples
for pipeline_view in (nlp.pipe_names, nlp.pipeline):
    print(pipeline_view)

In [None]:
# Run one sentence through the pipeline and print, per token, its text,
# lemma and part-of-speech tag separated by tab gaps
doc = nlp("Bu bir sade cümle ise diğer İstanbul içeren bir cümledir.")
gap = '\t\t'
for tok in doc:
    print(tok.text, gap, tok.lemma_, gap, tok.pos_)

In [None]:
# Tokenization, tagging, lemmatization and dependency parsing as a table
import pandas as pd

# Token attributes to show, one column each, in display order.
attribs = ['orth_', 'lemma_', 'tag_', 'pos_', 'dep_', 'head']

# One row per token. getattr() is the idiomatic way to look an attribute up
# by name; calling the __getattribute__ dunder directly is not needed.
table = [{att: getattr(tok, att) for att in attribs} for tok in doc]

# Passing columns= fixes the column order up front and keeps the frame
# well-formed (empty, but with the expected columns) when the doc has no
# tokens, where selecting df[attribs] afterwards would raise KeyError.
df = pd.DataFrame(table, columns=attribs)
print(df)

In [None]:
# Play with the pos values: report every adjective directly followed by a noun
for token in doc:
    # Only adjectives are of interest
    if token.pos_ != "ADJ":
        continue
    # The last token has no successor; indexing past the end of the doc
    # would raise IndexError, so skip the look-ahead in that case
    if token.i + 1 >= len(doc):
        continue
    # Check if the next token is a noun
    if doc[token.i + 1].pos_ == "NOUN":
        print("Found adjective before a noun:", token.text)

In [None]:
# Draw the dependency parse of the current doc with displaCy
from spacy import displacy

dependency_style = "dep"
displacy.render(doc, style=dependency_style)

In [None]:
# Parse a text made of two sentences and print each detected sentence
doc = nlp("Bu bir cümle. Bu da başka bir cümle.")
sentences = list(doc.sents)
for sentence in sentences:
    print(sentence)

In [None]:
# Render the dependency parse again, passing displaCy's "compact" option
compact_options = {"compact": True}
displacy.render(doc, style='dep', options=compact_options)

In [None]:
# Named entities: print the text and label of each entity found in the doc
doc = nlp("Şimdilik ER yok.")  # ~Rzeczpospolita

for ent in doc.ents:
    print(ent.text, ent.label_)

In [None]:
# Visualize the named entities of the current doc with displaCy
entity_style = "ent"
displacy.render(doc, style=entity_style)

In [None]:
# Simple token attributes: print every token that resembles a number
number_like_tokens = (tok for tok in doc if tok.like_num)
for number_like in number_like_tokens:
    print(number_like)