In [None]:
# Install the spaCy library into the environment of the running kernel
# (%pip, unlike !pip, targets the kernel's own environment).
# NOTE(review): no version is pinned, so a rerun may pick up a different spaCy release.
%pip install spacy

In [None]:
# Import the spaCy library
import spacy

In [10]:
# Download the small English model, but only when it is not already installed,
# so that re-running the notebook does not repeat the download.
from spacy.cli import download
from spacy.util import is_package

if not is_package("en_core_web_sm"):
    # After a fresh download the kernel may need a restart before
    # spacy.load("en_core_web_sm") can find the package.
    download("en_core_web_sm")

[38;5;2m✔ Download and installation successful[0m
You can now load the package via spacy.load('en_core_web_sm')
[38;5;3m⚠ Restart to reload dependencies[0m
If you are in a Jupyter or Colab notebook, you may need to restart Python in
order to load all the package's dependencies. You can do this by selecting the
'Restart kernel' or 'Restart runtime' option.


In [None]:
# Load the pre-trained small English model; the returned pipeline object (nlp)
# is what turns raw text into an analysed Doc.
nlp = spacy.load("en_core_web_sm")

In [41]:
# Run the pipeline on a two-sentence text; calling nlp on a string yields a Doc
doc = nlp(
    "Autonomous cars shift insurance liability toward manufacturers. "
    "This creates interesting legal questions."
)

In [42]:
# Walk the Doc token by token and print one analysis line per token.
# Columns: the token itself, text (raw text), pos_ (coarse-grained
# part-of-speech), dep_ (dependency relation).
for token in doc:
    print(f"{token} {token.text} {token.pos_} {token.dep_}")

Autonomous Autonomous ADJ amod
cars cars NOUN nsubj
shift shift VERB ROOT
insurance insurance NOUN compound
liability liability NOUN dobj
toward toward ADP prep
manufacturers manufacturers NOUN pobj
. . PUNCT punct
This This PRON nsubj
creates creates VERB ROOT
interesting interesting ADJ amod
legal legal ADJ amod
questions questions NOUN dobj
. . PUNCT punct


In [43]:
# Inspect the active pipeline components as (name, component object) pairs
nlp.pipeline

[('tok2vec', <spacy.pipeline.tok2vec.Tok2Vec at 0x2d8390afbf0>),
 ('tagger', <spacy.pipeline.tagger.Tagger at 0x2d8390afcb0>),
 ('parser', <spacy.pipeline.dep_parser.DependencyParser at 0x2d839b0ece0>),
 ('attribute_ruler',
  <spacy.pipeline.attributeruler.AttributeRuler at 0x2d83900fa90>),
 ('lemmatizer', <spacy.lang.en.lemmatizer.EnglishLemmatizer at 0x2d83ad34a90>),
 ('ner', <spacy.pipeline.ner.EntityRecognizer at 0x2d839b0ec70>)]

In [44]:
# Get just the names of the pipeline components, without the component objects
nlp.pipe_names

['tok2vec', 'tagger', 'parser', 'attribute_ruler', 'lemmatizer', 'ner']

In [45]:
# Confirm that calling nlp on text produced a Doc (spacy.tokens.doc.Doc)
type(doc)

spacy.tokens.doc.Doc

In [46]:
# Create a Span object by slicing the Doc: tokens 5 through 10 (the end index 11 is exclusive).
# Indices count tokens, not characters, and this particular slice crosses the sentence boundary.
# Note: Spans are views of the Doc, not copies
my_span = doc[5:11]
print(my_span)

toward manufacturers. This creates interesting


In [47]:
# Confirm that slicing a Doc yields a Span (spacy.tokens.span.Span)
type(my_span)

spacy.tokens.span.Span

In [48]:
# Iterate over the sentences of the Doc (doc.sents) and print each one on its own line
for sentence in doc.sents:
    print(sentence)

Autonomous cars shift insurance liability toward manufacturers.
This creates interesting legal questions.
