### Installation

In [1]:
!pip install -U pip setuptools wheel
!pip install -U spacy



### Language class and object

In [2]:
# Import the English language class
from spacy.lang.en import English

# Create the nlp object
nlp = English()

### Processing text

In [3]:
# Processing a string of text with the nlp object
doc = nlp("Hello world!")

### Docs and tokens

In [4]:
doc = nlp("Hello world!")

# Index into the Doc to get a single Token
token = doc[1]

# Get the token text via the .text attribute
print(token.text)

world


### Span

In [5]:
doc = nlp("Hello world!")

# A slice from the Doc is a Span object
span = doc[1:3]

# Get the span text via the .text attribute
print(span.text)

world!


In [6]:
!python -m spacy download en_core_web_sm
!python -m spacy download en

2021-06-23 15:39:03.103979: W tensorflow/stream_executor/platform/default/dso_loader.cc:60] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory
2021-06-23 15:39:03.104014: I tensorflow/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine.
Collecting en-core-web-sm==3.0.0
  Downloading https://github.com/explosion/spacy-models/releases/download/en_core_web_sm-3.0.0/en_core_web_sm-3.0.0-py3-none-any.whl (13.7 MB)
[K     |████████████████████████████████| 13.7 MB 773 kB/s eta 0:00:01     |███████████████████████▎        | 10.0 MB 1.6 MB/s eta 0:00:03
[38;5;2m✔ Download and installation successful[0m
You can now load the package via spacy.load('en_core_web_sm')
2021-06-23 15:39:24.283447: W tensorflow/stream_executor/platform/default/dso_loader.cc:60] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot ope

[38;5;2m✔ Download and installation successful[0m
You can now load the package via spacy.load('en_core_web_sm')


### Syntactic dependencies

In [7]:
import en_core_web_sm
nlp = en_core_web_sm.load()

# Process a text
doc = nlp("She ate the pizza")

# Iterate over the tokens
for token in doc:
    # Print the text and the predicted part-of-speech tag
    print(token.text, token.pos_)

She PRON
ate VERB
the DET
pizza NOUN


In [8]:
from spacy import displacy

doc = nlp("She ate the pizza")
displacy.serve(doc, style="dep")




Using the 'dep' visualizer
Serving on http://0.0.0.0:5000 ...

Shutting down server on port 5000.


### Named entities

In [9]:
# Process a text
doc = nlp("Apple is looking at buying a U.K. startup for $1 billion")

# Iterate over the predicted entities
for ent in doc.ents:
    # Print the entity text and its label
    print(ent.text, ent.label_)

Apple ORG
U.K. GPE
$1 billion MONEY


In [10]:
doc = nlp("Apple is looking at buying a U.K. startup for $1 billion")
displacy.serve(doc, style="ent")


Using the 'ent' visualizer
Serving on http://0.0.0.0:5000 ...

Shutting down server on port 5000.
