# Intro Models

## First Execution

In [None]:
import stanza

# Build a pipeline for English ('en').
nlp = stanza.Pipeline('en')

# Annotate a single example sentence.
doc = nlp('Barack Obama was born in Hawaii.')

# Print one line per word: surface text, lemma, and part-of-speech tag.
for sentence in doc.sentences:
    for word in sentence.words:
        fields = (word.text, word.lemma, word.pos)
        print(*fields)


## Redo

In [None]:
import stanza

# Build the pipeline, restricted to the tokenize and pos processors, and
# specify the part-of-speech processor's batch size.
nlp = stanza.Pipeline(
    'en',
    processors='tokenize,pos',
    use_gpu=True,
    pos_batch_size=3000,
)

# Run the pipeline on the input text.
doc = nlp("Barack Obama was born in Hawaii.")

# Look at the result.
print(doc)

## Multiple Documents

In [None]:
import stanza

# Initialize the default English pipeline.
nlp = stanza.Pipeline(lang="en")

# Raw texts that we are going to process.
documents = [
    "This is a test document.",
    "I wrote another document for fun.",
]

# Wrap each raw text in a stanza.Document object (no pre-existing
# sentences, only the text).
in_docs = []
for text in documents:
    in_docs.append(stanza.Document([], text=text))

# Call the neural pipeline on the whole list of Document objects at once.
out_docs = nlp(in_docs)

# The output is also a list of stanza.Document objects, one per input
# Document; show the second one.
print(out_docs[1])

## Bulk Processing

In [None]:
import stanza

# Initialize the default English pipeline.
nlp = stanza.Pipeline(lang="en")

# Raw texts that we are going to process.
documents = [
    "This is a test document.",
    "I wrote another document for fun.",
]

# Hand the list of raw strings to the pipeline in one call; unlike calling
# nlp(...) on a list, no manual stanza.Document wrapping is done here.
out_docs = nlp.bulk_process(documents)

# The output is a list of results, one per entry in `documents`
# (presumably stanza.Document objects - confirm against the stanza docs);
# show the second one.
print(out_docs[1])