In [1]:
import sys

# Make modules in the parent directory importable (presumably the local
# spacy_annotator checkout imported in the next cell — TODO confirm).
# The membership guard keeps this cell idempotent: re-running it does not
# stack duplicate ".." entries onto sys.path.
if ".." not in sys.path:
    sys.path.append("..")

In [2]:
import pandas as pd
import re
from spacy_annotator.pandas_annotations import annotate as pd_annotate

## Example

In [3]:
# Toy corpus for the demo: two sentences mentioning place names, stored in a
# single "text" column with the default 0..n-1 index.
df = pd.Series(
    [
        "New York is lovely, Milan is nice, but London is amazing!",
        "Stockholm is too cold.",
    ],
    name="text",
).to_frame()

In [4]:
# Preview the example frame; as the cell's last expression it is rendered by the notebook.
df

Unnamed: 0,text
0,"New York is lovely, Milan is nice, but London ..."
1,Stockholm is too cold.


### Annotating without a model

In [5]:
# Start an interactive annotation session on `df` without passing a model.
df_labels = pd_annotate(
    df,
    col_text="text",  # column of `df` holding the sentences to annotate
    labels=["GPE", "PERSON"],  # entity labels offered in the input template
    # NOTE(review): presumably the number of rows to sample for annotation —
    # confirm against pd_annotate, whose implementation is not shown here.
    sample_size=1,
)

[1mInstructions[0m 
Input must be in the following format: 
labelA: item1, item2; 
labelB: itemX, itemZ; 

If no entities in text, leave as is and press submit. 
Similarly, if no entities for a particular label, leave as is (or delete the line for that label). 

Buttons: 
*submit inserts new annotation (or overwrites existing one if one is present). 
*skip moves forward and leaves empty string (or existing annotation if one is present). 
*finish terminates the annotation session.


HTML(value='-1 examples annotated, 3 examples left')

Textarea(value='GPE: insert;\nPERSON: insert;', layout=Layout(width='auto'), rows=2)

HBox(children=(Button(description='submit', style=ButtonStyle()), Button(description='skip', style=ButtonStyle…

Output()

In [6]:
# Show the frame returned by pd_annotate for the model-free run.
df_labels

Unnamed: 0,text,annotations
0,Stockholm is too cold.,
1,"New York is lovely, Milan is nice, but London ...",


In [7]:
# Read the "annotations" cell of the row whose index label is 0.
df_labels.loc[0, "annotations"]

''

### Annotating with a model

In [8]:
# Start an interactive annotation session on `df`, this time passing a model name.
df_labels_2 = pd_annotate(
    df,
    col_text="text",  # column of `df` holding the sentences to annotate
    labels=["GPE", "PERSON"],  # entity labels offered in the input template
    # NOTE(review): presumably the number of rows to sample for annotation —
    # confirm against pd_annotate, whose implementation is not shown here.
    sample_size=1,
    # NOTE(review): looks like the name of a spaCy pipeline; presumably used to
    # pre-fill entity suggestions — confirm against pd_annotate.
    model="en_core_web_sm"
)

[1mInstructions[0m 
Input must be in the following format: 
labelA: item1, item2; 
labelB: itemX, itemZ; 

If no entities in text, leave as is and press submit. 
Similarly, if no entities for a particular label, leave as is (or delete the line for that label). 

Buttons: 
*submit inserts new annotation (or overwrites existing one if one is present). 
*skip moves forward and leaves empty string (or existing annotation if one is present). 
*finish terminates the annotation session.


HTML(value='-1 examples annotated, 3 examples left')

Textarea(value='GPE: insert;\nPERSON: insert;', layout=Layout(width='auto'), rows=2)

HBox(children=(Button(description='submit', style=ButtonStyle()), Button(description='skip', style=ButtonStyle…

Output()