In [None]:
import io, os, sys, types
from IPython import get_ipython
from nbformat import read
from IPython.core.interactiveshell import InteractiveShell
def find_notebook(fullname, path=None):
    """Find a notebook, given its fully qualified name and an optional path.

    Only the last dotted component of *fullname* is used as the file name,
    so "foo.bar" is looked up as "bar.ipynb" inside each directory of
    *path* (for a submodule import, *path* is normally the parent
    package's search path, which yields "foo/bar.ipynb").

    If "Foo_Bar.ipynb" does not exist in a directory, "Foo Bar.ipynb" is
    tried there as well.  The underscore-to-space fallback is applied to
    the file name only, never to the directory part, so directories whose
    names contain underscores are searched correctly.

    fullname: dotted module name being imported.
    path: iterable of directories to search; when empty or None the
        current working directory is searched.

    Returns the path of the first matching notebook, or None if there is
    no match.
    """
    name = fullname.rsplit('.', 1)[-1]
    if not path:
        path = ['']
    # Candidate file names in priority order: the exact name first, then
    # the variant that lets `import Notebook_Name` find "Notebook Name.ipynb".
    candidates = (name + ".ipynb", name.replace("_", " ") + ".ipynb")
    for d in path:
        for filename in candidates:
            nb_path = os.path.join(d, filename)
            if os.path.isfile(nb_path):
                return nb_path
    return None
        
class NotebookLoader(object):
    """Module loader that imports a Jupyter notebook as a Python module.

    The code cells of the notebook are executed in order inside a fresh
    module namespace.  Each cell is first passed through the IPython input
    transformer so that it becomes plain executable Python.
    """

    def __init__(self, path=None):
        """Create a loader.

        path: optional list of directories passed to ``find_notebook``
            when locating the notebook file.
        """
        self.shell = InteractiveShell.instance()
        self.path = path

    def load_module(self, fullname):
        """Import the notebook named *fullname* and return the module.

        Raises ImportError when no matching notebook file is found.  Any
        exception raised while running a cell propagates to the caller;
        in that case the partially initialised module is removed from
        ``sys.modules`` so a later import does not pick up a broken module.
        """
        path = find_notebook(fullname, self.path)
        if not path:
            raise ImportError("no notebook found for module %r" % fullname)

        print("importing Jupyter notebook from %s" % path)

        # load the notebook object (nbformat version 4)
        with io.open(path, 'r', encoding='utf-8') as f:
            nb = read(f, 4)

        # create the module and add it to sys.modules before running any
        # cell, so code in the notebook can see the module being imported
        mod = types.ModuleType(fullname)
        mod.__file__ = path
        mod.__loader__ = self
        mod.__dict__['get_ipython'] = get_ipython
        sys.modules[fullname] = mod

        # extra work to ensure that magics that would affect the user_ns
        # actually affect the notebook module's ns
        save_user_ns = self.shell.user_ns
        self.shell.user_ns = mod.__dict__

        try:
            for cell in nb.cells:
                if cell.cell_type == 'code':
                    # transform the input to executable Python
                    code = self.shell.input_transformer_manager.transform_cell(cell.source)
                    # run the code in the module
                    exec(code, mod.__dict__)
        except BaseException:
            # do not leave a half-executed module importable
            sys.modules.pop(fullname, None)
            raise
        finally:
            # always give the shell its own namespace back
            self.shell.user_ns = save_user_ns
        return mod
class NotebookFinder(object):
    """Module finder that locates Jupyter Notebooks.

    Intended to be placed on ``sys.meta_path``.  Both the legacy
    ``find_module`` hook and the ``find_spec`` hook are provided; the
    import system of Python 3.12 and later only consults ``find_spec``.
    """

    def __init__(self):
        # One loader per search path, keyed by the joined path string
        # (or by None when no path was given).
        self.loaders = {}

    def find_module(self, fullname, path=None):
        """Return a loader for *fullname*, or None if no notebook matches.

        fullname: dotted module name being imported.
        path: search path supplied by the import system (None or a list
            of directories).
        """
        nb_path = find_notebook(fullname, path)
        if not nb_path:
            return None

        key = path
        if path:
            # lists aren't hashable
            key = os.path.sep.join(path)

        if key not in self.loaders:
            self.loaders[key] = NotebookLoader(path)
        return self.loaders[key]

    def find_spec(self, fullname, path=None, target=None):
        """Return a module spec for *fullname*, or None if no notebook matches.

        Thin wrapper over ``find_module`` so the same lookup and loader
        cache serve both import protocols.  *target* is accepted for
        protocol compatibility and is not used.
        """
        # Imported here so the file-level imports stay untouched.
        from importlib.util import spec_from_loader

        loader = self.find_module(fullname, path)
        if loader is None:
            return None
        return spec_from_loader(fullname, loader)

# Register a notebook finder at the end of sys.meta_path, i.e. after every
# finder that is already on the list.
sys.meta_path.append(NotebookFinder())

In [None]:
import transformers

In [None]:
from transformers import AutoTokenizer,AutoModelWithLMHead

In [None]:
# Load the tokenizer published under the "gpt2" checkpoint name.
gpt_tokenizer = AutoTokenizer.from_pretrained("gpt2")

In [None]:
# Load the "gpt2" checkpoint through the language-modeling-head auto class.
# NOTE(review): recent transformers releases mark AutoModelWithLMHead as
# deprecated in favour of AutoModelForCausalLM - confirm against the
# installed version.
gpt_model = AutoModelWithLMHead.from_pretrained("gpt2")

In [None]:
# Tokenize a prompt; return_tensors="pt" asks the tokenizer for PyTorch
# tensors.
gpt_inputs = gpt_tokenizer("A long time ago,",return_tensors="pt")

# Run the GPT-2 model (gpt_model), not the BERT `model` that is only
# defined in a later cell.  The tokenizer output is a mapping of keyword
# arguments, so it is unpacked with ** instead of being passed positionally.
gpt_outputs = gpt_model(**gpt_inputs)

In [None]:
from transformers import AutoTokenizer,AutoModel

In [None]:
# Tokenizer for the "bert-base-uncased" checkpoint.
tokenizer = AutoTokenizer.from_pretrained("bert-base-uncased")

In [None]:
# Model for the same checkpoint, loaded through the generic AutoModel class.
model = AutoModel.from_pretrained("bert-base-uncased")

In [None]:
# Tokenize one sentence; return_tensors="pt" asks for PyTorch tensors.
inputs = tokenizer("Hello world!",return_tensors="pt")

In [None]:
# Unpack the tokenizer output into keyword arguments for the model call.
outputs = model(**inputs)

In [None]:
# Display the raw model output.
outputs

In [None]:
# Show which class the model call returned.
type(outputs)

In [None]:
from transformers import pipeline

In [None]:
# Build a sentiment-analysis pipeline.  No model is named here, so the
# choice of model is left to the library (presumably its default for this
# task - verify against the transformers documentation).
classifier = pipeline("sentiment-analysis")

#### 正负面情感分类器

In [None]:
# Probe the sentiment classifier with a series of short inputs to see how
# it labels each one.
classifier("We are sad.")

In [None]:
# A string that is not a regular sentence.
classifier("hahahaha")

In [None]:
# Opposite sentiments in one sentence.
classifier("We are happy and sad.")

In [None]:
# Same adjective as the first probe, different subject.
classifier("You are sad")

In [None]:
# Single loaded nouns with no surrounding sentence.
classifier("suicide")

In [None]:
classifier("killer")

In [None]:
# The same loaded noun combined with a positive adjective, then with
# violent verbs.
classifier("The killer is happy.")

In [None]:
classifier("The killer is happy to kill people.")

In [None]:
classifier("The killer is going to kill people.")

#### 问答

In [None]:
# Build a question-answering pipeline (no model is named, so the choice is
# left to the library).
question_answer = pipeline("question-answering")

In [None]:
# The pipeline is called with a dict holding a 'question' and the 'context'
# the answer should be taken from.
question_answer({'question':'What\'s the name of ronaldo?','context':'Cristiano Ronaldo is the best football player in the world!' })

In [None]:
# Same call with a Chinese question/context pair.
question_answer({'question':'我爱谁？','context':"我爱学习，爱情不太美好。"})# Chinese is not supported

In [None]:
from sklearn import preprocessing

In [None]:
# One-hot encoder created with its default settings.
enc = preprocessing.OneHotEncoder()

In [None]:
# Fit on four samples with three integer features each.  The three columns
# contain 2, 3 and 4 distinct values respectively.
enc.fit([[0,0,3],[1,1,0],[0,2,1],[1,0,2]])

In [None]:
# Encode a single sample and convert the result with .toarray()
# (presumably from a sparse matrix to a dense array - confirm against the
# installed scikit-learn version).
array = enc.transform([[0,1,3]]).toarray()

In [None]:
# Display the encoded row.
array