In [14]:
from keybert import KeyBERT

# Sample passage (a paragraph about supervised learning) used as the input
# document for the KeyBERT calls in the following cells.
doc = """
         Supervised learning is the machine learning task of learning a function that
         maps an input to an output based on example input-output pairs. It infers a
         function from labeled training data consisting of a set of training examples.
         In supervised learning, each example is a pair consisting of an input object
         (typically a vector) and a desired output value (also called the supervisory signal).
         A supervised learning algorithm analyzes the training data and produces an inferred function,
         which can be used for mapping new examples. An optimal scenario will allow for the
         algorithm to correctly determine the class labels for unseen instances. This requires
         the learning algorithm to generalize from the training data to unseen situations in a
         'reasonable' way (see inductive bias).
      """
# No `model` argument is passed, so KeyBERT chooses its own embedding model.
kw_model = KeyBERT()
# Extraction with all-default parameters. The result is stored but not displayed
# by this cell.
keywords = kw_model.extract_keywords(doc)

In [15]:
# Three-word keyphrases from `doc`: English stop words are removed and
# KeyBERT's MMR diversification is enabled with diversity 0.5.
# The bare call is the cell's last expression, so its result is displayed.
kw_model.extract_keywords(
    doc,
    keyphrase_ngram_range=(3, 3),
    stop_words='english',
    use_mmr=True,
    diversity=0.5,
)

[('supervised learning algorithm', 0.6992),
 ('function labeled training', 0.663),
 ('labels unseen instances', 0.4239),
 ('called supervisory signal', 0.4016),
 ('function maps input', 0.3176)]

In [16]:
# KeyBERT is re-imported here; this is harmless if an earlier cell already
# imported it.
from keybert import KeyBERT
# Rebind `kw_model`, this time naming the embedding model explicitly.
# NOTE(review): the recorded trigram output for this model is identical to the
# one recorded for the argument-less KeyBERT() — presumably 'all-MiniLM-L6-v2'
# is the library default; confirm against the KeyBERT documentation.
kw_model = KeyBERT(model='all-MiniLM-L6-v2')
# Default-parameter extraction; overwrites `keywords` and is not displayed.
keywords = kw_model.extract_keywords(doc)

In [17]:
# Same trigram / stop-word / MMR settings, run against the current `kw_model`
# so the ranking can be compared with other embedding backends.
kw_model.extract_keywords(
    doc,
    keyphrase_ngram_range=(3, 3),
    stop_words='english',
    use_mmr=True,
    diversity=0.5,
)

[('supervised learning algorithm', 0.6992),
 ('function labeled training', 0.663),
 ('labels unseen instances', 0.4239),
 ('called supervisory signal', 0.4016),
 ('function maps input', 0.3176)]

In [18]:
from flair.embeddings import TransformerDocumentEmbeddings

# Build a flair document-embedding object from the 'roberta-base' identifier.
roberta = TransformerDocumentEmbeddings('roberta-base')
# Hand the flair embedding object to KeyBERT as its model. `KeyBERT` itself is
# not imported in this cell; it must already be in the kernel namespace.
# NOTE(review): every score recorded in this notebook for this model lies
# between 0.9943 and 0.9981, so the ranking it produces is barely
# discriminative — confirm this backend is suitable before relying on it.
flair_kw_model = KeyBERT(model=roberta)

In [1]:
# Passage about NY State sales-tax paperwork, used as the document text `dt`.
# The literal is split at sentence boundaries purely for readability; adjacent
# string literals are concatenated by Python, so the value is one single string.
dt = (
    "Here are specific instructions If the name on the NY State Title Certificate will not change , sales tax forms and proofs are not required. "
    "See information below if you were not a NY State resident when you purchased the vehicle. "
    "If you bought the vehicle from a NY State automobile dealer or an out - of - state dealer that is authorized to collect NY State sales tax , bring the dealer's bill of sale that shows that you paid NY State sales tax. "
    "Also bring a Dealer s Bill of Sale MV-50 NY State dealer only or a completed Sales Tax Exemption {Sales Tax Form} pdf at NY State Department of Tax and Finance DTF-803 for an out - of - state dealer. "
    "If NY State sales tax was paid to a NY State dealer , the DMV does not collect sales tax when you apply for a vehicle registration , and the DMV does not issue a sales tax receipt."
)

In [19]:
# Trigram keyphrases from `dt` using the flair-backed model, with English stop
# words removed and MMR diversification at 0.5.
# NOTE(review): the recorded output contains words such as 'estimate' and
# 'trailers' that do not occur in the `dt` assigned in the In [1] cell but do
# occur in the `dt` assigned in the In [12] cell, so the saved output appears
# to come from a different `dt` — re-run from a fresh kernel to confirm.
flair_kw_model.extract_keywords(
    dt,
    keyphrase_ngram_range=(3, 3),
    stop_words='english',
    use_mmr=True,
    diversity=0.5,
)

[('taxes online estimate', 0.9952),
 ('fees taxes trailers', 0.9952),
 ('vehicle estimate fees', 0.9952),
 ('estimate fees taxes', 0.9952),
 ('register vehicle pay', 0.9951)]

In [21]:
# Keyword extraction (default parameters) over a short utterance.
# `ut` is defined in this cell because no cell above it assigns `ut`, so the
# bare call raised NameError when the notebook was run top to bottom from a
# fresh kernel. The text is the registration-fee utterance whose words
# ('vehicle', 'plate', 'registration', 'fee', 'yes') make up the recorded
# output of this cell.
ut = "Yes, there is a vehicle plate fee as well as a registration fee."
flair_kw_model.extract_keywords(ut)

[('vehicle', 0.9977),
 ('plate', 0.9977),
 ('registration', 0.9976),
 ('fee', 0.9976),
 ('yes', 0.9973)]

In [20]:
# Default-parameter keyword extraction over `dt` with the flair-backed model.
# NOTE(review): the recorded output includes 'fees' and 'counties', which do
# not occur in the `dt` assigned in the In [1] cell but do occur in the `dt`
# assigned in the In [12] cell — the saved output appears to come from the
# latter; re-run from a fresh kernel to confirm.
flair_kw_model.extract_keywords(dt)

[('taxes', 0.9945),
 ('certificate', 0.9944),
 ('fees', 0.9944),
 ('sales', 0.9943),
 ('counties', 0.9943)]

In [2]:
# Short utterance about sales tax at the DMV, used as keyword-extraction input.
ut = "On a good note, you do not have to pay sales tax at the DMV office."

In [None]:
from sentence_transformers import SentenceTransformer

In [19]:
# Default-parameter keyword extraction over the utterance `ut` with the
# flair-backed model; the result is displayed as the cell output.
flair_kw_model.extract_keywords(ut)

[('sales', 0.9981),
 ('dmv', 0.9978),
 ('note', 0.9977),
 ('office', 0.9976),
 ('pay', 0.9974)]

In [3]:
from similarity_checks import SimilarityChecks



In [None]:
# Instantiate the project-local SimilarityChecks helper with no arguments.
# Its constructor is defined in `similarity_checks`, which is not visible here.
sim = SimilarityChecks()

In [12]:
# Document text about estimating registration fees and taxes. The literal is
# split at sentence boundaries for readability; Python joins adjacent string
# literals, so `dt` is still one single string.
dt = (
    "Estimate registration fees and taxes. "
    "If this is the original registration first time you register your vehicle, you must pay the registration fee vehicle plate fee county use tax sales tax see sales tax information title certificate fee of $50.00 MCTD 1 fee for the following 12 counties only: Bronx, Kings Brooklyn, New York Manhattan, Queens, Richmond Staten Island, Dutchess, Nassau, Orange, Putnam, Rockland, Suffolk, and Westchester "
    "If you transfer the registration and plates from another vehicle , you don t need to pay the plate fees or MCTD fee , and you may be able to transfer the registration fees to your new vehicle. "
    "Estimate fees and taxes online The online estimates DOES NOT include the sales tax. "
    "You can also use these charts to estimate your registration fees, use taxes, and supplemental fees for passenger vehicles commercial vehicles Sorry , you cannot use the online service to estimate fees and taxes for trailers or boats see instructions below. "
    "Estimate registration fees and taxes online Estimate trailer and boat registration fees Trailer and boat registration fees are calculated differently."
)
# Utterance to be compared against the document text above.
ut = "Yes, there is a vehicle plate fee as well as a registration fee."

In [13]:
# Compare the utterance with the document text. The recorded result is a 1x1
# float32 array. NOTE(review): what `compute` measures is defined in
# `similarity_checks` and is not visible here — presumably a similarity score;
# confirm against that module.
sim.compute(ut,dt)

array([[0.6645771]], dtype=float32)

In [8]:
# Shell escape: print the GPU status table. The recorded output shows a Tesla
# K80 with 11000MiB of 11441MiB memory in use.
!nvidia-smi

Wed Dec 14 00:25:32 2022       
+-----------------------------------------------------------------------------+
| NVIDIA-SMI 470.141.10   Driver Version: 470.141.10   CUDA Version: 11.4     |
|-------------------------------+----------------------+----------------------+
| GPU  Name        Persistence-M| Bus-Id        Disp.A | Volatile Uncorr. ECC |
| Fan  Temp  Perf  Pwr:Usage/Cap|         Memory-Usage | GPU-Util  Compute M. |
|                               |                      |               MIG M. |
|   0  Tesla K80           On   | 00000001:00:00.0 Off |                    0 |
| N/A   42C    P0    69W / 149W |  11000MiB / 11441MiB |      0%      Default |
|                               |                      |                  N/A |
+-------------------------------+----------------------+----------------------+
                                                                               
+-----------------------------------------------------------------------------+
| Proces

In [11]:
# Shell escape: print the GPU status table again. The recorded output shows
# 0MiB of 11441MiB memory in use on the Tesla K80.
!nvidia-smi

Wed Dec 14 00:34:37 2022       
+-----------------------------------------------------------------------------+
| NVIDIA-SMI 470.141.10   Driver Version: 470.141.10   CUDA Version: 11.4     |
|-------------------------------+----------------------+----------------------+
| GPU  Name        Persistence-M| Bus-Id        Disp.A | Volatile Uncorr. ECC |
| Fan  Temp  Perf  Pwr:Usage/Cap|         Memory-Usage | GPU-Util  Compute M. |
|                               |                      |               MIG M. |
|   0  Tesla K80           On   | 00000001:00:00.0 Off |                    0 |
| N/A   40C    P8    30W / 149W |      0MiB / 11441MiB |      0%      Default |
|                               |                      |                  N/A |
+-------------------------------+----------------------+----------------------+
                                                                               
+-----------------------------------------------------------------------------+
| Proces