# Python Client

In [None]:
# Import ModelBazaar class.
import thirdai
from thirdai.neural_db import ModelBazaar

# Activate your ThirdAI license. Replace the placeholder string below with your
# own activation key before running this cell.
thirdai.licensing.activate("YOUR-THIRDAI-ACTIVATION-KEY")

In [None]:
# Initialise a ModelBazaar object with the URL where Model Bazaar is hosted.
# The base URL must end with `/api/`. Use exactly one slash between the host
# and `api/`: a doubled slash adds an empty path segment to the URL.
bazaar = ModelBazaar(base_url="http://20.29.78.64/api/")

In [None]:
# Sign up on Model Bazaar. Sends an email verification link.
# NOTE(review): the credentials are hard-coded here and are presumably sample
# values; replace them with your own and avoid committing a real password.
bazaar.sign_up(email="mritunjay@thirdai.com", password="password", username="mj3ai")

In [None]:
# Log in with your email address and password (the same values that were
# passed to `bazaar.sign_up`).
bazaar.log_in(email="mritunjay@thirdai.com", password="password")

In [None]:
# Extra training options; passed to `bazaar.train` through its
# `train_extra_options` keyword argument.
train_extra_options = dict(
    num_samples_per_shard=3_500_000,
    allocation_memory=300_000,
    # --- shard-agnostic training params ---
    model_cores=20,
    model_memory=200_000,
    csv_id_column="label",
    csv_strong_columns=["title"],
    csv_weak_columns=["abstract"],
    csv_reference_columns=["title", "abstract"],
    fhr=200_000,
    embedding_dim=4096,
    output_dim=100_000,
    max_in_memory_batches=2000,
)

In [None]:
# Creates a model from scratch, trained on the given list of documents.
# Training can be synchronous or asynchronous (the default). This cell passes
# `is_async=True`, so `bazaar.await_train(model)` is called afterwards to wait.
# `doc_type` can be "local" (default), "nfs" or "s3"; "nfs" is used here.
model = bazaar.train(
    model_name="pubmed-35M-10-models-char4-0",
    docs=["/model_bazaar/datasets/pubmed/lowercased_all_withoutpapertags.csv"],
    doc_type="nfs",
    sharded=True,
    is_async=True,
    train_extra_options=train_extra_options,
)

In [None]:
# Blocking call that waits until the model returned by `bazaar.train`
# finishes training.
bazaar.await_train(model)

In [None]:
# Deploys the model and returns an ndb_client that can be used to interact
# with neural_db.
# Deployment can be synchronous or asynchronous (the default). This cell passes
# `is_async=True`, so `bazaar.await_deploy(ndb_client)` is called afterwards.
ndb_client = bazaar.deploy(
    model_identifier=model.model_identifier,
    deployment_name="deployment-0",
    is_async=True,
)

In [None]:
# Blocking call that waits until the deployment behind `ndb_client` finishes.
bazaar.await_deploy(ndb_client)

In [None]:
# Insert new files into the neural_db model.
# NOTE(review): these are absolute paths on one particular machine; point them
# at your own files before running this cell.
ndb_client.insert(
    files=["/Users/mjay/Documents/MACH.pdf", "/Users/mjay/Documents/OpenMPIInstall.pdf"]
)

In [None]:
# Search the ndb model for the top 5 results.
# `top_k` is a result count, so it is passed as an integer rather than a string.
results = ndb_client.search(query="who are the authors of this paper", top_k=5)

# The response is indexed by "query_text" and "references"; both are kept in
# variables because later cells reuse them. Print the "text" field of every
# returned reference.
query_text = results["query_text"]
references = results["references"]
for reference in references:
    print(reference["text"])

In [None]:
# [RLHF] Associate: expects a list of dictionaries, each holding a 'source'
# key and a 'target' key. The list is built here from (source, target) pairs.
ndb_client.associate(
    [
        {"source": source, "target": target}
        for source, target in (
            ("authors", "contributors"),
            ("paper", "document"),
        )
    ]
)

In [None]:
# [RLHF] Upvote/Downvote: expects a list of dictionaries, each holding a
# 'query_text' key and a 'reference_id' key.
# Indexing positions 4 and 2 requires the earlier search to have returned at
# least five references.
best_answer, good_answer = references[4], references[2]
ndb_client.upvote(
    [
        {"query_text": query_text, "reference_id": answer["id"]}
        for answer in (best_answer, good_answer)
    ]
)

In [None]:
# Deletes documents from the deployment so that they can no longer be searched.
# The document to delete is identified by the "source_id" of the first
# reference returned by the earlier search.
ndb_client.delete([references[0]["source_id"]])

In [None]:
# Undeploys the model served through `ndb_client`.
bazaar.undeploy(ndb_client)

In [None]:
# Deletes the model from Model Bazaar, identified by `model.model_identifier`.
bazaar.delete(model_identifier=model.model_identifier)

In [None]:
# Returns a list of the models accessible to the user on Model Bazaar.
bazaar.list_models()

In [None]:
# Returns a list of all active deployments.
bazaar.list_deployments()

In [None]:
# Connects to an active deployment and returns a client for it.
# NOTE(review): the identifier looks like `<user>/<model>:<user>/<deployment>`;
# confirm the expected format against the Model Bazaar documentation.
ndb_client = bazaar.connect(deployment_identifier="mj3ai/model-0:mj3ai/deployment-0")

In [None]:
# Push an NDB model from a local path to Model Bazaar.
# NOTE(review): `local_path` is an absolute path on one particular machine;
# replace it with the location of your own `.ndb` model.
bazaar.push_model(
    model_name="test-upload-2",
    local_path="/Users/mjay/test.ndb",
    access_level="private",
)

In [None]:
# Pull a model from Model Bazaar to the local machine; the result is kept in
# `ndb_model`.
ndb_model = bazaar.pull_model(model_identifier="mj3ai/model-1")