In [1]:
# Import the libraries
from transformers import AutoModelForCausalLM, AutoTokenizer, DataCollatorForLanguageModeling, Trainer, TrainingArguments
from datasets import load_dataset

# Load the model and tokenizer
model = AutoModelForCausalLM.from_pretrained("https://huggingface.co/meta-llama/Llama-2-7b-chat-hf")
tokenizer = AutoTokenizer.from_pretrained("https://huggingface.co/meta-llama/Llama-2-7b-chat-hf")

# Load the dataset
dataset = load_dataset("wikitext", "wikitext-103-raw-v1")

# Tokenize the dataset
def tokenize_function(examples):
    return tokenizer(examples["text"], return_special_tokens_mask=True)

tokenized_datasets = dataset.map(tokenize_function, batched=True, num_proc=4, remove_columns=["text"])

# Define the data collator
data_collator = DataCollatorForLanguageModeling(tokenizer=tokenizer, mlm_probability=0.15)

# Define the training arguments
training_args = TrainingArguments(
    output_dir="output",
    overwrite_output_dir=True,
    num_train_epochs=1,
    per_device_train_batch_size=4,
    save_steps=10_000,
    save_total_limit=2,
)

# Define the trainer
trainer = Trainer(
    model=model,
    args=training_args,
    train_dataset=tokenized_datasets["train"],
    eval_dataset=tokenized_datasets["validation"],
    data_collator=data_collator,
)

# Train the model
trainer.train()

# Save the model
trainer.save_model("output")


Welcome to bitsandbytes. For bug reports, please submit your error trace to: https://github.com/TimDettmers/bitsandbytes/issues
CUDA SETUP: CUDA runtime path found: /usr/local/cuda/lib64/libcudart.so
CUDA SETUP: Highest compute capability among GPUs detected: 7.5
CUDA SETUP: Detected CUDA version 118
CUDA SETUP: Loading binary /root/anaconda3/envs/venv/lib/python3.11/site-packages/bitsandbytes/libbitsandbytes_cuda118.so...


  warn(msg)


[2023-07-28 12:44:14,221] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)




Downloading (…)a/Llama-2-7b-chat-hf:   0%|          | 0.00/116k [00:00<?, ?B/s]

OSError: It looks like the config file at '/tmp/tmposmwh558' is not a valid JSON file.

In [3]:
from huggingface_hub import notebook_login
notebook_login()


VBox(children=(HTML(value='<center> <img\nsrc=https://huggingface.co/front/assets/huggingface_logo-noborder.sv…

In [4]:
from huggingface_hub import snapshot_download
snapshot_download("meta-llama/Llama-2-7b-chat-hf")


Fetching 16 files:   0%|          | 0/16 [00:00<?, ?it/s]

Downloading (…)of-00002.safetensors:   0%|          | 0.00/3.50G [00:00<?, ?B/s]

Downloading (…)eda92b8e/config.json:   0%|          | 0.00/635 [00:00<?, ?B/s]

Downloading (…)of-00002.safetensors:   0%|          | 0.00/9.98G [00:00<?, ?B/s]

Downloading (…)neration_config.json:   0%|          | 0.00/167 [00:00<?, ?B/s]

Downloading (…)92b8e/.gitattributes:   0%|          | 0.00/1.52k [00:00<?, ?B/s]

Downloading (…)eda92b8e/LICENSE.txt:   0%|          | 0.00/7.02k [00:00<?, ?B/s]

Downloading (…)fetensors.index.json:   0%|          | 0.00/26.8k [00:00<?, ?B/s]

Downloading (…)l-00001-of-00002.bin:   0%|          | 0.00/9.98G [00:00<?, ?B/s]

Downloading (…)l-00002-of-00002.bin:   0%|          | 0.00/3.50G [00:00<?, ?B/s]

Downloading (…)d5eda92b8e/README.md:   0%|          | 0.00/10.4k [00:00<?, ?B/s]

Downloading (…)a92b8e/USE_POLICY.md:   0%|          | 0.00/4.77k [00:00<?, ?B/s]

Downloading (…)cial_tokens_map.json:   0%|          | 0.00/414 [00:00<?, ?B/s]

Downloading (…)model.bin.index.json:   0%|          | 0.00/26.8k [00:00<?, ?B/s]

Downloading (…)okenizer_config.json:   0%|          | 0.00/770 [00:00<?, ?B/s]

Downloading tokenizer.model:   0%|          | 0.00/500k [00:00<?, ?B/s]

Downloading (…)92b8e/tokenizer.json:   0%|          | 0.00/1.84M [00:00<?, ?B/s]

'/root/.cache/huggingface/hub/models--meta-llama--Llama-2-7b-chat-hf/snapshots/01622a9d125d924bd828ab6c72c995d5eda92b8e'

In [6]:
from transformers import AutoModelForCausalLM, AutoTokenizer
model = AutoModelForCausalLM.from_pretrained("/root/.cache/huggingface/hub/models--meta-llama--Llama-2-7b-chat-hf/snapshots/01622a9d125d924bd828ab6c72c995d5eda92b8e")
tokenizer = AutoTokenizer.from_pretrained("/root/.cache/huggingface/hub/models--meta-llama--Llama-2-7b-chat-hf/snapshots/01622a9d125d924bd828ab6c72c995d5eda92b8e")
model.save_pretrained("/var/basefolder_smit/dbq/localdata")
tokenizer.save_pretrained("/var/basefolder_smit/dbq/localdata")

Loading checkpoint shards:   0%|          | 0/2 [00:00<?, ?it/s]

('/var/basefolder_smit/dbq/localdata/tokenizer_config.json',
 '/var/basefolder_smit/dbq/localdata/special_tokens_map.json',
 '/var/basefolder_smit/dbq/localdata/tokenizer.model',
 '/var/basefolder_smit/dbq/localdata/added_tokens.json',
 '/var/basefolder_smit/dbq/localdata/tokenizer.json')