In [1]:
! pip3 install transformers
! pip3 install datasets

Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/
Collecting transformers
  Downloading transformers-4.26.1-py3-none-any.whl (6.3 MB)
[2K     [90m‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ[0m [32m6.3/6.3 MB[0m [31m49.3 MB/s[0m eta [36m0:00:00[0m
[?25hCollecting tokenizers!=0.11.3,<0.14,>=0.11.1
  Downloading tokenizers-0.13.2-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (7.6 MB)
[2K     [90m‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ[0m [32m7.6/7.6 MB[0m [31m49.6 MB/s[0m eta [36m0:00:00[0m
Collecting huggingface-hub<1.0,>=0.11.0
  Downloading huggingface_hub-0.12.1-py3-none-any.whl (190 kB)
[2K     [90m‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ‚îÅ[0m [32m190.3/190.3 KB[0m [31m7.

In [2]:
from google.colab import drive

# Mount Google Drive at /content/gdrive; the dataset paths defined later in
# the notebook (COLAB_DATA_PATH) point below this mount point.
drive.mount('/content/gdrive')

Mounted at /content/gdrive


In [3]:
from transformers import pipeline, AutoTokenizer, AutoModelForCausalLM, TrainerCallback, TextDataset, DataCollatorForLanguageModeling, TrainingArguments, Trainer
import torch
from os.path import join


# Device that the model and the prompt tensors are moved to. Prefer the GPU,
# but fall back to the CPU so the notebook still runs on a runtime without CUDA.
DEVICE = 'cuda' if torch.cuda.is_available() else 'cpu'


def get_ru_model(checkpoint = "sberbank-ai/rugpt3small_based_on_gpt2"):
    """Load a causal language model and its tokenizer from one checkpoint.

    Args:
        checkpoint: Model identifier or path handed to ``from_pretrained``
            for both the model and the tokenizer.

    Returns:
        A ``(model, tokenizer)`` tuple; the model has been moved to ``DEVICE``.
    """
    language_model = AutoModelForCausalLM.from_pretrained(checkpoint)
    language_model = language_model.to(DEVICE)
    text_tokenizer = AutoTokenizer.from_pretrained(checkpoint)
    return language_model, text_tokenizer


def print_generations(prefix = ". ", n_samples=4, max_len=70, one_line=True):
    """Sample continuations of ``prefix`` and print them to stdout.

    Uses the module-level ``model`` and ``tokenizer`` (bound by the cells that
    call ``get_ru_model()``) and the module-level ``DEVICE``.

    Args:
        prefix: Prompt text every sample starts from.
        n_samples: Number of sequences to sample (``num_return_sequences``).
        max_len: Passed to ``generate`` as ``max_length``.
        one_line: When true, only the part of each decoded sample before the
            first newline is printed.

    Returns:
        None.
    """
    global model, tokenizer
    input_ids = tokenizer.encode(prefix, return_tensors='pt').to(DEVICE)
    # The Trainer leaves the model in training mode, where dropout is active.
    # Sample in eval mode and restore the previous mode afterwards so a
    # training run that is still in progress is not affected.
    was_training = model.training
    model.eval()
    try:
        sample_outputs = model.generate(
            input_ids,
            do_sample=True,
            max_length=max_len,
            top_k=50,
            top_p=0.90,
            num_return_sequences=n_samples,
            # Same id as bos/eos in the generation config logged by this model.
            pad_token_id=50256
        )
    finally:
        model.train(was_training)
    for row in sample_outputs:
        text = tokenizer.decode(row)
        if one_line:
            text = text.split("\n")[0]
        print(text)


class PringSamplingCallback(TrainerCallback):
    """Trainer callback that prints sample generations on every log event.

    NOTE(review): the class name presumably was meant to read "Print..."; it
    is kept as is because ``finetune`` refers to it by this name.
    """

    def on_log(self, args, state, control, **kwargs):
        """Print the current epoch progress framed around fresh samples.

        The samples come from ``print_generations()`` with its default
        arguments, i.e. from the module-level model and tokenizer.
        """
        header = f"===== progress: {state.epoch} ========="
        footer = "=========================="
        print(header)
        print_generations()
        print(footer)


def freeze_layers(model, n_layers=8):
    """Exclude the embeddings and the first ``n_layers`` blocks from training.

    Sets ``requires_grad = False`` on every parameter of
    ``model.transformer.wte``, ``model.transformer.wpe``,
    ``model.transformer.drop`` and ``model.transformer.h[:n_layers]``.
    Parameters outside these modules are not touched.

    Args:
        model: Model exposing a ``transformer`` attribute with ``wte``,
            ``wpe``, ``drop`` and a sliceable module list ``h``.
        n_layers: How many leading blocks of ``model.transformer.h`` to
            freeze; must lie between 0 and the number of blocks.

    Raises:
        AssertionError: If ``n_layers`` is outside the valid range.
    """
    # Bound the argument by the real depth of the model instead of assuming
    # a 12-block architecture.
    n_blocks = len(model.transformer.h)
    assert 0 <= n_layers <= n_blocks, (
        f"n_layers must be between 0 and {n_blocks}, got {n_layers}"
    )
    to_freeze = (
        model.transformer.wte,
        model.transformer.wpe,
        model.transformer.drop,
        model.transformer.h[:n_layers]
    )
    for paramgroup in to_freeze:
        for param in paramgroup.parameters():
            param.requires_grad = False


def finetune(model, tokenizer, path, n_epochs="auto", adjust_to_size=5e6):
    """Fine-tune ``model`` on a plain-text file and save the result.

    Builds a ``TextDataset`` with 256-token blocks from ``path``, trains with
    a ``Trainer`` (batch size 8, logging every 50 steps, checkpoint every 500
    steps) and saves the final model to the current directory.

    Args:
        model: Causal language model to train; updated in place.
        tokenizer: Tokenizer used to build the dataset and the collator.
        path: Path of the training text file.
        n_epochs: Number of epochs, or ``"auto"`` to derive it from the
            length of the file as ``adjust_to_size / number_of_characters``
            (the result may be fractional).
        adjust_to_size: Target number of characters to train on when
            ``n_epochs`` is ``"auto"``.

    Raises:
        ValueError: If ``n_epochs`` is ``"auto"`` and the file is empty.

    Note:
        The samples printed during training come from
        ``PringSamplingCallback``, which calls ``print_generations()`` and
        therefore uses the module-level ``model`` / ``tokenizer``, not
        necessarily the objects passed to this function.
    """
    if n_epochs == "auto":
        # Close the file deterministically and use an explicit encoding so
        # the character count does not depend on the platform's locale.
        with open(path, encoding="utf-8") as corpus:
            n_chars = len(corpus.read())
        if n_chars == 0:
            raise ValueError(
                f"cannot derive the number of epochs from an empty file: {path}"
            )
        num_train_epochs = adjust_to_size / n_chars
        print("SETTING N_EPOCHS TO ", num_train_epochs)
    else:
        num_train_epochs = n_epochs

    dataset = TextDataset(
        tokenizer = tokenizer,
        file_path = path,
        block_size = 256,
    )
    # mlm=False: plain causal language modelling, no token masking.
    data_collator = DataCollatorForLanguageModeling(
        tokenizer=tokenizer,
        mlm = False,
    )
    training_args = TrainingArguments(
        output_dir=".",
        overwrite_output_dir=False,
        per_device_train_batch_size=8,
        num_train_epochs=num_train_epochs,
        logging_steps=50,
        save_steps=500,
    )
    trainer = Trainer(
        model=model,
        args=training_args,
        data_collator=data_collator,
        train_dataset=dataset,
        callbacks=[PringSamplingCallback],
    )
    trainer.train()
    # Writes config and weights into output_dir (the current directory).
    trainer.save_model()


# Directory on the mounted Google Drive that holds the training corpora.
COLAB_DATA_PATH = "/content/gdrive/MyDrive/datasets/"
# One path per corpus file, in the same order as the file names below.
OLDRU_PATH, DOST_PATH, TOLST_PATH, LENIN_PATH = (
    join(COLAB_DATA_PATH, corpus_file)
    for corpus_file in ("oldrussian.txt", "dost.txt", "tolst.txt", "lenin.txt")
)

# Тексты на древнерусском языке

In [4]:
# Load the default pretrained checkpoint and bind it to the module-level
# `model` / `tokenizer` names that print_generations() reads.
model, tokenizer = get_ru_model()
# Freeze the embeddings, the dropout module and the first 4 transformer
# blocks; freeze_layers leaves every other parameter untouched.
freeze_layers(model, 4)

Downloading (‚Ä¶)lve/main/config.json:   0%|          | 0.00/608 [00:00<?, ?B/s]

Downloading (‚Ä¶)"pytorch_model.bin";:   0%|          | 0.00/551M [00:00<?, ?B/s]

Downloading (‚Ä¶)olve/main/vocab.json:   0%|          | 0.00/1.71M [00:00<?, ?B/s]

Downloading (‚Ä¶)olve/main/merges.txt:   0%|          | 0.00/1.27M [00:00<?, ?B/s]

Special tokens have been added in the vocabulary, make sure the associated word embeddings are fine-tuned or trained.


In [5]:
# Fine-tune on the Old Russian corpus. n_epochs defaults to "auto", so the
# epoch count is derived from the file length (see the log line below).
finetune(model, tokenizer, OLDRU_PATH)

SETTING N_EPOCHS TO  0.587214714943076


***** Running training *****
  Num examples = 11776
  Num Epochs = 1
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 865
  Number of trainable parameters = 56704512


Step,Training Loss
50,4.4193
100,4.2914
150,4.2192
200,4.155
250,4.0967
300,4.0715
350,4.0767
400,4.0571
450,4.0598
500,4.0168


Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –û–Ω –∂–µ, –≤–∏–¥—è —á—Ç–æ –ø–∏—Ç–∏–µ–º –±–æ –∏ –æ—Ç —á–∞–¥—ä—è –∏ –æ—Ç –¥—É—Ö–æ–≤—ä –ø—Ä–∏–∏–º—ä. –æ —Å–µ–º—ä–∂–µ –ø–æ–µ–ª–∏ —Å–æ –º–Ω–æ—é, –∏ –∫—Ä—£–ø–∏–µ –¥—£—Ç–∏ –≤—ä —Ü–µ—Ä–∫–æ–≤—å, –∞ –∏ –ø—Ä–∏–∏–¥–µ, –∏ –±—ã—Å—Ç—å —Å—ä –ø–Ω–µ–º—ä —Å—å –≤ —Ü–µ—Ä–∫–æ–≤—å, –∏ –≤—ä –Ω–µ–π
.  –í—£—Ä–Ω–æ–µ –∂–µ –ø—Ä–µ—Å—Ç–∞–≤–ª–µ–Ω–∏–µ, —è–∫–æ –≤—Å—£–º –±–æ, —è–∫–æ–∂–µ –≤—£–¥—É—â–∏–µ., –≤—ä–∑–º–æ–∂–µ–Ω—ä –∂–∏—Ç–∏—é, —Ç—£–ª–∞ –∏ –º—ã—Å–ª–∏, –±—ã—Å—Ç—å, –±—£—è—à—à—É, –≤—£—Ç–º–æ –º—£—Å—è—Ü–∞, –∏ –ø–∞–∫–∏ –≤—ä–∑–¥–µ—Ä–∂–∞–Ω–∏—à–∏—Å—è.
.  –ö–æ–≥–¥–∞ –∂–µ –¥–æ—Å—Ç–æ—á–Ω—ã –∏ –æ—Ç—á–∏—Å—Ç–æ –∏—Ö —Å—£–¥–∏–ª–∏, –∏ –æ–Ω—ã—Ö –∂–µ —Å—ä—Å–æ—Ä—ä–∑–Ω–∏—Ü—ä –Ω–∞—£—Ö –∏ —Å–Ω—£–∫—ä –ø—Ä–∏ –Ω–∏—Ö—ä, –∏ –æ—Ç—ä –Ω–∏—Ö—ä –∂–µ —Å—ä–≥—Ä–∞–¥–æ—à–∞ —Å—ä –Ω–∏–º–∏—ä, –∏ –æ—Ç –Ω–∏—Ö—ä –∂–µ –≤—ä —Ç—ä–º—ä –∂–µ —Ç—ä–º—ä –∂–µ –≤
.  –û–Ω –∂–µ –æ—Ç –ª–∏—Ü–∞ —Å–≤—£—Ç–∞ —Å—å–¥–µ –Ω–∞ –ª—£—Ç–∞, –∏ –º—£—Å—å–∫–∏ –ø–æ—Å—Ç–∞–≤–∏, –∏ –æ—Ç –ª—£—Ç–∞, –∏ –æ—Ç —Ç—£—Ö—ä, –Ω–æ –∏ –æ—Ç –Ω–∏—Ö—ä. –∏ —è–∫–æ –≤—ä —Ç—É –Ω–æ—á—å –æ—Ç –Ω–∏—Ö—ä –∫—ä —Ü–∞

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –í—ä–¥—£—Ç—å –∂–µ –Ω–µ—Å—Ç—å –µ—è –≤—ä–¥—£—Ö—å, –∞ —Å—£—è, –±–æ –ø–æ —Ç—£–ª–æ, –≤—ä–∑–¥–æ—Ö—ä. –∏ –µ—è –∂–µ –ø–æ –ø—Ä–µ–ª—ä—Å—Ç–≤–µ –¥—ã—Ö—Ö—ä, –≤–Ω–∏–¥–µ –≤ —Ä–∞–∫—É, –∏ –µ—è —Å—Ä–µ–±—£ –¥—ã—Ö—Ö, –∏ –¥—ã—Ö—Ö—ä
.  –ò –≤–∑–∞–ª—ä–∫–æ—Å—è, –∏ –≤–∑–∞–ª—ä–∫—ä, –∏ —Ç–∞–∫–æ, –≤–∑–∞–ª—ä–∫—ä, –∏ —Ç–∞–∫–æ –∏ –∑–∞–∏—à–∞—à–∞—à–∞, –∏ –ø—Ä–∏—£—Ö—à–∏, –∏ –∏ –ø—Ä–∏—£—Ö—à–∞, –∏ –æ–≥–æ—à–∞, –∏ –ø—Ä–∏—£—Ö—à–∞, –∏ –ø—Ä–∏–µ—Ö—à–∞, –∏ –ø—Ä–∏–µ—Ö—à–µ,
. 
.  –í—ä–ª–≥–∞–µ–∂–µ –º—£–Ω—ã –±—ã—à–∞, –∏ —Å—à–µ–¥—à–µ –≤–æ –≤—Å—£ –º–æ–Ω–∞—Å—Ç—ã—Ä–∏, –∞ –∏–Ω–∞—à–µ –≤ –Ω–µ–≥–æ –≤–∑–¥—£–ª–∏—à–∞—Å—è. –∏ —Å–µ, –Ω—£—á—é–∂–µ, –º–Ω—£ –∏ –±—ã—à–∞ –ø–æ –º–æ–Ω–∞—Å—Ç—ã—Ä—Å–∫–æ–º—É –∂–∏—Ç–∏—é –∏ –ø–æ –≤—Å—£–º—ä—ä –ø—Å–∫–æ–≤—Å–∫–∏–º—ä –º


Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



. 
.  –ò –≤–æ—Ç, –∏–¥—£–∂–µ, –∏–∑–º—£–Ω–∏–≤—Å—è, –Ω–æ –∏ –≤–º—£–Ω–∏–≤—Å—è, —Ç–∞–∫–æ —Ä–µ—á–µ –∏–º—ä: "–∫—Ç–æ –Ω–µ –∏–º–µ–µ—Ç—ä —Ç–æ–≥–æ, –Ω–µ –≤—£—Å—Ç–Ω–∏–∫—ä, –Ω–æ –∏–Ω–æ—á–µ—Å—Ç–Ω—ã–π?  –≤—ã –ª—å—à–∏—à—ä—Å—è –ª–∏—à–∏—Å—è –ª–∏—à–∏—à–∞—Å—è, –∏ —Å –Ω–∞–º–∏, —Ç–∞–∫–æ–∂–µ
.  –ï–≥–¥–∞ –∂–µ –æ–Ω –≤–æ –≤—Å–∏, –∏ –Ω–µ –¥–∞—Å—Ç—ä –µ–º—É –ø—Ä–∏–ª–æ–≥–∞. –æ—Ç—å –±—è—à–µ —Å—ä—Ç–≤–æ—Ä–∏—à–∏—Å—è, –∏ –æ—Ç—å–≥—Ä–∞—Ö —Å—è, –∏ –ø—Ä–µ–≤–µ–¥–µ –æ—Ç –Ω–µ–≥–æ –∏ –º—è, –∏ —Ä–µ—á–µ –∫—ä –Ω–µ–º—Ü—É, —è–∫–æ: ¬´–æ—Ç—ä–∫—ã¬ª. –æ–Ω—ä –∂–µ —É–±–æ –Ω–µ –¥–∞—Å—Ç—å
.  –ó–∞ —Å–∏–º—ä–≥–ª–∞—Å–∏—Ç–µ –º—å—Å—Ç–µ–Ω—å—Å—Ç–≤—É—é—â—É: "–∑–∞–±–ª—É–¥–∏—Ç–µ—Å—è –∏ –ø–æ–≥—É–±–∏—Ç–µ! –Ω–µ –ø–æ –Ω—å —Å–∏ –±—£, –Ω–æ –Ω—ã–Ω—£!" –∏ –ø–∞–∫–∏ —É–±–æ –≤—ä–∑–ª–æ–∂–∏—à–∏—Å—è –Ω–∞ —Ç—è. –∏ –æ—Ç—Ç—É–¥—É –Ω–µ –ø—Ä–µ—Å—Ç–∞–Ω–∏—à–∞. –∏ –∫ —Ç–æ–º—É –ø—Ä–∏–∏–¥–æ—à–∞,


Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ü—Ä–µ–±–Ω—£ –±—£—Ç–∏ –ø–æ-–ø—Ä–µ–∂–Ω–µ–º—É, –∞ –Ω–∞—Å–ª—£–¥—à–µ –≤—ä—Å–µ–¥—£–π, –∞–∑ –∂–µ, –≤—ä—Å–∏–¥–µ –≤—ä –µ–¥–∏–Ω—£, –≥–ª–∞–≥–æ–ª—é—â–µ —Å –≤–∞–º–∏: ¬´–≤—£–¥–∞–µ—Ç–µ –ª–∏ –µ—Å–∏, –¥–∞ –Ω–µ –±—É–¥—É —Å–µ¬ª.  ¬´–∫—Ç–æ —Å–µ –±—É–¥–µ—Ç—ä –∏ —Ä–µ—á–µ–º, —Å–µ –∏ –±—É–¥–µ—Ç—ä –∏
.  "–∞—â–µ –±–æ –Ω—£–∫–∞–∞—à–∏", —Ç–æ –∞–∑—ä –∂–µ, –ø—Ä–∏—è—Ö–∞ –∫—ä –∏–≥—É–º—É –∏ –≤–æ–ø—Ä–æ—à–∞: ¬´–æ, –∏–≥—É–º–µ–Ω—ä, —á—Ç–æ —Ö–æ—â–µ—Ç—å?" ‚Äî –∏–≥—É–º–µ–Ω—ä —Ä–µ—á–µ: ¬´–¥–∞–Ω–∏, –∏–∂–µ —É –Ω–∞—Å—ä –µ—Å—Ç—å¬ª, –∏ –≥–ª–∞–≥–æ–ª–∞: ¬´–∏ –Ω–µ –±–æ—à–∏ –º–∏, –æ
.  –ò —Ç–æ –±—ã—Å—Ç—å –∂—£ –≤ –º—ä—Å—Ç–µ—Ü—£, –∞ –≤ —Ç–æ–º –º—£—Å—Ç–æ ‚Äî –Ω–µ –±—ã—Å—Ç—å. –¥–∞ –∏ –Ω–∏ –≤ —á–µ–º –±—ã—Å—Ç—å: "–Ω–µ –≤—£–¥—É –º—£—Å—Ç–æ –Ω–∞ –Ω–µ–±–æ". —É–±–æ –±–æ –µ—Å—Ç—å –≤ —Ç–µ–º–Ω–∏—Ç–∏ –º–Ω–æ–≥–∞ –∏ –º—£—Å—Ç–æ –Ω–∞ –∑–µ–º–ª—é, —è–∫–æ –≤ —Ç–æ–π –∑–µ–º–ª–µ —Å–µ—á–µ—à–∏,
.  –ò —Å–µ –Ω–∞—Ä–µ–∫–∞—à–µ, —è–∫–æ: "–æ, —á—Ç–æ –≤—ä–∑–º–æ–∂–µ—à–∏, –æ, —á—Ç–æ –º–∏, –æ, —á—Ç–æ –Ω–∞–º—ä –Ω–µ –Ω–∞–ø–∞–¥–∞—à–µ?" –∏ –±—ã—Å—Ç—å, –∏ –≤—ä–∑–º–æ–∂–µ—à–∏

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  "–≤—Å–µ–º –∂–µ, —É–±–æ –¥—å—Ä–≤–∞, –¥–∞ –Ω–µ —Å—ä–∑—Ä—£—à–∞—Ç–∏ –∏–Ω—ã—è: –Ω–∏ —É–±–æ —Å—è, –Ω–∏ —É–±–æ –æ—Ç—ä –º–µ–Ω—è; –∏ –Ω—ã–Ω—£ –µ–¥–∏–Ω–∞ –º–Ω–æ–≥–∞ –¥—£–ª–∞ –∏ –º–Ω–æ–≥–∞ —á—é–¥–Ω–æ—Å—Ç–∏ –∏ –≤—ä–∑—Ä–∞—â–∞—é—â–∞. —Å–µ–º—É –∂–∏—Ç–∏, —è–∫–æ –Ω–µ —Ç–æ–∫
.  –∏ —Ä–µ—á–µ: "–Ω–µ —Ç—É–∂–∏, —Å–∏ —Å–∏, –Ω–µ —Ö—É–∂–∏, –∞ —è–∫–æ —Ö–æ—â–µ—à–∏ –∏ –ø—Ä–∏—Å–Ω–æ —Ç–µ–±–µ. –∏–∂–µ –≤ –ª—£—Ç—£—Ö—ä —Ç–≤–æ–µ–º, –Ω–µ –º–æ–ª–∏–ª—ä –ë–æ–≥–∞, –∞ –æ—Å—Ç–∞–≤–∏ –º—è –±–æ–≥—ä, –∏–∂–µ –æ—Ç —Ä—É—Å–∫–∞–∞, –µ–∂–µ –≤—ä—Å–∏ –æ—Ç –Ω–∞—á–∞–ª–∞ –∏ –¥–æ –Ω–∏–∑
.  –ê –∏–∂–µ –≤—ä–ø—Ä–æ—Å–∏, –ø–æ—Å—Ç–∞–≤–∏, —É—Ä–∞–∑—É–º–µ—Ç—å —Å–∏, —Ç–∞–∫–æ –¥–∞ –ø—Ä–æ—Å–≤–µ—Ç–ª–µ—à–∏—Å—è, –ø—Ä–∏—Å–Ω–æ —Ä–∞–∑—É–º—£ –∏ –æ –±–ª–∞–∂–µ–Ω–Ω—ã–π –¥—É—Ö—ä, –µ–∂–µ —Å—ä—Ç–≤–æ—Ä—è–µ—Ç—ä –µ–¥–∏–Ω–∞–≥–æ –≤—£—Ä—Ü–∞ –∏ —Ç–≤–æ—Ä—è—Ç—ä –º–Ω—£—Ç–∏ –æ –≤—Å—£—Ö—ä –æ–Ω—ã—Ö—ä; –Ω–µ —É–±–æ, —è–∫–æ –±—ã
.  –∏ –º–Ω–æ–∑–∏ –±—£ –≤–æ–∏–Ω—É –≤—ä —Ç—£—Å—£—Ö—ä. –∞—â–µ –∂–µ –Ω–µ —É—á–∏–Ω—è—à–µ –≤—Å–µ–º—É, –∞—â–µ –∂–µ –æ–Ω—É—â–µ—à—è, —Ç–æ –æ—Ç–∂–µ —Å–µ —Ç–≤–æ—Ä—è—â—

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –Ø–¥–∞ –∂–µ —É –Ω–µ–≥–æ—ä –Ω–µ –±—ã–ª–æ, –∏ –≤–æ–∏ –Ω–∞ –∫–æ–Ω–Ω—ã—Ö—ä –∏ –Ω–∞ –∑—ä –∫–æ–Ω–µ–π, –Ω–µ –ø–æ–±—£–∂–∞–≤—à–∏—Å—è –æ—Ç –Ω–∏—Ö, –∞ –∏–Ω—ã–µ –≤ —Ç—É –∂–µ –≤–µ—á–µ—Ä–∏–Ω—É –ø–æ –≤—Å—è –¥–Ω–∏ –≤ –∫–µ–ª–∏–∏ —Å–≤–æ–µ—è –º–æ–ª–∏—à—è—â–µ—Å—è –∏–º—ä. 
.  –í—ä–ª—£–∑–∞—è –ø–æ —Å–µ–¥–æ–º—É –¥—Ä–µ–≤–Ω–∏—é –º–æ—Å—Ç—É, —É–∑—Ä–µ—Ç—å –±–æ –≤ –∑–µ–º–ª—é –æ—Å—Ç–∞–≤–∏ –∏ –æ—Ç –∑–ª–∞—Ç–æ—Ç–∫–∞. –æ–Ω –∂–µ —Å –ª—é–±–æ–≤–∏—é —Å–≤–æ–µ—é —Å–≤—è—Ç—É—é –∏–∫–æ–Ω—É —Å–≤—è—Ç–∏—Ç–µ–ª—è, —è–∫–æ —Å–≤—è—Ç—É—é –µ–≥–æ –∏–∫–æ–Ω—É –≤ –ª—£—Ç—ä —Å–≤–æ–µ–≥–æ –º—£—Å—Ç–∞, –∏ –æ—Å—Ç–∞–≤–∏—à–∞ –∏–∫–æ–Ω—É –µ–≥–æ, –∏–∂–µ –≤ —Ä—É—Ü—£
.  –û–Ω—ä –∂–µ, –≤–∏–¥—è, —è–∫–æ –Ω–µ –ø–æ —Å–µ–±–µ, –∏ –Ω–µ –º–æ–∂—£—Å—è –æ—Ç—ä—Å—Ç–æ—è—Ç–∏ –æ—Ç –º–µ–Ω–µ, —Ç–æ –∏ –Ω–µ –≤–∑–∏–º–∞–π—Å—è –Ω–∞ –¥—Ä—É–∂–∏–Ω—ã —Å–≤–æ–∏—Ö. –∏ –Ω–µ –æ–±—Ä—£—Ç–æ—à–∞ –∏—Ö –∏ —Å–µ—é, –≤ –ø–æ–ª–µ –∏ –≤ —Ä–∞—Ç—É—à–∏ —Å —Å—£–±—£—Ö–æ–º—ä –∏ —Å –¥—Ä—É–∂–∏–Ω—ã.  –ò
.  –ê–∂–µ –æ –º–Ω–æ–∑–µ, –≤ –Ω–µ–π–∂–µ –Ω–∏—Å–º–∏. –æ–∂–µ –º–Ω–æ–∑–∞ –∏ —è–∫–æ –Ω—£–∫—ã–π –º–∑–¥–æ–∏–º—£—Å

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ò —Ç–∞–∫–æ –Ω–∞ –º—è—Å–µ –∏ –Ω–∞ –∑—£–ª–æ, –∏ —Ç–∞–∫–æ –Ω–∞ –º—è—Å–µ –∏ –Ω–∞ –∑—£–ª–æ –∏ –Ω–∞ –µ–ø—Ç–∞—Ä–µ—Ö—ä –∏ –Ω–∞ –≤—ä–ø–∏—Ö–∏–∏—Ö–∏–∏—Ö–∏—à–∞. –∏ —Ç–∞–∫–æ –Ω–∞ –º—è—Å–µ –∏ –Ω–∞ –µ–ø—Ç–∞—Ä–µ—Ö—É –∏ –Ω–∞ –µ–ø—Ç–∞—Ä–µ—Ö –∏ –Ω–∞ –±—è—à–µ,
.  –û–¥—É—Ä–µ—Ç–∏ –±—è—à, –Ω–µ –¥–æ—Å—Ç–∞–≤–∏—à–∏ –∫ –æ—Ç—Ü—É —Å–≤–æ–∏—Ö, –≤ —Ç–æ –≤—Ä–µ–º—è –∂–µ, –∏ –Ω–∞ –Ω—å, –æ—Ç—Ü–µ–º —Å–≤–æ–∏–º—ä, –∏ —Å–∞–º—ä –∑–ª–∞—è, –æ—Ç—ä –±—Ä–∞—Ç–∞ —Å–≤–æ–µ–≥–æ, —è–∫–æ —Ä–∞—Ç—å, –∏ –ø–æ –≤—Å—è –¥–Ω–∏ –Ω–µ –æ—Ç–∏. —Å–∞–º—ä –∂–µ. –≤ —Ç–æ–º –∂–µ –ª—£—Ç–æ 6345.
.  –ò —Ä–µ—á–µ –µ–º—É: "—Å–µ–∏ –±–æ –µ—Å–∏: –∞—â–µ —Ö–æ—â–µ—à–∏ –Ω–∞ –Ω—£—Ç–º–æ, –¥–∞ –Ω–µ –æ—Ç—Ä–∏–Ω—É—Ç –≤ –∑–µ–º–ª—é —Å–∏ –∏–∂–µ –µ—Å—Ç—å –≤—ä—Å—Ö–æ—Ç—£–Ω–∏–∏, —Ç–æ —Å —Ç–æ–±–æ—é –±—É–¥–µ—Ç—å –∑–µ–º–ª–∏ –µ–≥–æ, –∞—â–µ –∏ –Ω—ã–Ω—£ –±—ã—Ö—ä –±—ã–ª—ä, –æ—Ç—Ä–∏–Ω—É –±—ã—Ö, –¥–∞ –∏
.  –û–Ω–∏ –∂–µ, –ø–æ–Ω–µ–∂–µ, —Ö—Ä–∏—Å—Ç–æ–≤—ã –¥–∞—Ä—ã —Ä–∞–∑–ª—É—á–µ–Ω–∏–µ–º –ø—Ä–µ—á–∏—Å—Ç—ã—Ö –∏ –ø—Ä–µ—Å–ª–∞–≤–Ω—ã–º –ø—Ä–µ—Å—Ç–∞–≤–ª–µ–Ω–∏–µ–º –≤–æ –º–Ω—£—Ö –ø—Ä–∏—á–∞—Å—Ç–∏—é, –∏

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  "–≤—ä—Å—Ç–∞ –±–æ –µ—Å—Ç—å –¥–æ –ø—£–Ω–∏–∏ –ø–æ—£–¥—ä". –∞ –≤—ä—Å—Ç–∞, —è–∫–æ –Ω–µ –ø–æ –Ω–æ–∑—£ –ø—£–¥—£—Ç–∏, –∏ —Ä–µ—á–µ: ¬´–Ω–µ —Ö–æ—â—É –æ—Ç–∏–∂–µ –≤—ä–∑–¥—£¬ª. —Ç—£–ª–æ —Ç–æ, —Å–ª–æ–≤–æ —Ä–µ—á–µ, –¥–∞ –Ω–µ –≤—£–¥–∞—Ç–∏, –Ω–∏ –ø–æ—Ç—å, –Ω–∏
. 
.  –ò —Ç–æ—á–∏—é –∂–µ —É–±–æ –∑—Ä—£—Ç–∏ –∏ –ø—Ä–∏–∏–¥–æ—à–∞ –∫ —Å–≤—£—Ç—É –±–æ–≥—É, –∏ –ø–æ–ª–æ–∂–∏—Ç–∏ –≤ —Ü–µ—Ä–∫–æ–≤—å.  –∏ –æ—Ç—Ç–æ–ª–µ, –∞ –≤ —Ç–æ –∂–µ –≤—Ä–µ–º—è —Å—ä–∫—Ä–æ–≤–∏ –µ–≥–æ —Å–≤—£—Ç–∏—Å—è –æ—Ç –≤—Å—£—Ö—ä –æ–Ω—ã—Ö—ä, –∏ –≥–ª–∞–≥–æ–ª–∞—à–µ: ¬´–∏–∏—Å—É—Å–µ –Ω–∞—à—å,
. 


Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ò –ø–∞—á–µ —É–±–æ –∏–∑–∏—â—É, –∏ —Å—ä–∑–Ω–æ–≤–∞—é, ‚Äî –≥–ª–∞–≥–æ–ª—é—Ç—å. 
.  –ê —Ç—ã —É —Ç—è –≤ –∫–∏—Ç—Ü—£ –±—ã–ª—ä. –∏ –≤—Å–µ. –∞ —Ç–æ —É –Ω–∞—Å—ä —Ç–æ–ª—å–∫—ã –Ω–∏—á—å–Ω—ã—è –æ—Ç—Ç—É–¥—ã –∏ –¥–µ–ª–∏—Å—è, –∞ –º—ã —É —Ç–µ–±—£ —Ç–∞–∫—ä –∏ –∑–≤–∞–Ω—ä –±—ã–ª—ä, –Ω–µ —Ç–æ –Ω–µ –º–æ–∂–µ—à–∏, —á–µ–≥–æ –º–æ–∂–µ—à–∏ —Å–æ—Ç–≤–æ—Ä–∏—Ç–∏. –∏ –Ω–µ –º—ã
.  –°–≤—è—Ç—ã–π –∂–µ –∞–ø–æ—Å—Ç–æ–ª—ä –∂–µ –æ—Ç –∑–ª–∞—Ç–∞ –∏ –æ—Ç –∫—Ä–µ—Å—Ç–∏—Å–ª–∞–≤–æ–≤—ä —É–¥–µ –∏ÃÅ –æ—Ç—ä –∑–ª–∞—Ç–∞ –≤ –∑–µ–º–ª—é –∏ –æ—Ç —Å–≤—è—Ç–∞–≥–æ —Å–≤—£—Ç–∞ –∏ –æ—Ç —Å—Ä–µ–±—Ä–æ –∏ —Å–ª–∞–≤–Ω–æ, –∞ –æ—Ç —Å—Ä–µ–±—Ä–µ–Ω–∏–∫–∞ –∏ –æ—Ç –æ—Ç—Ä–æ—á–∞, –∏ –æ—Ç –æ—Ç—Ä–æ—á–∞, –∏ –æ—Ç—Ä–æ—á–∞ –æ—Ç—Ä–æ–∫–∞ –∏ –æ—Ç—Ä–æ–∫–∞
.  "—É–≥–æ—Ç–æ–≤–∏–ª–∞ –Ω—£–∫–æ–≥–æ –∫–Ω—è–∑—è —É–±–æ –∏ –≤—ä–∑–≤–µ—Å—Ç–∏ –≤—ä —Ö—Ä–∞–º—ä —Å –Ω–∏–º—ä –∏ —Å—è–¥—É—â–∞ —Å –Ω–∏–º—ä —Å –±—Ä–∞—Ç–æ–º—å", –ø–æ–Ω–µ–∂–µ –∏ –≤—ä—Å–ø–æ–º—è–Ω—É—Å—è –∏ –º–æ–ª—è—Å—è –µ–º—É: "–∫—ã –±—É–¥–∏ —Ç–∏ —Å –Ω–∏–º—ä? –∏ –ø–æ–∏–¥—£–º—ä –∫—ã –µ–º—É, –Ω–æ –µ–º—É


Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}





Saving model checkpoint to ./checkpoint-500
Configuration saved in ./checkpoint-500/config.json
Configuration saved in ./checkpoint-500/generation_config.json


.  –ù–æ, –∫–æ–≥–¥–∞ –∂–µ –æ—Ç —Ç–æ–≥–æ –±—ã–≤–∞—à–∞ –∏–º–∞—à–∏ –±–æ–∂–∏–∏–º—ä –ø–æ–∏—Ç–∏ –≤—ä –æ–±–∏—Ç–µ–ª—å –∏ —Å—ä–¥—£—Ç–∏ –±—ã—Å—Ç—å, –∏ –ø–∞–∫–∏ –±—ã—Å—Ç—å —Ç–∞–º—ä.–∏ –ø–æ –ø–æ–¥–æ–±–∞–Ω–∏–∏ –≤—ä—Å—Ö–æ—Ç—£ –Ω–∏—Ä—Å–∏—à–∏ –∏–º—ä. –∏ –ø–æ—Å—Ç–∞–≤–∏—à–∞ –∫ —Ç—£—Ö—ä –∂–µ –≤–æ –æ–±–∏—Ç–µ–ª–∏ –∏, –æ—Ç—Ç–æ–º
.  –ò –ø–æ–≤–µ–ª—£—à–µ –¥–∞–Ω–∏–ª–ª—É –Ω–∞ –±—Ä–∞–Ω—å –¥–∞–Ω–∏–ª–ª—É, –∏ —Å –Ω–∏–º—ä —Å–æ —Å–ª—É–∂–±–∏ —Å—Ä—£—Ç–æ—à–∞ –æ —Å–µ–±—£, —è–∫–æ –±–æ –≤ –¥–æ–º—£ —Å–≤–æ–µ–º—ä –æ–Ω—ä, –Ω—ä –æ—Ç–ª—£–∂–∏ –∂–µ –µ–º—É —Å—ä—Ç–≤–æ—Ä–∏—Ç–∏. –Ω–æ –∑–º–∏–ª–æ—Å—Ç–∏–≤—å –∫ –≤–µ–ª–∏–∫–æ–º—É –∫–Ω—è–∑—é –∏ –±–æ—è—Ä–µ —Å–≤–æ–µ–º—É –¥–∞
.  –°–∞–º—ä –∂–µ —Å–≤—è—Ç—ã–π, –ø–æ –µ–≤–∞–Ω–≥–µ–ª—å—Å–∫–æ–º—É –æ–±—Ä–∞–∑—É, –ø—Ä–∏—Å—Ç—É–ø–∏–≤—ä —Å –ø–∞—Å—Ç—ã—Ä—Å–∫–∏–º—ä —Ä—É–∫–æ–≤–æ–¥—Å—Ç–≤–æ–º—ä –∏ –æ—Ç –ø–∞—Å—Ç—ã—Ä—Å–∫–∏—Ö—ä –æ–±—è–∑–∞–Ω–Ω–æ—Å—Ç–µ–π—ä –∫ —Ç–æ–º—É, –∫–∞–∫–æ –ø–æ –º–Ω–æ–≥—ã—è –¥–æ–±—Ä–æ–¥–µ—Ç–µ–ª–∏ –±—ã—Å—Ç—å –µ–º—É –ø—Ä–∏–∏—Ç–∏ –∫ –µ–¥–∏–Ω–æ–º—É –æ—Ç –Ω–∏—Ö –æ–±—Ä–∞–∑—É, –Ω–µ —Ç–æ–∫–º–æ –∏—Å–ø–æ–≤–µ–¥

Model weights saved in ./checkpoint-500/pytorch_model.bin
Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ì–æ—Å–ø–æ–¥—å –±–æ —Å –Ω–∞–º–∏—ä –Ω–∞—á–∞—Ç—ä, –∏ –Ω–µ –≤–Ω–∏–¥–æ —Ç–∏. –∏ —Ç–∞–∫–æ —Ç—£ –∂–µ –ø—Ä–µ—Å—Ç–∞–≤–∏—Ç—Å—è —Å –Ω–∞–º–∏. –∏ –ø–∞–∫–∏ –ø—Ä–µ—Å—Ç–∞–≤–∏—Ç—Å—è –æ—Ç –º–µ—Ä—Ç–≤—ã—Ö. –∏ –≤—ä–∑–º–æ–∂–µ –±–æ–≥—ä –Ω–∞—Å—å –±–æ–≥—ä –Ω–∞ –≤—Å—è–∫—É –±–æ–ª–µ–∑–Ω—å, –∏ –≤—ä–∑–Ω–µ—Å–µ—Ç—å—Å—è —Å—ä –Ω–∞–º–∏. –Ω–µ –≤—ä–∑–º–æ–∂–µ—à–∏ –±–æ
.  –ù–æ –∞—â–µ –µ—Å—Ç—å –≤—ä —Ü–µ—Ä–∫–≤–∏ —Å–≤—è—Ç–∞–≥–æ –æ—Ç—Ü–∞ –Ω–∞—à–µ–≥–æ –∫–∏—Ä–∏–ª–∞ –∏ –≤–æ —Å–≤—è—Ç—ã—Ö –æ—Ç–µ—Ü—å —Å–∏—Ö, –ø—Ä–µ–ø–æ–¥–æ–±–Ω–µ, –∏, —è–∫–æ –±–æ–≥—ä, –∞–∫–∏ –∑–≤–µ—Ä—å –∏ —á–µ–ª–æ–≤—£–∫—ä, –∏ –≤—ä —Å–≤–æ–∏—Ö —Å–≤—è—Ç—ã—Ö—ä –∫–Ω–∏–≥–∞—Ö—ä –ø–∏—Å–∞–Ω–æ –±—ã—Å—Ç—å. –∞—â–µ –±—ã –∫—Ç–æ –∏ –Ω–∞ —Ç–æ–º—ä —Å–æ–±–æ—Ä–µ –≤–æ —Ü–µ—Ä–∫–≤–∏ –±—ã—Å—Ç—å, –Ω–∏ –≤–æ —Å–≤—è—Ç—ã—Ö—ä –æ—Ç—Ü–∞
.  –∞ –∞–∫–∏ –æ–ª—ä, —è–∫–æ –∏ —Ç–∏ –µ—Å—Ç—å –∏ –≤–æ –≥—Ä–∞–¥–µ. –∞—â–µ –±–æ –Ω–µ –≤—ä—Å—£–ª—£, –Ω–µ –≤—ä–∑–ª—é–±—è—â–µ. –∞—â–µ –±–æ, –Ω–æ –≤—£–¥–∞–π, –Ω–æ –≤—ä—Å—Ç–∞–≤—å—Å—è. –∞—â–µ –±–æ –µ—Å—Ç—å, –Ω–æ –≤—£—Ä–µ, –Ω–µ –±—ã–≤–∞–µ—à–∏. –∞—â–µ –±–æ, —Ç–æ
.  –í –¥–µ

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  "–Ω–µ –º–æ–∂–µ—Ç—ä –±–æ —Å—è –∑—Ä—£—Ç–∏, —è–∫–æ—ä —Ç–∞–∫–æ–∂–µ –∏ –≤ –¥–æ–º—£ —Å–≤–æ–µ–º—ä –ø—Ä–µ–±—ã–≤–∞—Ç–∏. –∏ –æ—Ç —Ç–æ–≥–æ, —á—Ç–æ –ø–æ –≤—Å–µ–π
.  –ò —Ç–æ–µ –∏ –¥—Ä—É–≥–æ–µ –Ω–µ –ø–æ–≤—£—Å—Ç—å –∏–Ω–µ—è, –∏–∂–µ –∏ –≤—ä –ª—£—Ç–æ –ø—Ä–∏–∏–¥–µ –≤—Å–∏, –¥–∞ –Ω–µ —Å—ä—Ç–≤–æ—Ä–∏. –∏, —Å–ª—ã—à–∞–≤, –∫–Ω—è–∑—å –≤–µ–ª–∏–∫–∏–π, –µ–≥–æ–∂–µ –∫–Ω—è–∑—å —Ç—ã—Å—è—Ü–∫–∏–π, —Å–æ –≤—Å—£–º–∏ —Å–≤–æ–∏–º–∏ —Ä–∞—Ç—å, –∏ –º–Ω–æ–∑–∏ —Å –Ω–∏–º–∏—ä, –∏ —Ä—£—Ö–æ–º—ä, –∏
.  –¢–æ–≥–¥–∞ –∂–µ, –ø–æ —Å–µ–º—É –ø–æ–≤—£–¥–∞—à–∞ —Å–∏—Ü–µ: –∏ –¥–∞—Å—Ç—å –∏–º—ä –±—£ –¥—£—Ç–∏, –∏–∂–µ —É—Ä–∞–∑—É–º—£–≤—à–µ, –æ—Ç–∏–¥–µ –∫ –Ω–∏–º—ä, –∏ –≤—ä–∑–≤—Ä–∞—Ç–∏—à–∞—Å—è –∫—ä –Ω–∏–º—ä. –∏–º—£—è –±–æ –∏—Ö—ä –Ω—£–∫–æ–ª–∏–∫–æ –¥—£—Ç–∏ –∏ –≤—ä–Ω–∏–¥—É—à–µ
.  –î–∞ –∏ –Ω–µ —Ç–æ–ª—å–∫–æ, –∞ –∏–Ω—ã—è –µ—Å—Ç—å –≤ —á—é–¥–µ—Å–µ. –∞ —Ç—ã, —è–∫–æ –±—ã—Ç–∏, –Ω–µ —É–≤–µ–¥–µ –µ—Å–º–æ, –Ω–æ —Å –ø—Ä–æ—á–∏–º–∏ —Å–≤—è—Ç—ã–º–∏ –ø–æ –≤—Å—è –¥–Ω–∏ –ø–æ —Å—Ä–µ–±—Ä—è–Ω—ã–º—ä –∏–º—£–Ω–∏–∞. –∞ –æ —Ö–≤–∞–ª–µ, –µ—Å–º–æ, ‚Äî –∫–∞–∫–æ–∂–µ —É–º—ã—Å–ª–∏—à–∏, –∏–ª

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ò –ø–æ–≤–µ–ª—£—à–∞ —É–±–æ —Ü–∞—Ä—é —Ü–∞—Ä—é: "–æ, —Ü–∞—Ä—å, –∫—Ä—£–ø–∫–∏–º–∏ –≤—£—Ä—ã, —è–∫–æ –∏ –º–Ω–æ–≥–∞ –ª–µ—Ç–∞ –≤—£—Ç—Ä–∞–º—ä, –∏ —è–∫–æ –º–Ω—£ –∞–∑—ä –º–Ω—è—à–µ –∏–º–∞—à–∏ –æ—Ç –≤–∞—Å –∏ –¥–æ —Å–∏—Ö—ä, –Ω–æ –æ—Ç —Å–∏—Ö—ä, –Ω–µ –∏–∑–≤–æ–ª—å—Ç–µ –æ—Ç –≤–∞—Å, –Ω–∏ –æ—Ç –∏–Ω—ã—Ö
.  –û –Ω–µ–º—ä–∂–µ –∏–º—£—Ç–∏ –∫—Ä—£–ø–∫–æ–≥–æ –≤—£—Å—Ç–Ω–∏–∫–∞ –∏ –ø–æ–±—£–¥–æ—à–∞ –µ–≥–æ –æ—Ç –Ω–µ–≥–æ. –∏ –Ω–µ –¥–∞—Å—Ç—å –µ–º—É –∫–æ—Ä–∏–Ω–∞ –∏–ª–∏ –º–Ω–∏—Ö—É. —Ç–æ—Ç –∂–µ –∫–æ—Ä–∏–Ω, –≤—£—Ä–∂–µ –µ–º—É –≤ —Å–µ–±—£, –Ω–∞—á–∞ –µ–º—É —Å–æ –≤—Å—è—Ü—£–π —Ä—É—Å–∫–æ–π –∑–µ–º–ª–∏ –∏ –∏ —Å —Ä—É—Å–∏ —Å–æ
.  –ü—å–µ—Ö –∏ —Ä—£—Ö–æ–≤—ä, –Ω—£–∫—ã –∂–µ –∑—£—è–Ω–∏–∏—Ö, –±—£—Ö—ä –Ω–µ–∏—Å—Ç–æ–≤—ä, –∏ –æ—Ç–Ω–∏–¥–æ—Ö—ä, —è–∫–æ –Ω—£–∫–æ–ª–∏–∫–æ –≤—Å–∏ –∑—£–∏. –¥–∞ –±—É–¥–µ—Ç—å –∏–º–∞–º—ä –±–æ–∏–≤–∞–∞ –∏ –≤–æ—Å—Ç–∞–≤—å. –≤–æ—Å–∫—Ä–µ—Å—å –∏ –ø—Ä–∏–¥–∏,
.  –ü—Ä–∏–ª–æ–∂–∏ –∂–µ –∫ —Ä—É—Ü—£ –∏ –Ω–µ –≤–æ–∑–º–æ–∂–µ –ª–∏ –Ω–µ –¥–∞—Ç–∏ –º–Ω—£ –º—£–¥–∞? –∏ –Ω–∏—á–∏—é–∂–µ –º–Ω—£ –µ—Å–º—ã –Ω–µ –∏–º–∞–º—ä, –Ω–∏ –º—£—Å—Ç–∞ –Ω–µ –±—ã—Ç–∏

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ê –≤ –º—£—Å—Ç–æ —Ç–æ –µ—Å—Ç—å –Ω–∞ —Ä—É—Ü—£ —Å—£–¥–ª–µ—Ö –∏ –Ω–∞ –≥–æ—Ä–∞—Ö, –∏ –∞–∫–∏ —Å—£–¥–ª–µ—Ö —Å—£–¥–ª–µ—Ö—ä. –Ω–æ –∞–ª–µ–∫—Å–∞–Ω–¥—Ä—ä, –≤–µ–ª–∏–∫–∏–π –∏ –ª—é–±–∏–º—ã–π, –æ—Ç –Ω–µ–≥–æ –∫–æ–∏–¥–∞ –∂–µ –ø—Ä–∏–∞—Ç—Ç–∏? –∞–ª–µ–∫—Å–∞–Ω–¥—Ä—ä –∂–µ —Å–∞–º—ä —Ä–µ—á–µ: ¬´—è
.  –¢–∞–∫–æ –∂–µ –∏ –Ω–∞ –º–∞–Ω–∞—Å—Ç—ã—Ä—å, –∏ –Ω–∞ –ø–∞–≤–ª–æ–≤—ä, –∏ –Ω–∞ –æ—Ç—å—Ü—£, –∏ –Ω–∞ –∑–º–∏—è, –∏ –Ω–∞ –¥—å—Ä—É–≥, –∏ –Ω–∞ —Ö—Ä–∏—Å—Ç–∞ —Ä–∞–¥–∏, –∏ –Ω–∞ –ø—Ä–µ—Å–≤—è—Ç—É—é —Ç—Ä–æ–∏—Ü—É. –ø–æ —Å–∏—Ö –∂–µ –≤–Ω–∏–¥–æ—Ö—ä, —è–∫–æ –∏ –Ω—£–∫—Ç–æ –±—ã—Å—Ç—å, –≥–ª–∞–≥
.  –ü—Ä–∏–∏–¥–æ—à–∞ –∂–µ –∫–Ω—è–∑–∏, –∑—Ä—ä–¥—ä –∏ –ø—Ä–∞—Å—Ç—å, –ø—Ä–∏–∏–¥–µ –≤ —Ä–∞–∏ –Ω–∞ —Å–µ–±—£, –∏ —Ä–µ–∫–æ—à–∞ –µ–º—É: ¬´–±—Ä–∞—Ç–µ –∏ –Ω—å, –∏ —Ç—ä –Ω–µ –æ—Å–ª—É–≥–∞–π—Ç–µ –µ–≤—ã. –∏ –∞–∑—ä –æ—Å–ª—É—à–∞—é—Å—è –∏ –Ω–µ –æ—Å–ª—É—à–∞—é—Å—è. –∏ –Ω–µ –æ—Å–ª—É
.  –ò –∫—Ä—£–ø–∫–æ —Ä–µ—á–µ –º–Ω–µ: "–Ω–µ –º–æ–∂–µ—à–∏, –æ—Ç—á–µ". –∏ –ø—Ä–∏—Å—Ç–∞–≤–∏ –º–∏ —Ä—É–∫—É, –∞ –æ–Ω—ä —Ä–µ–∫–æ—Ç–∏ —Ç–∞–∫–æ –∏ –Ω–µ –ø—Ä–∏–∏–º—É, –Ω–µ –∏–º–∞—Ç–∏. –∞–∑ –∂–µ —Ä–

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



. 
.  –û—Ç—Ç–æ–≥–æ –∂–µ —Å–µ–≥–æ, –∫–æ–≥–¥–∞ –∏ —è –≤—£–¥—É, –Ω–æ –∏ –ø–æ–Ω–µ–∂–µ –Ω—£—á—Ç–æ –æ—Ç –∏–Ω–∞ –¥—£–ª–µ—Å—è —Å –Ω–∏–º—ä —Å –Ω–∏–º—å –¥—£–ª—É—é—â–µ–º –∏ –º–Ω–æ–≥–∞ –∏–º–∞, –∞—â–µ –±—£–ª–æ, –Ω–æ –µ–≥–¥–∞ –±–æ –±—ã–≤—ä –Ω–∞ –∏–ø—£ –∏ —Ç—ä—á–∞—à–µ—Å—è,
.  –°–∏–π—ä, –≥–ª–∞–≥–æ–ª–µ—Ç—ä, —á—Ç–æ, –∏ –º—ã, –∏–º–∞–∏, –µ–≥–æ –Ω–µ —Ö–æ—Ç—è—â—é.
.  "–∏ –ø–∞–∫–∏ —Å–ø–æ–¥–æ–±—Å—è, –∏ –≤—£–¥–∞—à–µ, —è–∫–æ –º—£—Å—Ç–æ –µ—Å—Ç—å ‚Äî —Å–≤—è—Ç—ã–π –∫–∞–º–µ–Ω–∏. –Ω–µ –ø–æ—Å—Ç–æ–π –º–∏ –≤–æ –≤—Å–µ–º, –Ω–∏ –≤ —á–µ–º–∂–µ –≤—£—Ä–æ—é –∏ –Ω–µ—á–µ—Å—Ç–∏–∞–≥–æ, –Ω–∏ –≤ —á–µ–º–∂–µ, –Ω–æ –∏ –≤—£—Ä–æ–≤–∞ –∏ —Ä–∞–∑—É–º—£–≤–∞". –∏ —Ç–æ–≥–¥–∞ —Å–≤—è—Ç—ã–π –∞–ø–æ—Å—Ç–æ–ª—ä —Ä–µ—á–µ


Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ê–ª–µ–∫—Å–∞–Ω–¥—Ä—ä –∂–µ –Ω–µ –∏–Ω–∞–∫–æ –≥–ª–∞–≥–æ–ª–µ—Ç—å: "–º–æ–ª–∏—Å—è –æ –Ω–µ–π, –∞ –Ω–µ –º–æ–ª–∏—Ç—å –æ –Ω–µ–π". –∏ —Ä–µ—á–µ –≤–ª—£—Å–Ω–∏–∫—ä: "–Ω–æ —Å–µ —É–±–æ –ø—Ä–∏–∏–¥–µ—Ç—ä —Å—ä –Ω–∞–º–∏, –¥–∞ –ø–æ–∏–¥–µ, ‚Äî –∏ –ø—Ä–∏–∏–¥–µ, –∏ –æ—Ç –Ω–∞—Å—ä –æ—Ç –Ω–∞—Å—ä –æ—Ç–≤—£—â–µ—Ç—å".
.  –∞ —Å –Ω—£–º—Ü–µ–º –∏ —Å—ä —Å–ª–µ–∑–∞–º–∏, –∏ —Å–æ —Å–ª–µ–∑–∞–º–∏, –∏ —Å–æ —Å–ª–µ–∑–∞–º–∏, –∏ —Å–æ —Å–ª–µ–∑–∞–º–∏, –∏ —Å –º–æ–ª–∏—Ç–≤–∞–º–∏. –∞ —Å –Ω—£–º—Ü–µ–º –∏ —Å–ª–µ–∑–∞–º–∏, –∏ —Å–æ —Å–ª–µ–∑–∞–º–∏, –∏ —Å —Å–ª–µ–∑–∞–º–∏, –∏ —Å–æ —Å–ª–µ–∑–∞–º–∏, –∏ —Å —Å–ª–µ–∑–∞–º–∏, –∏ —Å–æ —Å–ª–µ–∑–∞–º–∏, –∏ —Å–æ —Å–ª–µ–∑–∞–º–∏, –∏ —Å–æ —Å–ª–µ–∑–∞–º–∏, –∏ —Å–æ —Å–ª–µ–∑–∞–º–∏,
. 
.  –ò —Ç–µ –∂–µ, –∏ —Ç–µ –∂–µ, –¥–∞ –∏ –ø–æ –¥–≤–∞-—Ç—Ä–∏ –≤ –≥–æ–¥ —Å –ø–æ–ª–æ–≤–µ—Ü–∫–æ–π –≤–æ–π–Ω—ã –≤–æ–µ–≤–æ–¥—ã –µ–≥–æ. –∏ –¥–æ —Å–µ–≥–æ –≤—Ä–µ–º–µ–Ω–∏ –≤–æ–µ–≤–æ–¥—ã –Ω–∞—à–∏—Ö –¥–∞ –Ω–∞ —Ç—Ä–∏ —Å—Ç–æ—Ä–æ–Ω—ã –≤ –æ—Å–∞–¥—É –µ–≥–æ –±—è—à–µ, –¥–∞ –ø–æ –¥–≤–∞-—Ç—Ä–∏ —Ä–∞–∑–∞ –ø–æ –¥–≤–∞–¥—Ü–∞—Ç—å. –∏ –æ—Ç —Å–µ–≥–æ –≤—Ä–µ–º–µ–Ω–∏ –

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ê —Ç–∞–∫–∂–µ –¥–æ –≤–µ—á–µ—Ä–∞, –ø–æ–Ω–µ–∂–µ –≤—ä–∑–≤–µ—â–∞—é, –∏ –≤ –Ω–µ–º—å –±—É–¥—É—Ç—å, –∞—â–µ –ª–∏ –≤—ä–º—å—á—å, —Ç–æ–≥–¥–∞ –∏–º—£–µ–º—ä –≤–Ω–∏–¥–æ—à–∞ –≤—ä –∫—ã–µ–≤—ä. –æ—Ç –Ω–∏—Ö—ä –∂–µ –∏ –¥–æ–∏–¥–µ –≤ —Ü–µ—Å–∞—Ä—å—Å–∫–∏–∞, –Ω–∞ —Ç–æ –∂–µ –≤—Ä–µ–º—è —É–±–æ –Ω–µ –ø—Ä–µ–∂–µ –≤—Å–∏
.  –∞—â–µ –µ—Å—Ç—å –≤ —á–µ–º –Ω–µ —Ç—£–º–æ, –∞—â–µ –∂–µ –µ—Å—Ç—å, –Ω–æ –µ—Å—Ç—å –≤ —á–µ–º, –∏ —Å–µ —Å—ä—Ç–≤–æ—Ä–∏—Ç–∏ –≤—ä–∑–±—Ä–∞—Ç–∏—à–∞, —è–∫–æ–∂–µ –∏ –¥–æ —Å–∏—Ö—ä. —Ç–æ—á–∏—é –∏ –≤—ä –≤—Å—£—Ö—ä –µ—Å–∏. –∞—â–µ –∂–µ –µ—Å—Ç—å, –∏–ª–∏ –Ω–µ –≤—ä—Å—Ç–∞ –µ—Å–∏; –≤—£–¥–∞–µ—à–∏ –ª–∏
.  –Ø–∂–µ –µ—Å—Ç—å –ø–æ –∑–µ–º–ª–∏, –∏ –≤ –Ω–µ–π –µ—Å—Ç—å –º—£—Å—Ç–æ, –∏ –º—£—Å—Ç–æ, –∏–∂–µ –µ–ª–ª–∏ –µ–≥–æ –æ—Ç—å—Ü—è, –∏ —Å—ä–º—å, —è–∫–æ–∂–µ –µ–ª–ª–∏, –≤ –Ω–µ–π–∂–µ, –±—£—Å–∞, –∏ –¥–∞–∂–¥—å –∏ –¥–æ –≥—Ä–æ–±–∞ –≤–Ω–∏–¥–∏. –∏ —Å–µ –µ—Å—Ç—å –º—£—Å—Ç–æ, –∏ –≤
.  –ò –Ω–∞ —Å–≤—£—Ç—£ –≤—£–º—ä –≤—£—Ä—£—Ö—ä –∏–º—£—è, —Ç–∞–∫–æ –∏–∂–µ, –∏–∂–µ –≤—ä –º—£—Å—Ç—É —Ö—Ä–∏—Å—Ç–æ—Å—ä, —è–∫–æ –Ω–µ –≤—ä—Ä–≤—É—Ç—ä —Ç—£–ª–æ, –Ω–µ –≤—ä–∑–≤—ã—Å—è—



Training completed. Do not forget to share your model on huggingface.co/models =)


Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –î–∞, —Ä–µ—á–µ –æ –Ω–∏—Ö, —è–∫–æ –º–Ω–æ–≥–∞ –∫ –Ω–∏–º—ä –ø—Ä–∏–∏—Ç–∏. —Å–µ –±–æ –∏–º—£–Ω–∏—è.  –∏ –ø—Ä–∏–∏–¥–æ—à–∞ –∫–æ –≥—Ä–∞–¥—É. –∏ –ø—Ä–∏—à–µ–¥—à–∞ –∫–æ –≥—Ä–∞–¥—É –∫—Ä—£–ø—Ü—ã, –∏ –≤–∑–∏–¥–µ –Ω–∞ –º—£—Å—Ç–æ –∏–º–∞—à–∞, –∏ –ø—Ä–∏–∏–¥–æ—à–∞ –∫ –≥—Ä–∞–¥—É; –∏ –ø–æ—Å—Ç–∞–≤–∏—à–∞ –≥–æ—Ä–æ–¥—ä –∏
.  –ò –≤ —Ç–æ–º—ä —á–∞—Å—£ –Ω–µ –±—ã—à–∞ –æ—Ç –º–∞–ª–∞, –Ω–∏ –≤–µ–ª–∏–∫–∞–≥–æ —á—é–¥–µ—Å–∞. –∏ –Ω–∞ —Ç–æ–º—ä —á–∞—Å—£ –Ω–µ –±—ã—Å—Ç—å. –∏ –Ω–∞ —Ç–æ–º—ä —á–∞—Å—£ –Ω–µ –±—ã—Å—Ç—å. 
. 
.  –∏ —Ç–∞–∫–æ –≤—ä–∑—Ä–∞—Å—Ç—É –≤—ä –±–ª–∞–∂–µ–Ω–Ω–æ–π,


Saving model checkpoint to .
Configuration saved in ./config.json
Configuration saved in ./generation_config.json
Model weights saved in ./pytorch_model.bin


In [6]:
# Print 4 samples (default n_samples) with max_length=200; only the first
# line of each sample is shown (default one_line=True).
# NOTE(review): the prefix literal looks mis-encoded in this export;
# presumably it is the Russian "самое главное это" — confirm against the
# original notebook.
print_generations(prefix="—Å–∞–º–æ–µ –≥–ª–∞–≤–Ω–æ–µ —ç—Ç–æ", max_len=200)

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



—Å–∞–º–æ–µ –≥–ª–∞–≤–Ω–æ–µ —ç—Ç–æ –≤—£—Ä–∏–µ,
—Å–∞–º–æ–µ –≥–ª–∞–≤–Ω–æ–µ —ç—Ç–æ –≤–æ—è, –∞ –∏–µ–∂–µ–∏ –≤–Ω–∏–¥—É—â–µ –≤ –Ω–µ–º—ä.
—Å–∞–º–æ–µ –≥–ª–∞–≤–Ω–æ–µ —ç—Ç–æ —Å–ª–æ–≤–æ¬ª. –∏–∂–µ –æ—Ç —Ç–æ–≥–æ –≤—Ä–µ–º–µ–Ω–∏ –∏–Ω–∞ –µ–¥–∏–Ω–∞–≥–æ, —è–∫–æ–∂–µ –æ—Ç –±–æ–≥–∞ –æ —Å–µ–º –µ—Å—Ç—å, –∏–∂–µ –∏ —Å–∞–º –±–æ–≥ –¥–∞ –Ω–µ –≤–æ–∑–Ω–µ–Ω–∞–≤–∏–¥—è—Ç, –¥–∞ –∏ –Ω–µ –≤–æ–∑–Ω–µ–Ω–∞–≤–∏–¥—è—Ç.
—Å–∞–º–æ–µ –≥–ª–∞–≤–Ω–æ–µ —ç—Ç–æ


In [7]:
# Print 4 samples (default n_samples) with max_length=200 for a second prompt.
# NOTE(review): the prefix literal looks mis-encoded in this export;
# presumably it is the Russian "зачем" — confirm against the original notebook.
print_generations(prefix="–∑–∞—á–µ–º", max_len=200)

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



–∑–∞—á–µ–º –∏ –∫—Ç–æ –∏ –∫–∞–∫? –Ω–µ –∏–∑–º—£—é—Ç—ä, –¥–∞ –∏ –∫–∞–∫—ä –±—É–¥–µ—Ç—ä, –Ω–µ –∑–Ω–∞—é—Ç, –∞ –∫—Ç–æ –∏ –∫–∞–∫—ä –±—É–¥–µ—Ç—ä, –∞ –∫—Ç–æ –∏ –∫–∞–∫—ä –±—É–¥–µ—Ç—ä, –∞ –∫—Ç–æ –∏ –∫–∞–∫—ä –±—É–¥—É—Ç—ä, —Ç–æ –Ω–µ –≤–µ–¥–∞—é—Ç—ä.
–∑–∞—á–µ–º—ä —Å—£—á–µ –µ–≥–æ –Ω–∞ –ø—É—Ç–∏, —Å—ã–π–∂–µ –≤—ä –∞–≥–∏–∞–Ω—£, –∏ –∏–∂–µ –ø–æ—Å—Ç–∞–≤–∏—à–∏ –Ω–∞ –ø—É—Ç–∏ –µ–≥–æ¬ª. –∏, –Ω–µ –≤—ä–∑–¥–µ—Ä–∂–∞–≤—à–∏, –ø–∞–∫–∏ –≤–Ω–∏–¥–æ—à–∞ –∏ —Å—£—á–µ —Å—£—á–µ –Ω–∞ –ø—É—Ç–∏ –µ–≥–æ, –∏ –∏–∂–µ –ø–æ—Å—Ç–∞–≤–∏ –µ–≥–æ –Ω–∞ –ø—É—Ç–∏ –µ–≥–æ, –∏ –ø–∞–∫–∏ –ø–æ–ª–æ–∂–∏—Ç–∏ –µ–≥–æ –Ω–∞ –ø—É—Ç–∏ –µ–≥–æ –∏ —Å–ø—è—Ç–∏ –µ–º—É –æ—Ç –Ω–µ–≥–æ, –∞–∫–∏ –≤—ä—Å–∫–æ–Ω—å –µ–≥–æ –ø–∏—Ç–∏—Å—è. –∏ —Ç–∞–∫–æ –ø—Ä–∏–∏–¥–µ –≤—£—Ç—Ä–µ–Ω—ä, –∏ –¥–æ—à–µ–¥ –¥–æ –∑–µ–º–ª–∏, –æ–≤–∏–∏ –∂–µ, –ø–∞—á–µ –≤—Å–µ—Ö—ä —Å–≤–æ–∏—Ö, –∏ —Ä–µ—á–µ: ¬´–≤—Ä–µ–º—è, –æ—Ç—å—Ü—é. —Ç–∞–∫–æ –∏ –≤—ã, –æ—Ç—á–µ, –Ω–∞ –∑–µ–º–ª–µ –∂–∏–≤—è, –∫–∞—è–π—Ç–µ—Å—å –∏ –º–æ–ª–∏–º —Ç—è. –¥–∞ –±—É–¥–µ—à–∏ –Ω—ã¬ª. –∏ –±—ã–≤—ä—à–∏ —Å—£—á—É, –ø—Ä–∏–∏–¥–æ—Ö –¥–æ –∑–µ–º–ª–∏, –∏ —Ä–µ—á–µ, ‚Ä

In [8]:
# Print 4 samples (default n_samples) with max_length=200 for a third prompt.
# NOTE(review): the prefix literal looks mis-encoded in this export;
# presumably it is the Russian "когда" — confirm against the original notebook.
print_generations(prefix="–∫–æ–≥–¥–∞", max_len=200)

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



–∫–æ–≥–¥–∞ –æ—Ç –Ω–µ–µ, –æ–∂–µ –≥–ª–∞–≥–æ–ª–∞—à–µ, –æ–∂–µ –≥–ª–∞–≥–æ–ª—£—Ç–∏: ¬´—Å—ä–¥—£—Ç–µ –Ω–∞ –Ω–µ–±–æ –∏ –ø–æ–≤—£–¥–∞–π—Ç–µ, —è–∫–æ –¥—£–ª–æ –∏ –≤–æ–ª—è –≤–∞—à–∞ —Å—É—Ç—å, –µ–≥–æ–∂–µ –±–æ –µ—Å—Ç—å –±–æ–≥—ä. –∏ –≤—ä–∑–±—Ä–∞–Ω–Ω–æ –∏ —Ö—Ä–∏—Å—Ç–æ–ª—é–±–µ–∑–Ω–æ–µ –µ–≥–æ –µ—Å—Ç—å –∏–∂–µ –µ—Å—Ç—å –µ—Å–º—ã, –æ–∂–µ –Ω–µ –≤—£—Ä—É –æ—Ç –Ω–∞—Å—ä —Ç–≤–æ—Ä—è—Ö—É, –Ω–∏ –µ–¥–∏–Ω–æ–º—É –¥—Ä—É–≥–æ–º—É –∂–µ —Å –≤–∞–º–∏ –Ω–µ –æ–±—Ä—£—Ç—É—è. –¥–∞ –∞—â–µ –±–æ –≤–∞–º—ä —á–µ–≥–æ –∏–º–∞—Ç—å –Ω–∞ –Ω–µ–±–æ –∏ –ø–æ–≤—£–¥–∞—Ç–∏, –Ω–µ —Ö—Ç–æ –ª–∏ –º–∏ –≤—£–¥–∞—é –≤–∞–º—å –∏ –µ—Å–º—ã, –∞—â–µ –±–æ –≤–∞–º—ä –æ —Ç–æ–º—ä –µ—Å–º—ã, –∏ –Ω–µ —Ö—Ç–æ –ª–∏ –º–∏ –≤—£–∂–¥—É?¬ª.
–∫–æ–≥–¥–∞ –æ–Ω—ä –∂–µ —Å—è–¥—è –∏ —Ä–µ—á–µ –∫ –Ω–µ–π: ¬´–≤–∏–¥—£, –±—Ä–∞—Ç–µ, —á—Ç–æ –Ω—£—Å—Ç—å –ø–æ—£–¥–∞ –≤ —Ç–æ–π –≥—Ä–∞–¥—£ –∏ –Ω—£ —á—Ç–æ –µ—Å—Ç—å –≤—ä –Ω–µ–º—ä? –∏–ª–∏ –Ω—£–∫–æ–≥–¥–∞? –∏ –µ—Å—Ç—å –ª–∏ —É —Ç–µ–±—è –≤—£—Å—Ç—ã, –∞ —É –Ω–∞—Å—ä —Å—ä —Ç–æ–±–æ—é –≤—£—Å—Ç–Ω–∏–∫–∏ –∏ –¥—£–ª–∞ –¥—£—è—Ç–∏ –∏ –¥—£–ª–∞—Ç–∏, –∏ –¥—£–ª–∞—Ç–∏ –µ—Å—Ç—å –ø—Ä

# Собрание сочинений Достоевского

In [9]:
# Start again from the pretrained checkpoint; this rebinds the module-level
# `model` / `tokenizer` that print_generations() reads, replacing the model
# fine-tuned in the previous section.
model, tokenizer = get_ru_model()
# Freeze the embeddings, the dropout module and the first 8 transformer blocks.
freeze_layers(model, 8)
# Fine-tune on the corpus at DOST_PATH with the automatic epoch count.
finetune(model, tokenizer, DOST_PATH)

loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--sberbank-ai--rugpt3small_based_on_gpt2/snapshots/f2f7c585b05a16726efe8974586e10b4d5939082/config.json
Model config GPT2Config {
  "_name_or_path": "sberbank-ai/rugpt3small_based_on_gpt2",
  "activation_function": "gelu_new",
  "architectures": [
    "GPT2LMHeadModel"
  ],
  "attn_pdrop": 0.1,
  "bos_token_id": 50256,
  "embd_pdrop": 0.1,
  "eos_token_id": 50256,
  "gradient_checkpointing": false,
  "initializer_range": 0.02,
  "layer_norm_epsilon": 1e-05,
  "model_type": "gpt2",
  "n_ctx": 2048,
  "n_embd": 768,
  "n_head": 12,
  "n_inner": null,
  "n_layer": 12,
  "n_positions": 2048,
  "reorder_and_upcast_attn": false,
  "resid_pdrop": 0.1,
  "scale_attn_by_inverse_layer_idx": false,
  "scale_attn_weights": true,
  "summary_activation": null,
  "summary_first_dropout": 0.1,
  "summary_proj_to_labels": true,
  "summary_type": "cls_index",
  "summary_use_proj": true,
  "transformers_version": "4.2

SETTING N_EPOCHS TO  0.34442475176791504


Loading features from cached file /content/gdrive/MyDrive/datasets/cached_lm_GPT2TokenizerFast_256_dost.txt [took 0.940 s]
PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
***** Running training *****
  Num examples = 14590
  Num Epochs = 1
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 629
  Number of trainable parameters = 28353024


Step,Training Loss
50,3.6617
100,3.6379
150,3.6345
200,3.5787
250,3.5895
300,3.5795
350,3.5626
400,3.5493
450,3.5422
500,3.5709


Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –û–Ω, –ø–æ –∫—Ä–∞–π–Ω–µ–π –º–µ—Ä–µ, –ø–æ–Ω—è–ª, —á—Ç–æ —Å –Ω–∏–º –¥–µ–ª–∞—é—Ç. ‚Äì –û–Ω —É–∂–µ —Ö–æ—Ç–µ–ª –±—ã–ª–æ —Å–∫–∞–∑–∞—Ç—å, —á—Ç–æ —Å —ç—Ç–æ–π –∂–µ–Ω—â–∏–Ω—ã ‚Äì —Ö–æ—Ç—å —ç—Ç–æ –∏ –±—ã–ª–æ –¥–ª—è –Ω–µ–≥–æ –≤—Å–µ –∂–µ‚Ä¶ —Ç–æ –µ—Å—Ç—å, –≤–∏–¥–∏–º–æ, –ø–æ—Ç–æ–º—É —á—Ç–æ –æ–Ω–∞ –±—ã–ª–∞ –ø–æ—á—Ç–∏ —á—Ç–æ –∏ —Ç–∞–∫ –Ω–µ —Ç–∞–∫–æ–π, –∫–∞–∫ –±—ã–ª–∞. 
.  –í –µ–≥–æ –≥–ª–∞–∑–∞—Ö —á–∏—Ç–∞–ª–æ—Å—å –º–Ω–æ–≥–æ, –≤ —Ç–æ–º —á–∏—Å–ª–µ –∏ —Å–æ–∂–∞–ª–µ–Ω–∏–µ, –æ —Ç–æ–º, —á—Ç–æ –¥–∞–∂–µ –Ω–µ—Å–º–æ—Ç—Ä—è –Ω–∞ —ç—Ç–æ, –Ω–µ –º–æ–≥ –æ–Ω –∏ –º–µ—á—Ç–∞—Ç—å –±—ã—Ç—å —Ä—è–¥–æ–º —Å –Ω–∏–º.  –û–Ω–∏ –æ–±–∞ –±—ã–ª–∏ –≤ —ç—Ç–æ–º –µ–¥–∏–Ω–µ–Ω–∏–∏, –Ω–æ –∫–∞–∫ —á–∞—Å—Ç–æ –æ–Ω –≤ –ø–æ—Å–ª–µ–¥–Ω–∏–π —Ä–∞–∑ –æ–±–æ—Ä–∞—á–∏–≤–∞–ª—Å—è!  –î–∞–∂–µ –≤ –≥–ª–∞–∑–∞—Ö –µ–≥–æ –∏ –µ–≥–æ —Å–µ—Å—Ç—Ä—ã –Ω–µ –±—ã–ª–æ —Å–æ–∂–∞–ª–µ–Ω–∏—è –∏–ª–∏ —Å–æ–∂–∞–ª–µ–Ω–∏–π. 
.  –ö–æ–≥–¥–∞ –∂–µ –¥–æ—Ç–∞—â–∏–ª–∞ –µ–≥–æ –¥–æ –∫—Ä–æ–≤–∞—Ç–∏, –æ–Ω —Å –Ω–µ–≥–æ–¥–æ–≤–∞–Ω–∏–µ–º, –∏ –¥–∞–∂–µ —Å–æ —Å—Ç—Ä–∞—Ö–æ–º –æ—Ç—à–∞—Ç–Ω—É–ª—Å—è –æ—Ç –Ω–µ–µ, –

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –í —ç—Ç–æ—Ç –ø–µ—Ä–∏–æ–¥ –µ—â–µ –≤ XVIII –≤–µ–∫–µ –±—ã–ª–∞ –≤ –º–æ–¥–µ –º–∞—Å–∫–∞—Ä–∞–¥.  –ù–æ –µ–µ –∑–∞–º–µ–Ω–∏–ª–∏ —à–ª—è–ø–∞ –∏ –ø–ª–∞—Ç—å–µ —Å –ø—ã—à–Ω–æ–π, –ø—ã—à–Ω–æ–π –≥–æ–ª–æ–≤–æ–π –∏ –¥–ª–∏–Ω–Ω—ã–º–∏ –Ω–æ–≥–∞–º–∏.  –° –ø–æ–º–æ—â—å—é –º–∞—Å–∫–∞—Ä–∞–¥–Ω—ã—Ö –º–∞—Å–æ–∫ –±—ã–ª–∏ –ø—Ä–µ–æ–±—Ä–∞–∑–æ–≤–∞–Ω—ã –¥–∞–∂–µ —Å–∞–º—ã–µ –∑–Ω–∞–º–µ–Ω–∏—Ç—ã–µ –≤ –∏—Å—Ç–æ—Ä–∏–∏ –§—Ä–∞–Ω—Ü–∏–∏ –º–∞—Å–∫–∞—Ä–∞–¥—ã. 
.  –ò –µ—Å–ª–∏ –±—ã –≤—ã —Å —Ç–∞–∫–∏–º —É–¥–æ–≤–æ–ª—å—Å—Ç–≤–∏–µ–º –∏ –∫–∞–∫ —Å–ª–µ–¥—É–µ—Ç –∏, –æ—Å–æ–±–µ–Ω–Ω–æ, —Å —É–¥–æ–≤–æ–ª—å—Å—Ç–≤–∏–µ–º, –ø—Ä–∏–Ω—è–ª–∏—Å—å –∑–∞ —Å–≤–æ–µ –¥–µ–ª–æ, —Ç–æ –≤–ø–æ–ª–Ω–µ –º–æ–≥–ª–∏ –±—ã –∏ –ø–æ—Ç–µ—Ä–ø–µ—Ç—å –≤ —ç—Ç–æ–º –æ—Ç–Ω–æ—à–µ–Ω–∏–∏ –Ω–µ—É–¥–∞—á—É. 
. 
.  –í —Ç–∞–∫–æ–º —Å–ª—É—á–∞–µ –≤ —Å—É–¥ –ø—Ä–∏—Ö–æ–¥–∏—Ç –µ—â–µ –Ω–µ—Å–∫–æ–ª—å–∫–æ —Ç—ã—Å—è—á –≥—Ä–∞–∂–¥–∞–Ω –†–æ—Å—Å–∏–∏, –Ω–æ –æ–Ω–∏ –Ω–µ –º–æ–≥—É—Ç —Ä–µ—à–∏—Ç—å, –∫—Ç–æ –∑–∞–¥–∞–µ—Ç –≤–æ–ø—Ä–æ—Å: —Ç–∞–∫ –ª–∏ –≤—Å–µ —ç—Ç–æ –±—ã–ª–æ –≤ –¥–µ–π—Å—Ç–≤–∏—Ç–µ–ª—å–Ω–æ—Å—Ç–∏, –∏ –∫–∞–∫ –æ–Ω–∏ –ø–æ—Å—Ç

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –û–Ω –≥–æ–≤–æ—Ä–∏–ª, —á—Ç–æ —ç—Ç–æ –¥–ª—è –Ω–µ–≥–æ –∏ –µ—Å—Ç—å —Å–∞–º–æ–µ –ª—É—á—à–µ–µ: –≤—Å–µ –µ–≥–æ –ª—é–±—è—Ç, –∞ —Å–∞–º –æ–Ω –æ—á–µ–Ω—å —Å—á–∞—Å—Ç–ª–∏–≤ –∏ –≤—Å–µ –µ–º—É –ø—Ä–æ—â–∞—é—Ç. ‚Äî –í—ã –º–Ω–µ –æ –≤—Å–µ—Ö –æ–±–æ –≤—Å–µ–º –≥–æ–≤–æ—Ä–∏–ª–∏? ‚Äî —Å–ø—Ä–æ—Å–∏–ª —è –≤ –ø–µ—Ä–≤—ã–π —Ä–∞–∑. 
.  –í—Å–µ —Ç—Ä–∏ –Ω–µ–¥–µ–ª–∏ —è —Ç–∞–∫ –∂–µ, –∫–∞–∫ –∏ –ø—Ä–µ–∂–¥–µ, —Ö–æ–¥–∏–ª–∞ —Ç—É–¥–∞.  –ö–∞–∂–¥—ã–π –¥–µ–Ω—å –≤ —à–∫–æ–ª–µ —è –±—ã–ª–∞ —Ç–∞–∫ –∂–µ –∫–∞–∫ –∏ –≤—Å–µ–≥–¥–∞, —Å –∫–∞–∫–∏–º-—Ç–æ –ª–∏—Ö–æ—Ä–∞–¥–æ—á–Ω—ã–º –ª—é–±–æ–ø—ã—Ç—Å—Ç–≤–æ–º.  –ò –µ—Å–ª–∏ –º–µ–Ω—è –æ—Å–æ–±–µ–Ω–Ω–æ –∏–Ω—Ç–µ—Ä–µ—Å–æ–≤–∞–ª —É—á–∏—Ç–µ–ª—å, —Ç–æ, –º–æ–∂–µ—Ç –±—ã—Ç—å, –µ—â–µ –∏ –ø–æ—Ç–æ–º—É, —á—Ç–æ —è —É–∂–µ –∫ —Ç–æ–º—É –ø—Ä–∏–≤—ã–∫–ª–∞.  –Ø —Ç–∞–∫ –∂–µ —á–∞—Å—Ç–æ, –∫–∞–∫ –∏
.  –ü—Ä–∏ —ç—Ç–æ–º –í—ã –º–æ–∂–µ—Ç–µ –Ω–∞–ø–∏—Å–∞—Ç—å –º–Ω–µ, –æ –∫–∞–∫–æ–º –ø–∏—Å—å–º–µ –≤—ã –ø—Ä–æ—Å–∏–ª–∏ –±—ã –Ω–∞–ø–∏—Å–∞—Ç—å.  –î–ª—è –ø–∏—Å–µ–º –æ —Ç–æ–º, —á—Ç–æ –í—ã —Ö–æ—Ç–∏—Ç–µ –æ—Ç –º–µ–Ω—è, –ø–∏—à–∏—Ç–µ –º–Ω–µ.  –Ø —Å–∞–º–∞ 

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ï—Å–ª–∏ –≤–¥—Ä—É–≥ –æ–Ω–∞ —Å–ø—Ä–æ—Å–∏—Ç, –µ—Å–ª–∏ –≤–¥—Ä—É–≥ –±—É–¥–µ—Ç –≤ —á–µ–º —É–ø—Ä–µ–∫–Ω—É—Ç—å, —Ç–æ —ç—Ç–æ –≤ —Å–∞–º—É—é –º–∏–Ω—É—Ç—É.  –¢–∞–∫ —á—Ç–æ –≤—ã –¥–∞–∂–µ –Ω–µ –º–æ–∂–µ—Ç–µ —Å–µ–±–µ –ø—Ä–µ–¥—Å—Ç–∞–≤–∏—Ç—å, –∫–∞–∫ –æ–Ω–∞ –º–æ–≥–ª–∞ –ø—Ä–∏–π—Ç–∏ —Å—é–¥–∞ –∏ —Å –≤–∞–º–∏ —Ä–∞–∑–≥–æ–≤–∞—Ä–∏–≤–∞—Ç—å, –¥–∞–∂–µ –Ω–µ –≤–∏–¥—è –º–µ–Ω—è.  –î–∞–∂–µ –ø—Ä–∏ –ø–µ—Ä–≤–æ–º –∂–µ —É–ø–æ–º–∏–Ω–∞–Ω–∏–∏ –∏–º–µ–Ω–∏, –≤—ã –±—ã –∑–∞–º–µ—Ç–∏–ª–∏, —á—Ç–æ –æ–Ω–∞ –Ω–∞—á–∞–ª–∞ –≥–æ–≤–æ—Ä–∏—Ç—å.  –≠—Ç–æ –æ–Ω–∞ —Å–∞–º–∞ –∏
.  –í—Å–µ –≤—ã –∑–Ω–∞–µ—Ç–µ –æ–± —ç—Ç–æ–π —Ç—Ä–∞–≥–µ–¥–∏–∏, —è —Ç–∞–∫–∂–µ –±—ã–ª —Å–≤–∏–¥–µ—Ç–µ–ª–µ–º. –ù–æ –≤—Å–µ —Ä–∞–≤–Ω–æ —è —á—É–≤—Å—Ç–≤–æ–≤–∞–ª, —á—Ç–æ –≤—ã –≥–æ–≤–æ—Ä–∏—Ç–µ –æ–±–æ –º–Ω–µ. –í—Å–µ —ç—Ç–æ –æ—á–µ–Ω—å –ø–æ—Ö–æ–∂–µ –Ω–∞ –ø—Ä–∞–≤–¥—É. –í—ã —Å–∫–∞–∑–∞–ª–∏, —á—Ç–æ –≤—Å–µ –≤—ã –≤–∏–¥–µ–ª–∏ –º–µ–Ω—è, –Ω–æ —è –Ω–µ –ø–æ–º–Ω—é, –∫—Ç–æ, –∫–∞–∂–µ—Ç—Å—è, –≤–∏–¥–µ–ª –≤–∞—Å. –í—ã –≥–æ–≤–æ—Ä–∏–ª–∏, —á—Ç–æ –≤–∏–¥–µ–ª–∏ –º–µ–Ω—è. –ï—Å–ª–∏ –∂–µ –≤—ã –Ω–µ –∑–Ω–∞–ª–∏, –∑–∞—á–µ–º

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ò–∑ –≤—Å–µ–≥–æ —Å–∫–∞–∑–∞–Ω–Ω–æ–≥–æ –º–Ω–æ—é —Å–ª–µ–¥—É–µ—Ç, —á—Ç–æ –≤ —Ç–∞–∫–æ–º —Å–ª—É—á–∞–µ —è –±—É–¥—É –≥–æ–≤–æ—Ä–∏—Ç—å –Ω–µ –æ–± –æ–¥–Ω–æ–º –ª–∏—Ü–µ –∏ –Ω–µ –æ —Ä–æ–¥–µ –≤ —Ü–µ–ª–æ–º, –∞ –∫–∞–∫ –æ —Å–æ–≤–æ–∫—É–ø–Ω–æ—Å—Ç–∏ –ª–∏—Ü, –∫–æ—Ç–æ—Ä—ã–º –¥–æ–ª–∂–Ω–æ –±—ã—Ç—å –ø–æ—Ä—É—á–µ–Ω–æ –º–æ–µ –ø–æ—Ä—É—á–µ–Ω–∏–µ –æ —Å–æ—Å—Ç–∞–≤–ª–µ–Ω–∏–∏ –∏ –æ—Ç–ø—Ä–∞–≤–ª–µ–Ω–∏–∏ –≤ —Ç—é—Ä—å–º—É —á–µ–ª–æ–≤–µ–∫–∞, –Ω–∞–∑–Ω–∞—á–µ–Ω–Ω–æ–≥–æ –≤ –º–æ–µ–º –≤–µ–¥–æ–º—Å—Ç–≤–µ, –ø–æ —Å–º–µ—Ä—Ç–∏ –∫–æ—Ç–æ—Ä–æ–≥–æ –±—ã–ª–∞ –ø—Ä–æ–∏–∑–≤–µ–¥–µ–Ω–∞ —É–∂–∞—Å–Ω–∞—è –∫–∞–∑–Ω—å –≤ –æ—Ç–Ω–æ—à–µ–Ω–∏–∏ —Ç–æ–≥–æ, –∫–æ—Ç–æ—Ä—ã–π, –Ω–µ—Å–æ–º–Ω–µ–Ω–Ω–æ,
.  –í–æ –≤—Å—è–∫–æ–º —Å–ª—É—á–∞–µ, —è –ø–æ–º–Ω—é, –∫–∞–∫ –∏–º–µ–Ω–Ω–æ –æ–Ω –º–Ω–µ –≤—Ä—É—á–∏–ª –µ–º—É —ç—Ç–æ –ø–∏—Å—å–º–æ.  –û–Ω –±—ã–ª —Ç–∞–∫ –≤–∑–≤–æ–ª–Ω–æ–≤–∞–Ω, —á—Ç–æ —É–∂–µ –∏ –Ω–µ –ø–æ–º–Ω—é —Ç–æ—á–Ω–æ, –∫—Ç–æ –æ–Ω,¬†‚Äì —è –ø–æ–º–Ω—é, –æ–Ω, –Ω–µ –ø–æ–º–Ω—é, —á—Ç–æ –µ–≥–æ –ª–∏—Ü–æ, –µ–≥–æ –ª–∏—Ü–æ –±—ã–ª–æ —É–¥–∏–≤–∏—Ç–µ–ª—å–Ω–æ –Ω–µ–ø–æ–¥–≤–∏–∂–Ω–æ–µ –∏ –∫–∞–∫–æ–µ-

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –Ø –¥—É–º–∞—é, –≤—Å–µ —ç—Ç–∏ –ª—é–¥–∏ –Ω–µ –Ω–∞ –æ–¥–Ω–æ –¥–µ–ª–æ —É—á–∏–ª–∏—Å—å, –Ω–∞ –æ–¥–Ω–∏ –∏ —Ç–µ –∂–µ –∑–∞–¥–∞—á–∏.  –ü–æ –∫—Ä–∞–π–Ω–µ–π –º–µ—Ä–µ, –≤ –º–æ–µ–π —Å–µ–º—å–µ.  –ò, –Ω–µ—Å–º–æ—Ç—Ä—è –Ω–∞ —Ç–æ, —á—Ç–æ –º–Ω–æ–≥–∏–µ –∏–∑ –Ω–∞—Å –Ω–µ –º–æ–≥—É—Ç –∂–∏—Ç—å, –∫–∞–∫ —è, –æ–Ω–∏ —Å —ç—Ç–∏–º, —è –¥—É–º–∞—é, –∂–∏–≤—É—Ç.  –í–µ–¥—å –≤ –Ω–∞—à–µ –≤—Ä–µ–º—è, –Ω–µ –∑–Ω–∞—é –ø–æ—á–µ–º—É, –≤—Å–µ —Ç–∞–∫ –ø–æ
.  –í —ç—Ç–æ–π –∂–µ —Å–∏—Ç—É–∞—Ü–∏–∏, –Ω–æ –ø—Ä–∏ –µ—â–µ –±–æ–ª—å—à–µ–π —Å–∏–ª–µ –∏ –ø—Ä–∏ –±–æ–ª–µ–µ —Ä–µ–∑–∫–æ–º –¥–≤–∏–∂–µ–Ω–∏–∏, –Ω–æ —É–∂–µ –∏ –±–æ–ª–µ–µ –±—ã—Å—Ç—Ä–æ–º –∏ –±–æ–ª–µ–µ –º–µ–¥–ª–µ–Ω–Ω–æ–º –ø—Ä–æ–¥–≤–∏–∂–µ–Ω–∏–∏, –Ω–æ –≤ –±–æ–ª–µ–µ —Ä–µ–∑–∫–æ–º –ø–∞–¥–µ–Ω–∏–∏, —Ç–∞–∫ —á—Ç–æ –≤ —ç—Ç–∏—Ö —Å–ª—É—á–∞—è—Ö –æ–Ω–∞, –≤ —Å–≤–æ—é –æ—á–µ—Ä–µ–¥—å, —Å–∞–º–∞ –≤ —Å–≤–æ—é –æ—á–µ—Ä–µ–¥—å, –Ω–µ —É–¥–µ—Ä–∂–∏—Ç—Å—è –∏ –æ—Å—Ç–∞–Ω–æ–≤–∏—Ç—Å—è, –∏ —Ç–æ–≥–¥–∞ —É–∂–µ, –¥–∞–∂–µ –∏ –Ω–µ —Ä–∞–∑–æ–±—Ä–∞–≤—à–∏—Å—å
.  –û–Ω –±—ã–ª –≤ —ç—Ç–æ –≤—Ä–µ–º—è –æ–¥–∏–Ω –∏ –¥–∞–∂–µ –±–µ–∑ –æ—Ç—Ü–∞.  –ù–æ, 

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ò –µ—Å–ª–∏ –≤ —Ç–æ–º, —á—Ç–æ —è –Ω–µ –º–æ–≥—É –Ω–∞–∑–≤–∞—Ç—å –µ—â–µ –æ–¥–Ω–∏–º —Å–ª–æ–≤–æ–º, –º–æ–∂–µ—Ç –ø–æ–∫–∞–∑–∞—Ç—å—Å—è —Å—Ç—Ä–∞–Ω–Ω—ã–º –∏ –Ω–µ–ø—Ä–∞–≤–∏–ª—å–Ω—ã–º, —Ç–æ –≤ —ç—Ç–æ–º –æ—Ç–Ω–æ—à–µ–Ω–∏–∏ —è, –∫–∞–∫ —É–∂–µ –≥–æ–≤–æ—Ä–∏–ª–æ—Å—å, –µ—â–µ –±–æ–ª–µ–µ —á–µ–º –º–æ–≥—É –±—ã—Ç—å –¥–æ–≤–æ–ª—å–Ω–æ –¥–æ–≤–æ–ª–µ–Ω.‚Äì –°—É–¥–∞—Ä—å, –º–æ–∂–µ—Ç –±—ã—Ç—å, —ç—Ç–æ –∫–∞–∫–æ–µ-—Ç–æ –ø—Ä–µ—É–≤–µ–ª–∏—á–µ–Ω–∏–µ, –∏, –º–æ–∂–µ—Ç –±—ã—Ç—å, –Ω–µ —Ç–æ–ª—å–∫–æ –ø—Ä–µ—É–≤–µ–ª–∏—á–µ–Ω–∏–µ, –Ω–æ –∏ –∫–∞–∫–æ–µ-—Ç–æ
.  –û!  –¢–µ–ø–µ—Ä—å —è –ø–æ–Ω–∏–º–∞—é, –∑–∞—á–µ–º –º–Ω–µ –Ω—É–∂–µ–Ω —ç—Ç–æ—Ç –≤–µ—Å—å —ç—Ç–æ—Ç –¥–æ–º —Å –µ–≥–æ –Ω–∞–¥–º–µ–Ω–Ω—ã–º–∏ –∏ –Ω–∞—Å–º–µ—à–ª–∏–≤—ã–º–∏ –ª–∏—Ü–∞–º–∏, –∫–æ—Ç–æ—Ä—ã–µ, –≤–ø—Ä–æ—á–µ–º, –Ω–∞ —Ä–µ–¥–∫–æ—Å—Ç—å –∏ —á–∞—Å—Ç–æ —Ä–∞–∑–¥—Ä–∞–∂–∞—é—Ç –¥—Ä—É–≥–∏—Ö –ª—é–¥–µ–π, —Ç–∞–∫? 
.  –ò, –Ω–∞–∫–æ–Ω–µ—Ü, –æ–Ω –±—ã–ª –≤ —ç—Ç–æ –≤ —Ç–æ –∂–µ –≤—Ä–µ–º—è —É–∂–∞—Å–Ω–æ –¥–æ–≤–æ–ª–µ–Ω —Å–æ–±–æ–π, –±—ã–ª –∫–∞–∫ –±—É–¥—Ç–æ –≤ –∫–∞–∫–æ–º-—Ç–æ —Å–æ—Å—Ç–æ—è–Ω–∏–∏. 
.  –û–Ω–∏ –≤—Å–µ

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ó–¥–µ—Å—å —è —Ç–æ–ª—å–∫–æ —á—Ç–æ –ø—Ä–æ—á–ª–∞, —á—Ç–æ –æ–Ω –∑–∞ –ø—Ç–∏—Ü–∞: 
.  –ö–∞–∫ —Ç–æ–ª—å–∫–æ —Å –Ω–µ—é –ø–æ–∑–Ω–∞–∫–æ–º–∏–ª—Å—è, –∞ —è –Ω–µ –∑–Ω–∞—é, –Ω–∞ —á—Ç–æ –≥–æ–¥–∏—Ç–µ—Å—å, —Ç–∞–∫ –∏ –Ω–µ —Ä–µ—à–∏–ª–∞—Å—å –µ–µ –ø—Ä–∏–Ω—è—Ç—å; —Ç–∞–∫ –∏ —Å–∫–∞–∑–∞–ª–∞ –µ–π: "–Ø –≤–∞—Å —Ç–æ–ª—å–∫–æ –∫ –æ–¥–Ω–æ–º—É –ø—Ä–∏–≥–ª–∞—à—É, –∞ –≤—ã –º–µ–Ω—è –Ω–µ –ø—Ä–∏–º–µ—Ç–µ".  –û–Ω–∞ —Å–æ–≥–ª–∞—Å–∏–ª–∞—Å—å; —è —Å –Ω–µ–π –Ω–µ —Å–æ–≥–ª–∞—à–∞–ª–∞—Å—å.  –í–æ—Ç —è –∏ –≥–æ–≤–æ—Ä—é: "–Ø –≤–∞—Å –æ–¥–Ω–æ–≥–æ –∏–∑ –≤–∞—Å –ø—Ä–∏–≥–ª–∞
.  –° —ç—Ç–æ–π —Ç–æ—á–∫–∏ –∑—Ä–µ–Ω–∏—è –º–æ–∂–Ω–æ –ø—Ä–µ–¥–ø–æ–ª–æ–∂–∏—Ç—å, —á—Ç–æ –∏ –¥–ª—è "–≤–µ–ª–∏–∫–æ–≥–æ –∫–Ω—è–∑—è" –±—ã–ª–æ –±–æ–ª–µ–µ –≤—ã–≥–æ–¥–Ω–æ –∫–∞–∫ —Ä–∞–∑ —Ç–æ, —á—Ç–æ –µ–º—É –≤ —ç—Ç–æ—Ç –¥–µ–Ω—å –ø—Ä–µ–¥—Å—Ç–æ—è–ª–æ —è–≤–∏—Ç—å—Å—è –∏–º–µ–Ω–Ω–æ –Ω–∞ –±–æ–≥–æ–º–æ–ª—å–µ.  "–ù–∞ –±–æ–≥–æ–º–æ–ª—å–µ –∂–µ,¬†‚Äì –¥–æ–±–∞–≤–∏–ª –æ–Ω,¬†‚Äì —è –±—ã–ª –±—ã —Ä–∞–¥". –¢—É—Ç –∂–µ –ø—Ä–∏–±–∞–≤–∏–ª:
.  –ï—Å–ª–∏ —É–∂ –≤—ã –ª—é–±–∏—Ç–µ, —Ç–æ –≤–∞–º –ø–æ—Ä–∞ –∑–Ω–∞—Ç—å, —á—Ç

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ò –º—ã, –≤—Å–µ –∫–∞–∫ –æ–¥–∏–Ω, –≤—Å–µ –∏–∑ –Ω–∏—Ö, –∏ –≤—Å–µ –º—ã, –≤—Å–µ –≤–º–µ—Å—Ç–µ‚Ä¶ –ù–æ –≤–µ–¥—å —Ç–∞–∫ —Ö–æ—á–µ—Ç—Å—è, —á—Ç–æ —É–∂ —è, –ø–æ–∂–∞–ª—É–π, –º–æ–≥—É —Å –Ω–∏–º —Å–ø–æ—Ä–∏—Ç—å‚Ä¶¬†‚Äì –≤—Å–∫–∏–Ω—É–ª—Å—è –ò–≤–∞–Ω –ü–µ—Ç—Ä–æ–≤–∏—á, –Ω–µ —Å–ª—É—à–∞—è, –≤–ø—Ä–æ—á–µ–º, –Ω–∏ –æ–¥–Ω–æ–≥–æ –∂–µ—Å—Ç–∞, –≤ –∫–æ—Ç–æ—Ä–æ–º –∏ –æ–Ω, –∏ –≤—Å–µ —Å–æ–±—Ä–∞–≤—à–∏–µ—Å—è –≤ –∑–∞–ª–µ –±—ã–ª–∏ —É–±–µ–∂–¥–µ–Ω—ã; –Ω–æ –æ–Ω–∏ —Å–ª—ã—à–∞–ª–∏
.  –£ –Ω–∞—Å –µ—Å—Ç—å –≤–æ–∑–º–æ–∂–Ω–æ—Å—Ç—å –≤ –≤–∞—à–µ–π –∏–≥—Ä–µ –∏–≥—Ä–∞—Ç—å –≤ –ª—é–±–æ–º –≤–∏–¥–µ. 
.  –û–Ω, –∫–∞–∫ –∏ –≤—Å—è–∫–∏–π —á–µ–ª–æ–≤–µ–∫, –æ—á–µ–Ω—å –ø–æ—Ö–æ–∂ –Ω–∞ —Å–≤–æ–µ–≥–æ –ø—Ä–µ–¥—à–µ—Å—Ç–≤–µ–Ω–Ω–∏–∫–∞; –Ω–æ —è –¥—É–º–∞–ª, —á—Ç–æ –æ–Ω —É–∂ —Å–ª–∏—à–∫–æ–º —É–º–Ω–∏–∫.  –Ø –Ω–µ –º–æ–≥ –µ–≥–æ –ø–æ–Ω—è—Ç—å: —Ç–æ –ª–∏ –æ–Ω —Å–æ–≤—Å–µ–º –Ω–µ –≥–ª—É–ø, —Ç–æ –ª–∏ –æ–Ω –¥–µ–π—Å—Ç–≤–∏—Ç–µ–ª—å–Ω–æ –Ω–µ –≤ —Å–≤–æ–µ–º —É–º–µ.  –Ø –±—ã–ª —É–±–µ–∂–¥–µ–Ω, —á—Ç–æ –æ–Ω —Å—É–º–∞—Å—à–µ–¥—à–∏–π. 
.  –í—ã—à–ª–∏—Ç–µ –∂–µ –í—ã –º–Ω–µ –∏—Ö –Ω–∞ –¥–æ–º.  

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}





Saving model checkpoint to ./checkpoint-500
Configuration saved in ./checkpoint-500/config.json
Configuration saved in ./checkpoint-500/generation_config.json


.  –ù–æ, –∫–æ–≥–¥–∞-–Ω–∏–±—É–¥—å, –≤ —ç—Ç–∏ –¥–Ω–∏ –∏ –º–∏–Ω—É—Ç—ã —è —Ä–∞—Å—Å–∫–∞–∂—É —Ç–µ–±–µ –æ–¥–∏–Ω –ø—Ä–∏–º–µ—Ä. –û–Ω –±—ã–ª –æ—á–µ–Ω—å –ø–æ–¥—Ä–æ–±–Ω–æ —Ä–∞—Å—Å–∫–∞–∑–∞–Ω–æ –∏ –Ω–µ –±—ã–ª–æ –∫–∞–∫–∏—Ö-—Ç–æ –æ—Å–æ–±–µ–Ω–Ω—ã—Ö –ø–æ–¥—Ä–æ–±–Ω–æ—Å—Ç–µ–π, –Ω–∏–∫–∞–∫–∏—Ö –ø–æ—è—Å–Ω–µ–Ω–∏–π.  –í —Ç–æ –∂–µ —Å–∞–º–æ–µ –≤—Ä–µ–º—è –æ–Ω –±—ã–ª —Ç–∞–∫ –∂–µ –ø–æ–¥—Ä–æ–±–Ω–æ –∑–∞–ø–∏—Å–∞–Ω –∏ –Ω–µ—Å–∫–æ–ª—å–∫–æ, –æ—Å–æ–±–µ–Ω–Ω–æ, –∫–æ–≥–¥–∞ —è –≤ –ø–æ—Å–ª–µ–¥–Ω–∏–π —Ä–∞–∑ –µ–≥–æ —á–∏—Ç–∞–ª, –≤–æ –≤–µ—Å—å —Ä–æ–º–∞–Ω,¬†
.  –ò, –Ω–∞–∫–æ–Ω–µ—Ü, –≤ —ç—Ç–æ—Ç –¥–µ–Ω—å —É –ü–µ—Ç—Ä–∞ –ê–ª–µ–∫—Å–µ–µ–≤–∏—á–∞ –±—ã–ª —Å–≤–æ–π —Å–æ–±—Å—Ç–≤–µ–Ω–Ω—ã–π –¥–µ–Ω—å.  –ü–æ-–Ω–∞—Å—Ç–æ—è—â–µ–º—É –æ–Ω —Å —É—Ç—Ä–∞ —Å–æ–±–∏—Ä–∞–ª—Å—è –∏–¥—Ç–∏ –∫ –ø–æ—Ä—Ç–Ω–æ–º—É, —á—Ç–æ–±—ã –≤ –ø–æ—Å–ª–µ–¥–Ω–∏–π —Ä–∞–∑ –ø–æ–∫–∞–∑–∞—Ç—å —Å–≤–æ—é —Ä—É–∫–æ–ø–∏—Å—å.  –ù–æ –≤ —ç—Ç–æ—Ç —á–∞—Å –æ–Ω –¥–æ–ª–∂–µ–Ω –±—ã–ª –±—ã—Ç—å —É –ø–æ—Ä—Ç–Ω–æ–≥–æ.  "–Ø –Ω–µ –º–æ–≥—É, - –ø–æ–¥—É–º–∞–ª –ü–µ—Ç—Ä –ê–ª–µ–∫—Å–µ–µ–≤–∏—á, - –≤–µ–¥—å –∑–¥–µ—Å—å –Ω–µ —Ç

Model weights saved in ./checkpoint-500/pytorch_model.bin
Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ò –º—ã —Å –Ω–∏–º —Ç–æ–∂–µ –Ω–∞ –º–∏–Ω—É—Ç–∫—É, –∫–∞–∫ –±—É–¥—Ç–æ –±—ã –≤ —Å–∞–º–æ–º –¥–µ–ª–µ —Ä–∞—Å—Å—Ç–∞–ª–∏—Å—å.‚Äì –ò –∫–∞–∫-—Ç–æ –∂–µ –º—ã —Å –Ω–∏–º —Ç–∞–∫ —Ä–∞—Å—Å—Ç–∞–ª–∏—Å—å? ‚Äì —Å–ø—Ä–æ—Å–∏–ª–∞ –°–æ–Ω—è, –≥–ª—è–¥—è –Ω–∞ –Ω–µ–≥–æ, —Å –Ω–µ–≤—ã—Ä–∞–∑–∏–º—ã–º —É–∂–∞—Å–æ–º —Å–º–æ—Ç—Ä—è—â–µ–≥–æ –≤ –≥–ª–∞–∑–∞.  –ù–æ –æ–Ω –≤—Å–µ –µ—â–µ –∂–¥–∞–ª, —á—Ç–æ –≤–æ—Ç-–≤–æ—Ç —Å–∫–∞–∂–µ—Ç, –Ω–æ –Ω–µ –º–æ–≥ –Ω–∞—á–∞—Ç—å.‚Äì –û–Ω –º–µ–Ω—è –Ω–µ –ª—é–±–∏—Ç
.  –ù–æ –Ω–µ –≤—Å–µ –æ–Ω–∏ –±—ã–ª–∏ —Ç–∞–∫–∏–µ –∏ —É–∂, –∫–æ–Ω–µ—á–Ω–æ, –≤ —Å—É—â–Ω–æ—Å—Ç–∏ –∏ –Ω–µ –≤—Å–µ —Ç–∞–∫ —É–∂ –∏ –ø–ª–æ—Ö–æ.  –í–æ—Ç, –Ω–∞–ø—Ä–∏–º–µ—Ä, –∫ –ø—Ä–∏–º–µ—Ä—É, –≤ "–ö—Ä–µ—Å—Ç–∏—Ç–µ–ª–µ" –µ—Å—Ç—å —Ç–∞–∫–æ–π —ç–ø–∏–∑–æ–¥, –∫–æ—Ç–æ—Ä—ã–π —è –∑–Ω–∞—é –∫–∞–∫ —Ä–∞–∑ –¥–æ —Ç–æ–≥–æ, –∫–∞–∫ –≤ –Ω–∞—à–µ–º —Ç–µ–∞—Ç—Ä–µ –ø–æ—è–≤–∏–ª—Å—è –ø–µ—Ä–≤—ã–π –≥–µ—Ä–æ–π.  –û–Ω –Ω–µ —Å–ª—É—á–∞–π–Ω–æ –±—ã–ª —É–±–∏—Ç, –æ–Ω –¥–µ–π—Å—Ç–≤–∏—Ç–µ–ª—å–Ω–æ —É–±–∏—Ç, –∫–∞–∫ —è
.  –≠—Ç–æ –∂–µ —Å–∞–º—ã–π –ª—É—á—à–∏–π! ‚Äì —Å–∫–∞–∑–∞–ª –ê–ª–∏–∫. 
.  –í –Ω–∞—

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –í –Ω–∞—á–∞–ª–µ —Ç—Ä–∏–¥—Ü–∞—Ç—ã—Ö –≥–æ–¥–æ–≤ –≤ —ç—Ç–æ –∂–µ —Å–∞–º–æ–µ –≤—Ä–µ–º—è, –≤ —Å–æ—Ä–æ–∫–æ–≤—ã—Ö, –∫ –≤–µ–ª–∏–∫–æ–º—É —É–¥–æ–≤–æ–ª—å—Å—Ç–≤–∏—é –Ω–µ–º—Ü–µ–≤, –≤ –ü–µ—Ç–µ—Ä–±—É—Ä–≥–µ –±—ã–ª–æ —É–∂–µ –º–Ω–æ–≥–æ –∏ –≤ —Ç–æ –∂–µ —Å–∞–º–æ–µ –≤—Ä–µ–º—è –º–Ω–æ–≥–æ –≤—Å–µ–≥–æ.  –ö —ç—Ç–æ–π —Ç–µ–º–µ, –≤ —Ç–æ–º –∂–µ –≥–æ–¥—É, –ø—Ä–∏ –∂–∏–∑–Ω–∏ –º–æ–µ–≥–æ –¥—Ä—É–≥–∞, –∫–æ—Ç–æ—Ä—ã–π –±—ã–ª –≤ —Å—Å—ã–ª–∫–µ, –æ –∫–æ—Ç–æ—Ä—ã—Ö —Å–µ–π—á–∞—Å —É–∂–µ –æ—á–µ–Ω—å –∏ –æ—á–µ–Ω—å —Ö–æ—Ä–æ—à–æ –∏–∑–≤–µ—Å—Ç–Ω–æ, –ø—Ä–∏–Ω–∞–¥–ª–µ–∂–∞–ª –æ–Ω,
.  –í—Å–µ-—Ç–∞–∫–∏ –Ω–∞–¥–æ –¥–∞—Ç—å –µ–º—É –≤—Ä–µ–º—è –∏ –ø—Ä–æ–π—Ç–∏ —á–µ—Ä–µ–∑ —ç—Ç–æ.  –ê –µ—Å–ª–∏ –∏ –ø—Ä–æ–ø—É—Å—Ç–∏–º, —Ç–æ –∑–∞—á–µ–º –Ω–∞–º –≤ —ç—Ç–æ –¥–µ–ª–æ –≤—Å—è —ç—Ç–∞ –≥—Ä—è–∑—å, —á—Ç–æ–±—ã –ø–æ—Ç–æ–º –Ω–µ –∏–¥—Ç–∏ –∫ –Ω–µ–º—É, —á—Ç–æ–±—ã –Ω–µ –±—ã—Ç—å –µ–º—É –Ω–µ –Ω–∞ —Å–≤–æ–∏—Ö –∂–µ –Ω–æ–≥–∞—Ö, –∞ –∫ –¥—Ä—É–≥–æ–º—É —á–µ–ª–æ–≤–µ–∫—É, –∫ —á–µ–º—É, –∫ —á–µ–º—É –∏–¥—Ç–∏ —Å —Ç–∞–∫–æ–π –≥—Ä—è–∑—å—é?  –í–æ—Ç –∏ –ø–æ–ª—É—á–∞–µ—Ç—Å—è —á—Ç–æ-—Ç–æ
.  –í —ç—Ç



Training completed. Do not forget to share your model on huggingface.co/models =)


Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ú–Ω–µ –ø–æ–∫–∞–∑–∞–ª–æ—Å—å, —á—Ç–æ —Ç—É—Ç –∫–∞–∫–æ–µ-—Ç–æ —á—Ç–æ-—Ç–æ –±—ã–ª–æ –¥—Ä—É–≥–æ–µ.  –ò –≤ –æ—Å–æ–±–µ–Ω–Ω–æ—Å—Ç–∏, —á—Ç–æ-—Ç–æ –Ω–µ –ø–æ—Ö–æ–∂–µ–µ –Ω–∞ –ø—Ä–∞–≤–¥—É. 
.  –ò —Ö–æ—Ç—è, –ø–æ —Å—É—Ç–∏ —Å–≤–æ–µ–π, –æ–Ω–∞ –Ω–µ –±—ã–ª–∞ –ø–æ—Ö–æ–∂–∞ –Ω–∏ –Ω–∞ –∫–∞–∫—É—é –¥—Ä—É–≥—É—é –∂–µ–Ω—â–∏–Ω—É; –Ω–æ —á—Ç–æ-—Ç–æ –≤–æ –≤–∑–≥–ª—è–¥–µ, –≤–∑–≥–ª—è–¥–µ, –≤ –≤—ã—Ä–∞–∂–µ–Ω–∏–∏ –≥–ª–∞–∑, –≤ –∫–∞–∂–¥–æ–º –¥–≤–∏–∂–µ–Ω–∏–∏ —ç—Ç–æ–≥–æ –ª–∏—Ü–∞, –≤ –∫–∞–∂–¥–æ–º –¥–≤–∏–∂–µ–Ω–∏–∏ –µ–≥–æ –≥–æ–ª–æ–≤—ã –∏ –≤ –∫–∞–∂–¥–æ–º –¥–≤–∏–∂–µ–Ω–∏–∏ —ç—Ç–∏—Ö –¥–≤–∏–∂–µ–Ω–∏–π –±—ã–ª–æ —á—Ç–æ-—Ç–æ —Å—Ç—Ä–∞–Ω–Ω–æ–µ.  –û–Ω–æ –∫–∞–∫ –±—É–¥—Ç–æ –Ω–µ –æ—Ç–ª–∏—á–∞–ª–æ—Å—å –æ—Ç –æ–±—ã–∫–Ω–æ–≤–µ–Ω–Ω—ã—Ö –ª—é–¥–µ–π –Ω–∏ –≤ —á–µ–º.
.  –û–≥–æ—Ä–æ–¥–Ω–∞—è —á–∞—Å—Ç—å, –∫–∞–∫ –≤—Å–µ–≥–¥–∞, –¥–æ–≤–æ–ª—å–Ω–æ —Å–≤–æ–µ–æ–±—Ä–∞–∑–Ω–∞.  –í –æ—Å–Ω–æ–≤–Ω–æ–º —ç—Ç–æ –¥–æ–º–∞ –∫—Ä–µ—Å—Ç—å—è–Ω.  –ó–∞—Ö–æ—Ä–æ–Ω–µ–Ω–∏—è –∂–µ –º–æ–∂–Ω–æ –Ω–∞–±–ª—é–¥–∞—Ç—å –∑–∞ —á–∞—Å—Ç–Ω—ã–º–∏, –Ω–∞ —Å–ª—É—á–∞–π, –µ—Å–ª–∏ –≤—ã –ø—Ä–æ–∂–∏–≤–∞–µ—Ç–µ –≤ –

Saving model checkpoint to .
Configuration saved in ./config.json
Configuration saved in ./generation_config.json
Model weights saved in ./pytorch_model.bin


In [10]:
# Sample continuations from the model left in the global namespace by the fine-tuning
# run above (print_generations reads `model` and `tokenizer` as globals).
# Prompt: ". Самое главное это" = ". The most important thing is". The literal must be real
# UTF-8 Cyrillic; a mis-decoded (mojibake) prompt would be tokenized as garbage.
# max_len=200 raises the generation length cap from the helper's default of 70.
print_generations(prefix=". Самое главное это", max_len=200)

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



. –°–∞–º–æ–µ –≥–ª–∞–≤–Ω–æ–µ —ç—Ç–æ ‚Äì —á—Ç–æ–± –≤—Å–µ-—Ç–∞–∫–∏ –∏ –≤ —Ç—É –∂–µ –º–∏–Ω—É—Ç—É –Ω–µ —Å–ª—É—á–∏–ª–æ—Å—å. ¬´–ù–µ—Ç, ‚Äì –ø–æ–¥—É–º–∞–ª –ü–∞–≤–µ–ª –ü–∞–≤–ª–æ–≤–∏—á, ‚Äì –æ–Ω –Ω–µ –º–æ–∂–µ—Ç –±—ã—Ç—å –≤ —ç—Ç—É –º–∏–Ω—É—Ç—É —Ç–∞–∫ –±–µ—Å—Å–∏–ª–µ–Ω, —á—Ç–æ –Ω–µ —Å–º–µ–µ—Ç –ø–µ—Ä–µ—Å—Ç—É–ø–∏—Ç—å —á–µ—Ä–µ–∑ —Å–µ–±—è¬ª. –û–Ω –ø–æ–¥–æ—à–µ–ª –∫ –∫—Ä–æ–≤–∞—Ç–∏ –∏ —Å—Ç–∞–ª –≤ –∏–∑–≥–æ–ª–æ–≤—å–µ, –∫–∞–∫ –±—ã –æ–±–¥—É–º—ã–≤–∞—è –∫–∞–∫–æ–µ-—Ç–æ —Ä–µ—à–µ–Ω–∏–µ. –û–Ω –Ω–µ –∑–Ω–∞–ª, –≤ –∫–∞–∫—É—é —Å—Ç–æ—Ä–æ–Ω—É –±—Ä–æ—Å–∏—Ç—å—Å—è, —á—Ç–æ–± –Ω–µ —Ç–æ–ª—å–∫–æ —É–±–µ–∂–∞—Ç—å, –Ω–æ –∏ —Å–ø–∞—Å—Ç–∏—Å—å. –û–Ω —É–∂–µ –ø—Ä–∏–≥–æ—Ç–æ–≤–∏–ª—Å—è –±–µ–∂–∞—Ç—å, –Ω–æ –∫–∞–∫ –±—É–¥—Ç–æ –±—ã –≤–¥—Ä—É–≥ –∫–∞–∫ –±—ã —á—Ç–æ-—Ç–æ –∏–∑–º–µ–Ω–∏–ª–æ—Å—å, —á—Ç–æ-—Ç–æ –∏—Å—á–µ–∑–ª–æ –≤ –Ω–µ–º. –ß—Ç–æ —ç—Ç–æ –±—ã–ª–æ? –ü–æ—á–µ–º—É –æ–Ω –≤–¥—Ä—É–≥ –æ–ø—è—Ç—å –Ω–∏—á–µ–≥–æ –Ω–µ –≤–∏–¥–∏—Ç? –ß—Ç–æ –æ–Ω –≤–∏–¥–µ–ª?
. –°–∞–º–æ–µ –≥–ª–∞–≤–Ω–æ–µ —ç—Ç–æ –Ω–µ –≤ —Ç–æ–º, —á—Ç–æ —ç—Ç–æ –±—É–¥–µ—Ç, —ç—Ç–æ –Ω–µ —Ç–æ, —á—Ç–æ —ç—Ç–

In [11]:
# Probe the same fine-tuned model with a prompt that does not start with the ". "
# default prefix. Prompt: "В 2024 году" = "In 2024". The literal must be real UTF-8
# Cyrillic; a mis-decoded (mojibake) prompt would be tokenized as garbage.
# max_len=200 raises the generation length cap from the helper's default of 70.
print_generations(prefix="В 2024 году", max_len=200)

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



–í 2024 –≥–æ–¥—É (–≤ —Å–≤—è–∑–∏ —Å ¬´–°–æ–Ω–º–∞–º–∏¬ª) –±—ã–ª –ø—Ä–æ–∏–∑–≤–µ–¥–µ–Ω —Ä–µ–º–æ–Ω—Ç –¥–æ–º–∞ –Ω–∞ –†—É–±–ª—ë–≤–∫–µ, –Ω–æ –Ω–µ –≤ –∑–¥–∞–Ω–∏–∏, –∞ –≤ —á–∞—Å—Ç–Ω–æ–º –¥–æ–º–µ –Ω–∞ –°—Ç–∞—Ä–æ–º –ê—Ä–±–∞—Ç–µ. –ù–µ –∑–Ω–∞—é –ø–æ—á–µ–º—É, –¥–∞ –∏ –∑–∞—á–µ–º —Ç–∞–∫ –¥–µ–ª–∞—Ç—å, —É –º–µ–Ω—è –≤ —Ç–æ–º –∂–µ –¥–æ–º–µ —Ä–µ–º–æ–Ω—Ç –±—ã–ª, –∞ —è –∏ –Ω–µ –ø–æ–º–Ω—é –µ–≥–æ, —Ç–∞–∫ —á—Ç–æ —ç—Ç–æ —Å–∫–æ—Ä–µ–µ –∫ —Å–ª–æ–≤—É‚Ä¶ –ê –¥–æ —Ç–µ—Ö –ø–æ—Ä –±—ã–ª–æ –¥–µ–ª–æ, –∏ —è –Ω–µ –∑–Ω–∞—é –∫–∞–∫ –≤ —ç—Ç–æ—Ç –¥–æ–º –ø–æ–ø–∞—Å—Ç—å.
–í 2024 –≥–æ–¥—É –≤ –†–æ—Å—Å–∏–∏ –ø–æ –ø—Ä–µ–¥–ª–æ–∂–µ–Ω–∏—é –í. –ò. –õ–µ–Ω–∏–Ω–∞ –≤ –ø–∏—Å—å–º–µ –∫ –æ–¥–Ω–æ–º—É –∏–∑ –∑–Ω–∞–∫–æ–º—ã—Ö –≤ –ú–æ—Å–∫–≤–µ ¬´–æ –Ω–æ–≤—ã—Ö –≤–µ—â–∞—Ö¬ª, –æ–Ω –±—ã–ª –ø–æ—Å—Ç–∞–≤–ª–µ–Ω –≤ –æ–¥–∏–Ω —Ä—è–¥ —Å –ø—Ä–µ–¥—Å—Ç–∞–≤–∏—Ç–µ–ª—è–º–∏ –¥—É—Ö–æ–≤–µ–Ω—Å—Ç–≤–∞ –∏ —Å –Ω–µ–∫–æ—Ç–æ—Ä—ã–º–∏ –∏–∑ –ø—Ä–∏–±–ª–∏–∂–µ–Ω–Ω—ã—Ö, –±—ã–≤—à–∏—Ö –µ—â–µ –≤ —Ç–æ –≤—Ä–µ–º—è —á–ª–µ–Ω–∞–º–∏ –ø—Ä–∞–≤–∏—Ç–µ–ª—å—Å—Ç–≤–∞, —Å –Ω–µ–∫–æ—Ç–æ—Ä—ã–º–∏ –∏–∑ –∫–æ—Ç–æ—Ä—ã—

In [12]:
# First-person prompt for the same fine-tuned model.
# Prompt: "Больше всего на свете я" = "More than anything in the world, I". The literal
# must be real UTF-8 Cyrillic; a mis-decoded (mojibake) prompt would be tokenized as garbage.
# max_len=200 raises the generation length cap from the helper's default of 70.
print_generations(prefix="Больше всего на свете я", max_len=200)

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



–ë–æ–ª—å—à–µ –≤—Å–µ–≥–æ –Ω–∞ —Å–≤–µ—Ç–µ —è –µ–µ –±–æ—é—Å—å,¬†‚Äì –æ—Ç–≤–µ—á–∞–ª–∞ –æ–Ω–∞ —Ç–∏—Ö–æ –∏ –Ω–µ–∂–Ω–æ.¬†‚Äì –Ø –≤ –Ω–µ–µ —Ö–æ—á—É –ø—Ä–µ–≤—Ä–∞—Ç–∏—Ç—å—Å—è –∏ —Å—Ç–∞—Ç—å –µ–µ –º–∞—Ç–µ—Ä—å—é. –ò —è –≤ —ç—Ç–æ –≤–µ—Ä—é, –ø–æ—Ç–æ–º—É —á—Ç–æ‚Ä¶ —è‚Ä¶ –Ø, –Ω–∞–∫–æ–Ω–µ—Ü, –æ–Ω–∞, —è‚Ä¶ —è‚Ä¶ –Ø‚Ä¶
–ë–æ–ª—å—à–µ –≤—Å–µ–≥–æ –Ω–∞ —Å–≤–µ—Ç–µ —è —Ö–æ—Ç–µ–ª–∞ –±—ã—Ç—å –µ–≥–æ‚Ä¶ –∫–∞–∫ –±—É–¥—Ç–æ —ç—Ç–æ —Ç–∞–∫ –∏ –±—ã–ª–æ. –£–±–∏—Ç—å‚Ä¶
–ë–æ–ª—å—à–µ –≤—Å–µ–≥–æ –Ω–∞ —Å–≤–µ—Ç–µ —è –≤ –≤–æ—Å—Ç–æ—Ä–≥–µ! –≠—Ç–æ –±—ã–ª–æ –æ–¥–Ω–æ –∏–∑ –º–æ–∏—Ö —Å–∞–º—ã—Ö —Å—á–∞—Å—Ç–ª–∏–≤—ã—Ö –≤–æ—Å–ø–æ–º–∏–Ω–∞–Ω–∏–π! –Ø –±—ã–ª–∞ –≤ –≤–æ—Å—Ç–æ—Ä–≥–µ. –û–Ω–∞ –±—ã–ª–∞ —Å—á–∞—Å—Ç–ª–∏–≤–∞, –≤ –≤–æ—Å—Ç–æ—Ä–≥–µ –∏ –¥–∞–∂–µ, –∫–∞–∂–µ—Ç—Å—è, —á—É—Ç—å –≤ —Å–ª–µ–∑—ã –Ω–µ –±–∏–ª–∞—Å—å, –Ω–æ —è —á—É–≤—Å—Ç–≤–æ–≤–∞–ª–∞, —á—Ç–æ –æ–Ω–∞ –ø–ª–∞—á–µ—Ç. –ö–æ–≥–¥–∞ –æ–Ω–∞ –≤—ã—Ö–æ–¥–∏–ª–∞, –æ–Ω–∞ —É–∂–µ –±—ã–ª–∞ –≤ –≤–æ–ª–Ω–µ–Ω–∏–∏. –£ –º–µ–Ω—è –±—ã–ª–∏ –¥—Ä–æ–∂–∫–∏ –≤ –∫–æ–ª–µ–Ω—è—Ö. –ö–∞–∫ –º–Ω–µ —Ö–æ—Ç–µ–ª–æ—Å—å –µ–µ –ø–æ—Ü–µ–ª–æ–≤–

Собрание сочинений Толстого

In [13]:
# Tolstoy run. Reload the pretrained checkpoint (get_ru_model defaults to
# "sberbank-ai/rugpt3small_based_on_gpt2") so this fine-tune starts from the base
# weights rather than from the model trained in the previous section. Rebinding the
# globals `model` / `tokenizer` also changes what print_generations samples from.
model, tokenizer = get_ru_model()
# With the argument 8, the Trainer log of this cell reports 28,353,024 trainable
# parameters. NOTE(review): presumably this freezes the embeddings and the first 8 of
# the model's 12 transformer blocks -- confirm against freeze_layers.
freeze_layers(model, 8)
# Fine-tune on the corpus at TOLST_PATH. NOTE(review): this cell's log shows checkpoints
# written to "./checkpoint-500" and ".", the same paths that appear in the previous
# run's log, so earlier checkpoints are presumably overwritten -- confirm finetune's
# output directory.
finetune(model, tokenizer, TOLST_PATH)

loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--sberbank-ai--rugpt3small_based_on_gpt2/snapshots/f2f7c585b05a16726efe8974586e10b4d5939082/config.json
Model config GPT2Config {
  "_name_or_path": "sberbank-ai/rugpt3small_based_on_gpt2",
  "activation_function": "gelu_new",
  "architectures": [
    "GPT2LMHeadModel"
  ],
  "attn_pdrop": 0.1,
  "bos_token_id": 50256,
  "embd_pdrop": 0.1,
  "eos_token_id": 50256,
  "gradient_checkpointing": false,
  "initializer_range": 0.02,
  "layer_norm_epsilon": 1e-05,
  "model_type": "gpt2",
  "n_ctx": 2048,
  "n_embd": 768,
  "n_head": 12,
  "n_inner": null,
  "n_layer": 12,
  "n_positions": 2048,
  "reorder_and_upcast_attn": false,
  "resid_pdrop": 0.1,
  "scale_attn_by_inverse_layer_idx": false,
  "scale_attn_weights": true,
  "summary_activation": null,
  "summary_first_dropout": 0.1,
  "summary_proj_to_labels": true,
  "summary_type": "cls_index",
  "summary_use_proj": true,
  "transformers_version": "4.2

SETTING N_EPOCHS TO  0.8218274747444199


Loading features from cached file /content/gdrive/MyDrive/datasets/cached_lm_GPT2TokenizerFast_256_tolst.txt [took 0.704 s]
PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
***** Running training *****
  Num examples = 6018
  Num Epochs = 1
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 619
  Number of trainable parameters = 28353024


Step,Training Loss
50,3.5064
100,3.4464
150,3.4331
200,3.4262
250,3.3905
300,3.4336
350,3.3588
400,3.3833
450,3.374
500,3.3648


Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –û–Ω, –ø–æ —Å–≤–æ–µ–º—É –≤–Ω—É—Ç—Ä–µ–Ω–Ω–µ–º—É —É–±–µ–∂–¥–µ–Ω–∏—é, –∏ –Ω–µ —Ö–æ—Ç–µ–ª –±—ã—Ç—å –Ω–∞ —Å—Ç–æ—Ä–æ–Ω–µ.  –û–Ω –ø—Ä–æ—Å—Ç–æ –Ω–µ –º–æ–≥ –¥–æ–ø—É—Å—Ç–∏—Ç—å —Ç–æ–≥–æ, —á—Ç–æ, –ø–æ –µ–≥–æ –º–Ω–µ–Ω–∏—é, –æ–Ω –≤—Å–µ –∂–µ –∏–º–µ–ª —Ç–æ, —á—Ç–æ –∏–º–µ–ª. 
.  –í –∑–∞–≤–∏—Å–∏–º–æ—Å—Ç–∏ –æ—Ç —Ö–∞—Ä–∞–∫—Ç–µ—Ä–∞ –ø—Ä–æ–±–ª–µ–º—ã –º—ã –º–æ–∂–µ–º –ø–æ–ª—É—á–∏—Ç—å –æ—á–µ–Ω—å –∏–Ω—Ç–µ—Ä–µ—Å–Ω—ã–µ –∏ –æ—Ä–∏–≥–∏–Ω–∞–ª—å–Ω—ã–µ –ø—Ä–µ–¥–ª–æ–∂–µ–Ω–∏—è, –∫–æ—Ç–æ—Ä—ã–µ –∑–∞—Å—Ç–∞–≤—è—Ç –≤–∞—Å –∑–∞–¥—É–º–∞—Ç—å—Å—è –æ —Ä–∞–∑–≤–∏—Ç–∏–∏, —Ä–∞–±–æ—Ç–µ, –∫–∞—Ä—å–µ—Ä–Ω–æ–π –∏ –ª–∏—á–Ω–æ–π –∂–∏–∑–Ω–∏. 
.  –ö–æ–≥–¥–∞ –æ–Ω–∞ –±—ã–ª–∞ —É –Ω–µ–µ, –æ–Ω, –∫–∞–∫ –æ–Ω –∑–Ω–∞–ª, –Ω–µ –º–æ–≥ –∑–∞—Å—Ç–∞–≤–∏—Ç—å –µ–µ –≤–∑—è—Ç—å –µ–µ.  –û–Ω —á—É–≤—Å—Ç–≤–æ–≤–∞–ª, —á—Ç–æ –µ–µ —Å–µ—Ä–¥—Ü–µ —Ä–∞–∑—Ä—ã–≤–∞–µ—Ç—Å—è –æ—Ç –ª—é–±–≤–∏.  –ß—Ç–æ –æ–Ω–∞ –∑–Ω–∞–ª–∞, —á—Ç–æ –µ–π —Ö–æ—á–µ—Ç—Å—è –µ–≥–æ. 
.  –û–Ω —Å–∫–∞–∑–∞–ª, —á—Ç–æ –æ–Ω –Ω–µ —Å–º–æ–∂–µ—Ç –∂–∏—Ç—å –±–µ–∑ –Ω–µ–µ.  –ú–Ω–µ –æ–Ω –Ω–µ –Ω—É–∂–µ–Ω. 


Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –í –ú–æ—Å–∫–≤–µ –≤ –¥–µ–∫–∞–±—Ä–µ —ç—Ç–æ–≥–æ –≥–æ–¥–∞ –Ω–µ –±—ã–ª–æ –¥–æ–∂–¥—è.  –ú—ã —É–∂–µ –ø—Ä–∏–≤—ã–∫–ª–∏ –∫ —ç—Ç–æ–º—É, –∫–∞–∫ –∫ –Ω–æ–≤–æ–º—É, —á—Ç–æ –ø–æ —É—Ç—Ä–∞–º, –ø—Ä–∏–µ—Ö–∞–≤ –Ω–∞ –±–∞–∑–∞—Ä, –º—ã —Å–ª—ã—à–∏–º: "–ü–æ–µ–∑–∂–∞–π—Ç–µ –Ω–∞ –±–∞–∑–∞—Ä, –∞ –∑–∞–≤—Ç—Ä–∞ ‚Äì –æ–±—Ä–∞—Ç–Ω–æ –≤ –ú–æ—Å–∫–≤—É!"  –ê –µ—Å–ª–∏ –¥–æ–∂–¥—å –≤—Å–µ-—Ç–∞–∫–∏ –Ω–∞—á–∞–ª—Å—è, —Ç–æ –º—ã –Ω–µ —Å–ª—ã—à–∏–º, –∫–∞–∫ –µ—Ö–∞–ª–∏ –Ω–∞–∑–∞–¥. 
.  –ò –µ—Å–ª–∏ –±—ã –≤—ã —Å –Ω–∏–º–∏, –∏ –æ–Ω–∏ —Å –≤–∞–º–∏, –≤—ã –±—ã–ª–∏ –±—ã —Ç–∞–∫ —Å—á–∞—Å—Ç–ª–∏–≤—ã, —á—Ç–æ –≤ —ç—Ç–æ–π –∂–∏–∑–Ω–∏ —Ç–∞–∫ –ø—Ä–æ—Å—Ç–æ –Ω–µ –ø–æ–π–º–µ—Ç–µ —Å–≤–æ–∏—Ö —Å—Ç—Ä–∞–¥–∞–Ω–∏–π. 
. 
.  –í –Ω–µ–º –Ω–µ —Ç–æ–ª—å–∫–æ –≤ —Å–∞–º–æ–º –Ω–∞—á–∞–ª–µ, –Ω–æ –∏ –Ω–∞ –ø—Ä–æ—Ç—è–∂–µ–Ω–∏–∏ –≤—Å–µ–≥–æ —ç—Ç–æ–≥–æ –≤—Ä–µ–º–µ–Ω–∏ –±—ã–ª –∏ –µ–≥–æ —Ä—É–∫–æ–≤–æ–¥–∏—Ç–µ–ª—å ‚Äî –≥–µ–Ω–µ—Ä–∞–ª-–º–∞–π–æ—Ä –≥—Ä–∞—Ñ –ê–ª–µ–∫—Å–µ–π –î–º–∏—Ç—Ä–∏–µ–≤–∏—á –†–æ–≥–æ–≤.  –í —ç—Ç–æ–º –∏–∑–¥–∞–Ω–∏–∏ –µ—Å—Ç—å —Ç–∞–∫–∂–µ –µ–≥–æ –∞–≤—Ç–æ–≥—Ä–∞—Ñ—ã, –Ω–æ —Ç–æ–ª—å–∫–æ, –ø

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –û–Ω –≥–æ–≤–æ—Ä–∏–ª, —á—Ç–æ —ç—Ç–æ –¥–ª—è —Ç–æ–≥–æ, —á—Ç–æ–±—ã –ø–æ–∫–∞–∑–∞—Ç—å –µ–º—É, –∫–∞–∫ –µ–≥–æ –ª—é–±–∏—Ç –∫–Ω—è–≥–∏–Ω—è –û–ª—å–≥–∞, –∏ —á—Ç–æ–±—ã –æ–Ω –Ω–µ –∑–∞–±—ã–≤–∞–ª –µ–µ –∏ –≤ –¥–æ–º–µ –µ–µ.  –ò –æ–Ω –Ω–µ –∑–∞–±—ã–≤–∞–ª, –∫–∞–∫ —Ö–æ—Ä–æ—à–æ —á—É–≤—Å—Ç–≤–æ–≤–∞–ª –µ–µ. 
.  –ü–æ—Å–ª–µ —Ç–æ–≥–æ, –∫–∞–∫ –º—ã –≤—Å–µ —Å–µ–ª–∏ –∑–∞ —Å—Ç–æ–ª –∏ —è, –∫–∞–∫ –º–Ω–µ –ø–æ–∫–∞–∑–∞–ª–æ—Å—å, —á—É–≤—Å—Ç–≤–æ–≤–∞–ª —Å–µ–±—è –≤ –Ω–æ–≤–æ–π –∂–∏–∑–Ω–∏ —Ç–∞–∫ –∂–µ —Ö–æ—Ä–æ—à–æ, –∫–∞–∫ –º—ã —Å –¢–æ—Å–∏–Ω—ã–º, —è —á—É–≤—Å—Ç–≤–æ–≤–∞–ª —Å–µ–±—è –ø–æ-–Ω–æ–≤–æ–º—É: —á—É–≤—Å—Ç–≤–æ–≤–∞–ª —Å–µ–±—è —Ç–∞–∫, –∫–∞–∫ —á—É–≤—Å—Ç–≤–æ–≤–∞–ª —Å–µ–±—è –≤ —Å–≤–æ–µ –≤—Ä–µ–º—è –∏ —è. –ê –∫–æ–≥–¥–∞ —è –µ—Ö–∞–ª –∫ –¢–æ—Å–∏–Ω—ã–º, —è —Ç–∞–∫ –∂–µ —á—É–≤—Å—Ç–≤–æ–≤–∞–ª —Å–µ–±—è —Ç–∞–∫ –∂–µ
.  –ü—Ä–∏ —ç—Ç–æ–º –º–Ω–æ–≥–∏–µ –∑–Ω–∞–∫–æ–º—ã–µ —É–∂–µ –≤–∏–¥–µ–ª–∏, –∫–∞–∫ —è –µ–∑–∂—É –Ω–∞ —Å–≤–æ–µ–º —Å–∫—É—Ç–µ—Ä–µ. ‚Äì –≥–æ–≤–æ—Ä–∏—Ç –ù–∞—Ç–∞–ª—å—è, ‚Äî –∫–æ–≥–¥–∞-—Ç–æ –≤ –Ω–∞—à–µ–º –¥–≤–æ—Ä–µ –±—ã–ª–∞ –æ—á–µ–Ω—å –ø—Ä–æ—Å—Ç–∞—

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ü—Ä–µ–±—ã–≤–∞—è –≤ –Ω–µ–º, —á–µ–ª–æ–≤–µ–∫ –Ω–µ–≤–æ–ª—å–Ω–æ —Å–æ–ø—Ä–∏–∫–∞—Å–∞–µ—Ç—Å—è —Å –∂–∏–∑–Ω—å—é –∏ —á—É–≤—Å—Ç–≤–∞–º–∏ –¥—Ä—É–≥–∏—Ö –ª—é–¥–µ–π, —Å —Å–≤–æ–∏–º–∏ –ø–æ—Å—Ç—É–ø–∫–∞–º–∏, —á—É–≤—Å—Ç–≤–∞–º–∏, –ø–æ–Ω—è—Ç–∏—è–º–∏, –ø–æ–Ω—è—Ç–∏—è–º–∏, –ø–æ–Ω—è—Ç–∏—è–º–∏, –∏–¥–µ—è–º–∏ –∏ —É–±–µ–∂–¥–µ–Ω–∏—è–º–∏.  –ù–æ –≤ —á–µ–ª–æ–≤–µ–∫–µ, –≤ –≥–ª—É–±–∏–Ω–µ –¥—É—à–∏ —Å—Ç—Ä–µ–º–∏–≤—à–µ–º—Å—è –∂–∏—Ç—å —Å–≤–æ–∏–º —É–º–æ–º, –≤ –Ω–µ–º –Ω–µ—Ç –Ω–∏–∫–∞–∫–∏—Ö —ç—Ç–∏—Ö –¥—É—Ö–æ–≤–Ω—ã—Ö –æ—Ä–∏–µ–Ω—Ç–∏—Ä–æ–≤.  –ù–∞–ø—Ä–æ—Ç–∏–≤, –∏–º–µ–Ω–Ω–æ –≤ —á–µ–ª–æ–≤–µ–∫–µ,
.  –í—Å–µ –≤—ã –∑–Ω–∞–µ—Ç–µ, —á—Ç–æ —ç—Ç–æ —Ç–∞–∫–æ–µ, –≤—ã ‚Äì –º–æ—è –ø–æ–¥—Ä—É–≥–∞, –∫–æ—Ç–æ—Ä—É—é —è —Ö–æ—á—É –≤–∏–¥–µ—Ç—å, –Ω–æ –≤—ã ‚Äì –Ω–µ –∂–µ–Ω–∞.  –ö–∞–∫ –≤—ã –º–æ–≥–ª–∏ –¥–æ–≥–∞–¥–∞—Ç—å—Å—è, —á—Ç–æ —è –±—É–¥—É –∂–∏—Ç—å —Å –æ–¥–Ω–æ–π –∂–µ–Ω—â–∏–Ω–æ–π, –∫–æ—Ç–æ—Ä–∞—è, —Å –≤–∞—à–µ–≥–æ —Å–ª–æ–≤–∞, –º–Ω–µ –∏–∑–º–µ–Ω–∏–ª–∞, –∏ –≤—ã –º–æ–∂–µ—Ç–µ —Å—á–∏—Ç–∞—Ç—å –º–µ–Ω—è —Å—É–º–∞—Å—à–µ–¥—à–∏–º.  –í—ã –Ω–µ –ø–æ–Ω–∏–º–∞–µ—Ç–µ —ç—Ç–æ–≥–æ, –Ω–æ

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ò–∑-–∑–∞ —ç—Ç–æ–≥–æ, —É –º–µ–Ω—è –Ω–µ—Ç –≤–æ–∑–º–æ–∂–Ω–æ—Å—Ç–∏ —Ö–æ–¥–∏—Ç—å –Ω–∞ —Ä–∞–±–æ—Ç—É. 
.  –í—Å–µ —ç—Ç–∏ –ø–ª–∞–Ω—ã –º–æ–∂–Ω–æ –æ—Ö–∞—Ä–∞–∫—Ç–µ—Ä–∏–∑–æ–≤–∞—Ç—å —Ç–∞–∫: –≤ –Ω–∞—á–∞–ª–µ —Å–µ–Ω—Ç—è–±—Ä—è, –∫–∞–∫ –≥–æ–≤–æ—Ä–∏—Ç—Å—è, –Ω–µ –±—ã–ª–æ –Ω–∏ –æ–¥–Ω–æ–≥–æ –¥–Ω—è.  –ò–∑ –ø—è—Ç–∏ –ø—É–Ω–∫—Ç–æ–≤ –∏ –¥–≤—É—Ö (–∏–∑ –∫–æ—Ç–æ—Ä—ã—Ö –æ–¥–∏–Ω –∫–∞—Å–∞–µ—Ç—Å—è –∞—Ä–º–∏–∏) –±—ã–ª–æ —Ç—Ä–∏.  –ò, –Ω–µ —Ç–µ—Ä—è—è –≤—Ä–µ–º–µ–Ω–∏ –¥–∞—Ä–æ–º, –º—ã –Ω–∞—á–∞–ª–∏, –∫–∞–∫ –≥–æ–≤–æ—Ä–∏—Ç—Å—è, –Ω–∞—Å—Ç—Ä–∞–∏–≤–∞—Ç—å —Å–µ–±—è –Ω–∞ —Ç–æ, —á—Ç–æ –±—É–¥–µ—Ç —Å–¥–µ–ª–∞–Ω–æ. 
.  –Ø –∑–Ω–∞–ª, —á—Ç–æ –æ–Ω–∞ –≤—Å–µ —Ç–∞–∫ —É–º–µ–µ—Ç, –∏ —É –º–µ–Ω—è –≤ –¥—É—à–µ –Ω–µ –±—ã–ª–æ —Å–æ–º–Ω–µ–Ω–∏–π, —á—Ç–æ –≤ –µ–µ –≤–∑–≥–ª—è–¥–µ, –ø—Ä–∏ –≤–æ—Å–ø–æ–º–∏–Ω–∞–Ω–∏–∏ –æ–± —ç—Ç–æ–π –º–∏–Ω—É—Ç–Ω–æ–π —Å–ª–∞–±–æ—Å—Ç–∏, –æ–Ω–∞ –Ω–µ –º–æ–≥–ª–∞ –Ω–∏—á–µ–≥–æ —Å–∫–∞–∑–∞—Ç—å. 
.  –í—Å–µ —ç—Ç–æ —Ö–æ—Ä–æ—à–æ, –Ω–æ –ø–æ—á–µ–º—É-—Ç–æ —è –Ω–µ –∑–Ω–∞—é, –∫–∞–∫ –±—ã—Ç—å.  –ö–∞–∫ –ø–æ–Ω—è—Ç—å, —á—Ç–æ —è ‚Äì –¥–µ–≤—É—à–∫–∞?  –ê, —á—

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –Ø –¥—É–º–∞—é, –≤—Å–µ —ç—Ç–∏ –ª—é–¥–∏ –Ω–µ –º–æ–≥—É—Ç –±—ã—Ç—å —Ç–∞–∫, —á—Ç–æ–±—ã –±—ã—Ç—å –≤–º–µ—Å—Ç–µ, –∫–∞–∫ –∏ –¥–æ–ª–∂–Ω—ã –±—ã—Ç—å –≤–º–µ—Å—Ç–µ.  –û–Ω–∏ –Ω–µ —Ç–æ–ª—å–∫–æ –Ω–µ –±—ã–ª–∏ –≤–º–µ—Å—Ç–µ —Å–æ –º–Ω–æ—é, –Ω–æ –∫–∞–∫ –±—É–¥—Ç–æ –±—ã–ª–∏ –≤–º–µ—Å—Ç–µ —Å–æ –º–Ω–æ–π.  –Ø –¥—É–º–∞—é, —á—Ç–æ —è —Ç–æ–∂–µ –±—ã–ª —á–∞—Å—Ç—å—é —á–µ–≥–æ-—Ç–æ –¥—Ä—É–≥–æ–≥–æ. 
.  –í–ª–∏—è–Ω–∏–µ –Ω–∞ —ç—Ç–æ –≤–ª–∏—è–Ω–∏–µ –∏ –ø—Ä–∏–≤–µ–ª–æ –µ–µ –∫ —Ç–æ–º—É, —á—Ç–æ–±—ã –Ω–∞—á–∞—Ç—å –¥–≤–∏–∂–µ–Ω–∏–µ –∫ –µ–¥–∏–Ω—Å—Ç–≤—É. 
.  –û–Ω —á—É–≤—Å—Ç–≤–æ–≤–∞–ª, —á—Ç–æ –æ–Ω –±—ã–ª –∑–∞–Ω—è—Ç –º—ã—Å–ª—è–º–∏, –∏ –≤–¥—Ä—É–≥ –ø–æ—á—É–≤—Å—Ç–≤–æ–≤–∞–ª, —á—Ç–æ –æ–Ω –Ω–µ –≤ —Ç–æ–º —Ä–∞—Å–ø–æ–ª–æ–∂–µ–Ω–∏–∏ –¥—É—Ö–∞.  –û–Ω –≤—Å–ø–æ–º–Ω–∏–ª –∏ —Ç–æ, —á—Ç–æ —Å–ª—É—á–∏–ª–æ—Å—å –≤ —ç—Ç–æ–º –¥–æ–º–µ.  –í—Å–ø–æ–º–Ω–∏–ª, –∫–∞–∫ –≤—Å–µ —Å–º–µ—è–ª–∏—Å—å –Ω–∞–¥ –Ω–∏–º, –∏ –≤—Å–ø–æ–º–Ω–∏–ª –µ–≥–æ —Å–ª–æ–≤–∞: "–ö–∞–∫–æ–µ –º–∏–ª–æ–µ —Å–æ–∑–¥–∞–Ω–∏–µ!" ‚Äî –∏ —Å–Ω–æ–≤–∞ –ø—Ä–µ–¥—Å—Ç–∞–≤–∏–ª —Å–µ–±–µ –µ–≥–æ —É–ª—ã–±–∫—É, –≤–∑–≥–ª—è–¥, –

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



. 
.  –û!  –¢–µ–ø–µ—Ä—å —è –ø–æ–Ω–∏–º–∞—é, –∑–∞—á–µ–º –º–Ω–µ –Ω—É–∂–µ–Ω —ç—Ç–æ—Ç –Ω–æ–≤—ã–π –º–∏—Ä, –∫–∞–∫ —Ç–æ–ª—å–∫–æ –º–æ–∂–Ω–æ –µ–≥–æ –ø–æ–∫–∏–Ω—É—Ç—å?  –¢—ã –≥–æ–≤–æ—Ä–∏—à—å –æ –Ω–æ–≤–æ–º –º–∏—Ä–µ. [–ì]
.  –ò, —á—É–≤—Å—Ç–≤—É—è —Å–µ–±—è –æ–±–º–∞–Ω—É—Ç—ã–º –∏ –æ—Å–∫–æ—Ä–±–ª–µ–Ω–Ω—ã–º —ç—Ç–∏–º, –≤ —Ç–æ –∂–µ –≤—Ä–µ–º—è, –±—ã–ª —É–≤–µ—Ä–µ–Ω, —á—Ç–æ –ø–æ–ª–æ–∂–µ–Ω–∏–µ –µ–≥–æ –±—É–¥–µ—Ç —Ç–∞–∫ –∂–µ –±–ª–∞–≥–æ–ª–µ–ø–Ω–æ –∏ –ª–µ–≥–∫–æ, –∫–∞–∫ –∏ –≤—Å–µ–≥–¥–∞. 
.  –û–Ω–∏ –±—ã–ª–∏, –æ—á–µ–Ω—å –º–∏–ª—ã–µ –ª—é–¥–∏, –∏, –Ω–∞–≤–µ—Ä–Ω–æ–µ, —Å–∞–º—ã–µ —Å—á–∞—Å—Ç–ª–∏–≤—ã–µ, —á–µ—Å—Ç–Ω—ã–µ –∏ –≤—Å–µ—Å–∏–ª—å–Ω—ã–µ –ª—é–¥–∏ –Ω–∞ —Å–≤–µ—Ç–µ, –∫–æ—Ç–æ—Ä—ã–µ —Ç–∞–∫ –Ω—É–∂–¥–∞—é—Ç—Å—è –∏ —Ä–∞–¥—ã.  –≠—Ç–∏ –±–ª–∞–≥–æ—Ä–æ–¥–Ω—ã–µ –ª—é–¥–∏ —Ö–æ—Ç–µ–ª–∏ –±—ã, —á—Ç–æ–±—ã –≤—Å–µ –±—ã–ª–æ –æ—Ç–ª–∏—á–Ω–æ, —á—Ç–æ–±—ã –≤—Å–µ –±—ã–ª–æ –∫—Ä–∞—Å–∏–≤–æ, —á—Ç–æ–±—ã –≤—Å–µ –ª—é–±–∏–ª–∏ –∏ –±—ã–ª–∏ –ª—é–±–∏–º—ã.  –ò –≤—Å–µ —ç—Ç–æ, –∞ —Ç–∞–∫–∂–µ –≤—Å–µ —ç—Ç–æ –¥–ª—è —Ç–æ–≥–æ, —á—Ç–æ–±—ã


Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ó–¥–µ—Å—å –Ω–∞–¥–æ —Ç–æ–ª—å–∫–æ –∑–∞–º–µ—Ç–∏—Ç—å, —á—Ç–æ –∑–¥–µ—Å—å –Ω–µ—Ç –Ω–∏–∫–∞–∫–æ–π –Ω–µ–æ–±—Ö–æ–¥–∏–º–æ—Å—Ç–∏ –≤ —Ç–æ–º, —á—Ç–æ–±—ã –∫–∞–∫ –º–æ–∂–Ω–æ —Å–∫–æ—Ä–µ–µ, –≤ –æ–¥–Ω—É —Å—Ç–æ—Ä–æ–Ω—É —Å–º–æ—Ç—Ä–µ—Ç—å, –∫–∞–∫ –ø—Ä–∏–µ–¥–µ–º, —Ç–∞–∫ –∏ –±—É–¥–µ–º.  –ê –ø—Ä–∏–µ–¥–µ–º –º—ã —Ç–æ–≥–¥–∞, –ø–æ—Ç–æ–º—É —á—Ç–æ –≤—Å–µ –±—É–¥–µ—Ç –≥–æ—Ç–æ–≤–æ.  –í—Å–µ –±—É–¥–µ—Ç –≥–æ—Ç–æ–≤–æ –∏ –ø–æ –∑–∞–∫–æ–Ω–∞–º, –∏ –ø–æ –∑–∞–∫–æ–Ω—É.  –ê –≥–ª–∞–≤–Ω–æ–µ, —á—Ç–æ –±—É–¥–µ—Ç —Ç–æ –∂–µ —Å–∞–º–æ–µ, —á—Ç–æ –∏
.  –ö–∞–∫ —Ç–æ–ª—å–∫–æ —Å –Ω–µ—é –ø–æ–∑–Ω–∞–∫–æ–º–∏–ª—Å—è, –µ–π —Å—Ç–∞–ª–æ –ª–µ–≥—á–µ, —Ç–∞–∫ –∏ –ø–æ–º–æ–ª–æ–¥–µ–ª–∞.  –ö –æ—Å–µ–Ω–∏, –Ω–∞–∫–æ–Ω–µ—Ü, —Å—Ç–∞–ª–æ —Ç–∞–∫ –∂–µ.  –ú—É–∂ —É–µ–∑–∂–∞–ª –≤ –ú–æ—Å–∫–≤—É, –∞ –¥–æ—á—å, —á—Ç–æ–±—ã –Ω–µ –µ–∑–¥–∏—Ç—å –∫ —Ç–µ—Ç–∫–µ, –æ—Å—Ç–∞–≤–∏–ª–∞ –µ–≥–æ —Å –∂–µ–Ω–æ–π –∏, –æ—Å—Ç–∞–≤—à–∏—Å—å –æ–¥–Ω–∞, –æ–ø—è—Ç—å –Ω–µ –≤—ã—à–ª–∞ –Ω–∞ —Ä–∞–±–æ—Ç—É. 
.  –ö–∞–∫ –∏ –¥—Ä—É–≥–∏–µ, —ç—Ç–∏, –∫ –±–æ–ª—å—à–æ–º—É —É–¥–æ–≤–æ–ª—å—Å—Ç–≤–∏—é –∏ –ø—Ä–∏—Å–∫–æ—Ä–±–Ω–æ—Å—Ç–∏, 

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ò –º—ã, –≤—Å–µ —Ä—É—Å—Å–∫–∏–µ, –Ω–µ –º–æ–≥–ª–∏ –æ—Å—Ç–∞–≤–∞—Ç—å—Å—è —Ä–∞–≤–Ω–æ–¥—É—à–Ω—ã–º–∏ –∏ –Ω–µ –º–æ–∂–µ–º, —á—Ç–æ–±—ã —Ç–µ, –∫–æ—Ç–æ—Ä—ã–µ –Ω–µ –º–æ–≥–ª–∏ –±—ã—Ç—å –¥–ª—è –Ω–∞—Å –Ω–µ–ø—Ä–∏—è—Ç–Ω—ã, –º—ã –Ω–µ –º–æ–∂–µ–º –Ω–µ —á—É–≤—Å—Ç–≤–æ–≤–∞—Ç—å —Å–≤–æ–µ–π —á–µ—Å—Ç–∏ –∏ –Ω–µ –¥–æ–ª–∂–Ω—ã –±—ã—Ç—å –¥–æ–ª–∂–Ω—ã –ø—Ä–æ—â–µ–Ω—ã, –∫–æ–≥–¥–∞ –º—ã —Ç–∞–∫ –º–∞–ª–æ —Å–¥–µ–ª–∞–ª–∏ –¥–ª—è –Ω–µ–µ. 
.  –ù–æ –¥–∞–∂–µ –µ—Å–ª–∏ –≤—ã —Å–µ–π—á–∞—Å –ø–æ–µ–¥–µ—Ç–µ –≤ –ª–µ—Å, –Ω–µ –Ω–∞–¥–æ –¥—É–º–∞—Ç—å, –∫–∞–∫ –≤–∞–º –Ω–∞–¥–æ –µ—Ö–∞—Ç—å.  –í–æ-–ø–µ—Ä–≤—ã—Ö, –≤—ã –Ω–µ –±—É–¥–µ—Ç–µ —Ç–∞–∫ –ª–µ–≥–∫–æ –∏ —Ö–æ—Ä–æ—à–æ –≥–æ–≤–æ—Ä–∏—Ç—å, –≤–æ-–≤—Ç–æ—Ä—ã—Ö, –≤—ã –Ω–µ –±—É–¥–µ—Ç–µ —Ç–∞–∫ –º–Ω–æ–≥–æ –¥—É–º–∞—Ç—å –∏ —Ç–∞–∫ —Å–∫—É—á–Ω–æ –≥–æ–≤–æ—Ä–∏—Ç—å, –∫–∞–∫ –≤—ã.  –ù–æ, –≤–æ-–ø–µ—Ä–≤—ã—Ö, –≤—ã –±—É–¥–µ—Ç–µ –Ω–µ —Ç–∞–∫ —Ö–æ—Ä–æ—à–æ –¥—É–º–∞—Ç—å –∏ –Ω–µ —Ç–∞–∫
.  –û–Ω, –∫–∞–∫ –∏ –≤—Å—è–∫–∏–π —á–µ–ª–æ–≤–µ–∫, –æ—á–µ–Ω—å –ø–æ—Ö–æ–∂ –Ω–∞ —á–µ–ª–æ–≤–µ–∫–∞.–û–Ω –Ω–µ –º–æ–∂–µ—Ç –Ω–∏ –¥–≤–∏–≥–∞—Ç—å—Å—è, –Ω–∏ –±–µ

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}





Saving model checkpoint to ./checkpoint-500
Configuration saved in ./checkpoint-500/config.json
Configuration saved in ./checkpoint-500/generation_config.json


.  –ù–æ, –∫–æ–≥–¥–∞ –æ–Ω–∞ –±—ã–ª–∞ –∑–¥–æ—Ä–æ–≤–∞ –∏ —Å—á–∞—Å—Ç–ª–∏–≤–∞, –∏ –µ–π –Ω–µ –Ω–∞–¥–æ –±—ã–ª–æ –Ω–∏ –¥—É–º–∞—Ç—å –æ —á–µ–º-—Ç–æ, –Ω–∏ –¥—É–º–∞—Ç—å, –∞ –±—ã–ª–æ –æ—á–µ–Ω—å –≤–∞–∂–Ω–æ –æ–¥–Ω–æ ‚Äì —á—Ç–æ–±—ã —ç—Ç–æ –±—ã–ª–æ —Ç–æ —Å–∞–º–æ–µ —Å–∞–º–æ–µ —Å—á–∞—Å—Ç—å–µ, –∫–æ—Ç–æ—Ä–æ–µ –æ–Ω–∞ –∂–µ–ª–∞–ª–∞ —Å–µ–±–µ –≤—Å—é –∂–∏–∑–Ω—å. 
.  –ò, –Ω–∞–∫–æ–Ω–µ—Ü, –≤¬†1853¬†–≥–æ–¥—É –ø–æ –≤–æ–∑–≤—Ä–∞—â–µ–Ω–∏–∏ –¥–æ–º–æ–π –≤ –ü–µ—Ç–µ—Ä–±—É—Ä–≥ –±—ã–ª –≤—ã–∑–≤–∞–Ω –ø–æ¬†—Å–ª–µ–¥—É –Ω–∞¬†–¥–µ–ª–æ.
. 
.  –í —Ç–µ—á–µ–Ω–∏–µ –ø—è—Ç–∏ –º–∏–Ω—É—Ç –ø—Ä–∏ –ø–æ–ª–Ω–æ–π —Ç–µ–º–Ω–æ—Ç–µ –∏ –æ—Å–≤–µ—â–µ–Ω–Ω–æ—Å—Ç–∏, –Ω–∞ –≤—Å–µ—Ö —É–≥–ª–∞—Ö –±—ã–ª–∏ —Ä–∞—Å—Å—Ç–∞–≤–ª–µ–Ω—ã –æ—Ä—É–¥–∏—è –∏ –±–æ–º–±—ã, –∏, –Ω–∞–∫–æ–Ω–µ—Ü, –Ω–∞ –º–µ—Å—Ç–µ, –≥–¥–µ –æ–Ω–∏ –¥–æ–ª–∂–Ω—ã –±—ã–ª–∏ –±—ã—Ç—å, –±—ã–ª –Ω–∞–π–¥–µ–Ω –Ω–∞—Å—Ç–æ—è—â–∏–π —Ç—Ä—É–ø.  –ù–µ —Å—á–∏—Ç–∞—è –Ω–µ—Å–∫–æ–ª—å–∫–∏—Ö —Ç—Ä—É–ø–æ–≤, –≤ —Ç–æ–º —á–∏—Å–ª–µ –æ–¥–Ω–æ–≥–æ –º–µ—Ä—Ç–≤–æ–≥–æ, –≤ —ç—Ç–æ–º —Ç—Ä—É–ø–µ –±—ã–ª–∏ —Ç–æ–ª—å–∫–æ –¥–≤–æ–µ —Ä—É—Å—Å–∫–∏—Ö –∏ —Ç

Model weights saved in ./checkpoint-500/pytorch_model.bin
Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ò –º—ã —Å –∂–µ–Ω–æ–π –ø–æ—à–ª–∏ –Ω–∞ —É–∂–∏–Ω, –∫–∞–∫ –≤–¥—Ä—É–≥ —Å–ª—ã—à–∏–º –≤ —Å–µ–Ω—è—Ö –∫—Ä–∏–∫: 
.  –ù–æ –Ω–µ –≤—Å–µ –æ–Ω–∏ –±—ã–ª–∏ –æ–¥–∏–Ω–∞–∫–æ–≤–æ —Ö–æ—Ä–æ—à–∏; –∫–∞–∫ –≤ –ø–µ—Ä–≤–æ–º —Å–ª—É—á–∞–µ, —Ç–∞–∫ –∏ –≤–æ –≤—Ç–æ—Ä–æ–º ‚Äî –Ω–∏ –æ–¥–Ω–∞ –ø–∞—Ä—Ç–∏—è, –Ω–∏ –æ–¥–∏–Ω –∏–≥—Ä–æ–∫ –Ω–µ –±—ã–ª, –∫—Ä–æ–º–µ –Ω–µ–≥–æ —Å–∞–º–æ–≥–æ, –æ—á–µ–Ω—å, –∫–∞–∂–µ—Ç—Å—è, –ª—É—á—à–∏–º –∏–∑ —Ç–µ—Ö, –∫–æ—Ç–æ—Ä—ã–µ –Ω–∞ –ø–µ—Ä–≤—ã–π —Ä–∞–∑ –¥–µ–ª–∞–ª–∏ —ç—Ç–æ –≤ –ø–µ—Ä–≤—ã–µ –≥–æ–¥—ã —Å–≤–æ–µ–π –∏–≥—Ä—ã.  –ù–æ –Ω–∞ —ç—Ç–æ—Ç —Å—á–µ—Ç –Ω–µ –±—ã–ª–æ –¥—Ä—É–≥–æ–≥–æ –º–Ω–µ–Ω–∏—è, –∫—Ä–æ–º–µ –æ–¥–Ω–æ–≥–æ: –æ—á–µ–Ω—å —Ç—Ä—É–¥–Ω–æ –≤
.  –≠—Ç–æ –±—ã–ª–æ –±—ã —Ç–∞–∫. 
.  –í –Ω–∞—á–∞–ª–µ —Å–≤–æ–µ–≥–æ –ø—É—Ç–∏ (–ø–æ—Å–ª–µ –¥–æ–ª–≥–æ–≥–æ —Ä–∞–∑–º—ã—à–ª–µ–Ω–∏—è) –æ–Ω –ø–æ–Ω–µ–≤–æ–ª—å–Ω–æ —É–∑–Ω–∞–µ—Ç –æ —Ç–æ–º, —á—Ç–æ –∏ –∫–∞–∫ –Ω–∞–¥–æ –¥—É–º–∞—Ç—å.


Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –í –Ω–∞—á–∞–ª–µ –ª–µ—Ç–∞ –æ–Ω –≤–µ—Ä–Ω—É–ª—Å—è –≤ —Å–≤–æ–∏ —Ä–æ–¥–Ω—ã–µ –º–µ—Å—Ç–∞, –æ—Å—Ç–∞–≤–∏–≤ –º–∞—Ç—å –∏ —Å–µ—Å—Ç—Ä—É. 
.  –ò —Ç–æ, —á—Ç–æ –æ–Ω —Ö–æ—Ç–µ–ª —Å–∫–∞–∑–∞—Ç—å, –±—ã–ª–æ –ø—Ä–∞–≤–¥–æ–π, –Ω–æ –¥–ª—è –º–µ–Ω—è —Ç–∞–∫ –∏ –æ—Å—Ç–∞–ª–æ—Å—å —Ç–∞–π–Ω–æ–π, —è –Ω–µ –∑–Ω–∞–ª —Ç–æ–≥–¥–∞, —á—Ç–æ –±—ã–ª–æ –±—ã –ª—É—á—à–µ, –µ—Å–ª–∏ –±—ã –æ–Ω —Å–∫–∞–∑–∞–ª, —á—Ç–æ —ç—Ç–æ —Ö–æ—Ä–æ—à–æ, —á—Ç–æ –æ–Ω –Ω–µ –ª—é–±–∏—Ç –º–µ–Ω—è, –Ω–æ, –≤–∏–¥–∏–º–æ, –¥—É–º–∞–ª, —á—Ç–æ –Ω–µ –ø–æ–Ω–∏–º–∞–µ—Ç, –ø–æ—Ç–æ–º—É —á—Ç–æ —è –ª—é–±–ª—é –µ–≥–æ.
.  –í —ç—Ç–∏—Ö —Å–ª–æ–≤–∞—Ö, —Å –∫–æ—Ç–æ—Ä—ã–º –∏ –≤ –ø–µ—Ä–≤—ã–π —Ä–∞–∑ –≤ –ø–µ—Ä–≤—ã–π —Ä–∞–∑ –≤ –µ–≥–æ –∂–∏–∑–Ω–∏, –æ–Ω –±—ã–ª –Ω–µ —Ç–æ–ª—å–∫–æ –ø–æ—Ä–∞–∂–µ–Ω —Å–ª–æ–≤–∞–º–∏, –Ω–æ –∏ —Å–æ–≤–µ—Ä—à–µ–Ω–Ω–æ —Å–µ—Ä—å–µ–∑–Ω–æ —É–¥–∏–≤–ª–µ–Ω —Ç–æ–º—É, –∫–∞–∫ —Ç–æ—á–Ω–æ —Ç–∞–∫ –∂–µ –æ–Ω –ø–æ–Ω–∏–º–∞–ª –∏—Ö –∏ –∑–Ω–∞–ª, –≤ –æ—Å–æ–±–µ–Ω–Ω–æ—Å—Ç–∏, –µ—Å–ª–∏ –æ–Ω –≤–µ—Ä–∏–ª, —á—Ç–æ –∏–º —É–¥–∞—Å—Ç—Å—è –≤—Å–µ —ç—Ç–æ —Å–∫–∞–∑–∞—Ç—å.  –û–Ω —Ç–æ–ª—å–∫–æ —Ç–µ–ø–µ—Ä—å –ø–æ–Ω—è



Training completed. Do not forget to share your model on huggingface.co/models =)


Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ü—Ä–∏ —ç—Ç–æ–º –Ω–µ–æ–±—Ö–æ–¥–∏–º–æ —É—á–∏—Ç—ã–≤–∞—Ç—å, —á—Ç–æ —É –∫–∞–∂–¥–æ–≥–æ —á–µ–ª–æ–≤–µ–∫–∞ –±—ã–≤–∞—é—Ç —Å–≤–æ–∏ –∏–Ω–¥–∏–≤–∏–¥—É–∞–ª—å–Ω—ã–µ –ø—Ä–∏—á–∏–Ω—ã (–≤—ã—Å–æ–∫–∞—è –∏–ª–∏ –º–∞–ª–µ–Ω—å–∫–∞—è —Ç–µ–º–ø–µ—Ä–∞—Ç—É—Ä–∞ –≤–æ–∑–¥—É—Ö–∞, –≥–æ–ª–æ–≤–Ω–∞—è –±–æ–ª—å, –ø–ª–æ—Ö–æ–µ —Å–∞–º–æ—á—É–≤—Å—Ç–≤–∏–µ). 
.  –° –ø–æ–º–æ—â—å—é —ç—Ç–∏—Ö —Å–æ–≤–µ—Ç–æ–≤ –≤—ã –Ω–µ —Ç–æ–ª—å–∫–æ –∏–∑–±–∞–≤–∏—Ç–µ—Å—å –æ—Ç –±–æ–ª–∏ –≤ –∂–µ–ª—É–¥–∫–µ –∏ –ø–æ–¥–Ω–∏–º–∏—Ç–µ –µ–≥–æ –∞–ø–ø–µ—Ç–∏—Ç, –Ω–æ –∏ –±—É–¥–µ—Ç–µ –∑–Ω–∞—Ç—å, –∫–∞–∫ –≤ –¥–æ–º–∞—à–Ω–∏—Ö —É—Å–ª–æ–≤–∏—è—Ö —É—Å—Ç—Ä–∞–Ω–∏—Ç—å —ç—Ç—É –Ω–µ–ø—Ä–∏—è—Ç–Ω—É—é –ø—Ä–æ–±–ª–µ–º—É. 
. 
.  –û–Ω–∞ —Å–∏–¥–µ–ª–∞ –≤ –≥–ª—É–±–æ–∫–æ–º –∫—Ä–µ—Å–ª–µ, –ª–∏—Ü–æ–º –∫ –ª–∏—Ü—É —Å –ü–µ—Ç—Ä–æ–º.  –ü–æ —Ç–æ–º—É, –∫–∞–∫ –æ–Ω–∞ —Å—Ç–∞—Ä–∞–ª–∞—Å—å –ø–æ–¥–∞–≤–∏—Ç—å —Å—Ç—Ä–∞—Ö, –æ–Ω –∑–∞–º–µ—Ç–∏–ª, —á—Ç–æ –æ–Ω–∞ –ø—Ä–∏—Å—Ç–∞–ª—å–Ω–æ, –≤–Ω–∏–º–∞—Ç–µ–ª—å–Ω–æ —Å–ª–µ–¥–∏—Ç –∑–∞ –∫–∞–∂–¥—ã–º –µ–≥–æ —Å–ª–æ–≤–æ–º.  –û–Ω–∞ –º–æ–ª—á–∞–ª–∞.  –û–Ω, –≤ —Ç–æ–º –∂–µ –ø–æ–ª–æ–∂–µ–Ω–∏–∏

Saving model checkpoint to .
Configuration saved in ./config.json
Configuration saved in ./generation_config.json
Model weights saved in ./pytorch_model.bin


In [14]:
# Sample continuations of the Russian prompt "В 2024 году" ("In 2024") from the model
# currently bound to the module-level `model`/`tokenizer` (print_generations reads them
# as globals). max_len raises the generation length cap from the default 70 to 200;
# n_samples stays at its default.
print_generations(prefix="В 2024 году", max_len=200)

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



–í 2024 –≥–æ–¥—É –≤ –ü–µ—Ç–µ—Ä–±—É—Ä–≥–µ –≤ –ü–µ—Ç–µ—Ä–±—É—Ä–≥–µ –±—ã–ª –ø–æ—Å—Ç—Ä–æ–µ–Ω –Ω–æ–≤—ã–π —Ç–∏–ø–æ–≤–æ–π –¥–æ–º –¥–ª—è –ø–µ—Ç–µ—Ä–±—É—Ä–≥—Å–∫–æ–≥–æ –∫—É–ø–µ—á–µ—Å—Ç–≤–∞. –ö–Ω—è–∑—å –î–º–∏—Ç—Ä–∏–π, –Ω–µ –¥–æ–∂–¥–∞–≤—à–∏—Å—å —Ä–∞–∑—Ä–µ—à–µ–Ω–∏—è –≤–æ–π—Ç–∏ –≤ –Ω–µ–≥–æ, –≤–æ—à–µ–ª —Å –∂–µ–Ω–æ–π –≤ —Å–≤–æ—é —Å–ø–∞–ª—å–Ω—é –∏ –ø—Ä–∏ —É—á–∞—Å—Ç–∏–∏ —Å—É–ø—Ä—É–≥–∏. –í –Ω–µ–π –≤ –∫–æ–º–Ω–∞—Ç–µ –≤ —ç—Ç—É –º–∏–Ω—É—Ç—É –±—ã–ª –∏ —Å—ã–Ω –∫–Ω—è–∑—è –î–º–∏—Ç—Ä–∏—è, –∫–æ—Ç–æ—Ä—ã–π –±—ã–ª –≤ —ç—Ç–æ –≤—Ä–µ–º—è –æ–¥–∏–Ω –∏ —Å –º–∞—Ç–µ—Ä—å—é –∏ —Å –¥—è–¥–µ–π –∏, –≤–º–µ—Å—Ç–µ —Å —Å–≤–æ–µ—é –¥–æ—á–µ—Ä—å–º–∏, –≤ —Å–ø–∞–ª—å–Ω–µ –≤ –∫–æ–º–Ω–∞—Ç–µ –∫–Ω—è–∂–Ω—ã. –ö–Ω—è–∑—å –î–º–∏—Ç—Ä–∏–π, –æ—Å—Ç–∞–≤—à–∏—Å—å –≤ –æ–¥–∏–Ω–æ—á–µ—Å—Ç–≤–µ –≤ –∫–æ–º–Ω–∞—Ç–µ –∏ –Ω–µ —Å–º–µ—è –≤–æ–π—Ç–∏ –≤ –Ω–µ–µ, —Å —Å–≤–æ–µ–π –∂–µ–Ω–æ–π, –≤ —ç—Ç–æ –≤—Ä–µ–º—è –Ω–∞—Ö–æ–¥–∏–ª—Å—è –≤ –∫–æ–º–Ω–∞—Ç–µ –∫–Ω—è–∂–Ω—ã.
–í 2024 –≥–æ–¥—É –†–æ—Å—Å–∏—è –ø–µ—Ä–µ–∂–∏–ª–∞ –ø–µ—Ä–≤—É—é –í–µ–ª–∏–∫—É—é –≤–æ–π–Ω—É, –∫–æ–≥–¥–∞ —Ä—É—Å—Å–∫–∏–π —Ñ–ª–

# Собрание сочинений Ленина

In [15]:
# Reload the pretrained checkpoint (get_ru_model's default) so this experiment starts
# from freshly loaded weights. `model` and `tokenizer` are rebound at module level
# because print_generations reads them as globals.
model, tokenizer = get_ru_model()
# NOTE(review): freeze_layers is defined outside this cell — presumably it disables
# gradient updates for part of the 12-block network, with 6 as the layer count/cutoff;
# confirm against its definition.
freeze_layers(model, 6)
# Fine-tune on the corpus at LENIN_PATH (a path constant defined elsewhere in the notebook).
# NOTE(review): the training schedule and checkpointing live inside finetune and are not
# visible from here — confirm there before changing anything.
finetune(model, tokenizer, LENIN_PATH)

loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--sberbank-ai--rugpt3small_based_on_gpt2/snapshots/f2f7c585b05a16726efe8974586e10b4d5939082/config.json
Model config GPT2Config {
  "_name_or_path": "sberbank-ai/rugpt3small_based_on_gpt2",
  "activation_function": "gelu_new",
  "architectures": [
    "GPT2LMHeadModel"
  ],
  "attn_pdrop": 0.1,
  "bos_token_id": 50256,
  "embd_pdrop": 0.1,
  "eos_token_id": 50256,
  "gradient_checkpointing": false,
  "initializer_range": 0.02,
  "layer_norm_epsilon": 1e-05,
  "model_type": "gpt2",
  "n_ctx": 2048,
  "n_embd": 768,
  "n_head": 12,
  "n_inner": null,
  "n_layer": 12,
  "n_positions": 2048,
  "reorder_and_upcast_attn": false,
  "resid_pdrop": 0.1,
  "scale_attn_by_inverse_layer_idx": false,
  "scale_attn_weights": true,
  "summary_activation": null,
  "summary_first_dropout": 0.1,
  "summary_proj_to_labels": true,
  "summary_type": "cls_index",
  "summary_use_proj": true,
  "transformers_version": "4.2

SETTING N_EPOCHS TO  0.14183550978504744


Loading features from cached file /content/gdrive/MyDrive/datasets/cached_lm_GPT2TokenizerFast_256_lenin.txt [took 1.256 s]
PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
***** Running training *****
  Num examples = 32598
  Num Epochs = 1
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 578
  Number of trainable parameters = 42528768


Step,Training Loss
50,3.3899
100,3.2751
150,3.2767
200,3.2754
250,3.2126
300,3.197
350,3.1459
400,3.146
450,3.2098
500,3.1729


Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –û–Ω, –ø–æ —Å—É—Ç–∏, –±–æ—Ä–µ—Ç—Å—è —Å "–≤—Ä–∞–≥–∞–º–∏" –∏ –ø—Ä–æ—Ç–∏–≤–æ–ø–æ–ª–∞–≥–∞–ª–Ω–∏–∫–∞–º–∏. (–°–º–µ—Ö. ).  –û–Ω –ø—Ä–∏–∑—ã–≤–∞–µ—Ç –∫ —Ä–µ—à–∏—Ç–µ–ª—å–Ω–æ–π –º–µ—Ä–µ —Å–æ—Ü–∏–∞–ª—å–Ω–æ–π –ø–æ–ª–∏—Ç–∏–∫–∏ –∫ —É–∫—Ä–µ–ø–ª–µ–Ω–∏—é –º–µ—Å—Ç–Ω–æ–≥–æ —Å–∞–º–æ—É–ø—Ä–∞–≤–ª–µ–Ω–∏—è.  –≠—Ç–æ –±—ã–ª –æ–¥–∏–Ω –∏–∑ —Ç–µ—Ö —É—Ä–æ–∫–æ–≤, –∫–æ—Ç–æ—Ä—ã–µ –Ω–µ —Ä–∞–∑ –±—ã–ª–∏ –ø–æ–¥–¥–µ—Ä–Ω—É—Ç—ã.  –ò —Å–µ–≥–æ–¥–Ω—è, –≤ —É—Å–ª–æ–≤–∏—è—Ö –º–∏—Ä–∞ –∏ –º–∏—Ä–∞, –º—ã –¥–æ–ª–∂–Ω—ã –ø–æ–∫–∞–∑–∞—Ç—å,
.  –í. –ò. –õ–µ–Ω–∏–Ω –≤ —Å–≤–æ–µ–π ¬´–≠–∫–æ–Ω–æ–º–∏—á–µ—Å–∫–æ–π –ø—Ä–æ–≥—Ä–∞–º–º–µ¬ª, –Ω–∞–ø–∏—Å–∞–Ω–Ω–æ–π –≤ 1913 –≥–æ–¥—É, –æ—Ç–º–µ—á–∞–µ—Ç: "–ï—Å–ª–∏ –º—ã –Ω–µ –º–æ–∂–µ–º –ø—Ä–∏–Ω—è—Ç—å —Ç–∞–∫–æ–π –º–µ—Ç–æ–¥, –∫–∞–∫ –ª–∏–∫–≤–∏–¥–∞—Ü–∏—è –≤–æ–π–Ω—ã, —Ç–æ –Ω—É–∂–Ω–æ –æ—Ç–∫–∞–∑–∞—Ç—å—Å—è –æ—Ç —ç—Ç–æ–≥–æ –º–µ—Ç–æ–¥–∞ –≤–æ –≤—Å–µ–π –µ–≥–æ –ø–æ–ª–Ω–æ—Ç–µ.  –í –†–æ—Å—Å–∏–∏, –≤ –æ—Å–æ–±–µ–Ω–Ω–æ—Å—Ç–∏, –≤ –æ–±–ª–∞—Å—Ç–∏ –≤–æ–µ–Ω–Ω–æ–≥–æ —Å—Ç—Ä–æ–∏—Ç–µ–ª—å—Å—Ç–≤–∞ –∏ –ø—Ä–æ–º—ã—à–ª–µ–Ω–Ω–æ—Å—Ç–∏, –Ω–µ –º–æ–∂

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –í –∫–∞—á–µ—Å—Ç–≤–µ –æ—Å–Ω–æ–≤—ã –¥–ª—è —ç—Ç–æ–≥–æ –ø—Ä–æ–µ–∫—Ç–∞ –≤—ã—Å—Ç—É–ø–∞–µ—Ç –ø—Ä–æ–µ–∫—Ç "–°–æ—Ü–∏–∞–ª–∏–∑–∞—Ü–∏—è –º–æ–ª–æ–¥–µ–∂–∏".  –í —ç—Ç–æ–π —Ä–∞–±–æ—Ç–µ –º—ã –≤—ã—Å—Ç—É–ø–∞–µ–º –Ω–µ —Ç–æ–ª—å–∫–æ –∫–∞–∫ —Ä—É–∫–æ–≤–æ–¥—Å—Ç–≤–æ, –Ω–æ –∏ –∫–∞–∫ –ø–æ—Å—Ä–µ–¥–Ω–∏–∫ –≤ —Ä–µ–∞–ª–∏–∑–∞—Ü–∏–∏ –ø—Ä–æ–µ–∫—Ç–∞; —ç—Ç–æ –∏ –µ—Å—Ç—å –≤–∞–∂–Ω–µ–π—à–∏–π –∞—Å–ø–µ–∫—Ç —ç—Ç–æ–π —Ä–∞–±–æ—Ç—ã, —ç—Ç–æ –∏–º–µ–Ω–Ω–æ —Ç–∞ –æ—Å–Ω–æ–≤–Ω–∞—è –∑–∞–¥–∞—á–∞, –∫–æ—Ç–æ—Ä–æ–π –¥–æ–ª–∂–µ–Ω –∑–∞–Ω–∏–º–∞—Ç—å—Å—è, —Å –æ–¥–Ω–æ–π —Å—Ç–æ—Ä–æ–Ω—ã, –ú–∞—Ä–∫—Å, —Å –¥—Ä—É–≥–æ–π —Å—Ç–æ—Ä–æ–Ω—ã, –≠–Ω–≥–µ–ª—å—Å,
.  –ò –µ—Å–ª–∏ –±—ã –Ω–µ —ç—Ç–∏ ¬´–∑–Ω–∞–º–µ–Ω–∏—Ç–æ—Å—Ç–∏¬ª –∏ ¬´–∏–∑—è—â–Ω—ã–µ¬ª –∏—Ö ¬´–ø–æ–∑—ã¬ª,¬†‚Äì –µ—Å–ª–∏ –±—ã –Ω–µ –∏—Ö ¬´–ø–æ–∑—ã¬ª,¬†‚Äì –µ—Å–ª–∏ –±—ã –Ω–µ —ç—Ç–∏ ¬´–∑–Ω–∞–º–µ–Ω–∏—Ç–æ—Å—Ç–∏¬ª,¬†‚Äì –µ—Å–ª–∏ –±—ã –Ω–µ —ç—Ç–∏ ¬´–∑–Ω–∞–º–µ–Ω–∏—Ç–æ—Å—Ç–∏¬ª¬†‚Äì —Ç–æ –≤ –†–æ—Å—Å–∏–∏ –Ω–µ –æ—Å—Ç–∞–ª–æ—Å—å –±—ã –∏ —Å–ª–µ–¥–∞ –±—ã ¬´–±–ª–µ—Å—Ç—è—â–µ–π
.  –ù–∞ —ç—Ç–∏ ¬´–¥–æ–±—Ä–æ¬ª –¥–æ–ª–∂–Ω—ã –æ–ø–∏—Ä–

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –û–Ω –≥–æ–≤–æ—Ä–∏–ª, —á—Ç–æ —ç—Ç–æ ‚Äì –≤ –æ—Å–Ω–æ–≤–Ω–æ–º –ø–æ–ª–∏—Ç–∏—á–µ—Å–∫–∏–µ –ª–æ–∑—É–Ω–≥–∏: "–ù–∞—Ä–æ–¥–Ω–∞—è —Ä–µ–≤–æ–ª—é—Ü–∏—è", "–¥–µ–º–æ–∫—Ä–∞—Ç–∏—è", –∏ –≤—Å–µ —ç—Ç–æ ‚Äì –Ω–∞ –æ—Å–Ω–æ–≤–µ —Å–æ–∑–Ω–∞—Ç–µ–ª—å–Ω—ã—Ö –ø—Ä–µ–¥—Å—Ç–∞–≤–ª–µ–Ω–∏–π.  –ò –Ω–µ —Ç–æ–ª—å–∫–æ —Å–æ–∑–Ω–∞—Ç–µ–ª—å–Ω—ã—Ö, –Ω–æ –∏ –∏–∑–º—ã—à–ª–µ–Ω–Ω—ã—Ö.  –ö –ø—Ä–∏–º–µ—Ä—É, –Ω–µ —Å—Ç–æ–∏—Ç –ø—É—Ç–∞—Ç—å –±–æ–ª—å—à–µ–≤–∏—Å—Ç—Å–∫—É—é –ø–ª–∞—Ç—Ñ–æ—Ä–º—É —Å –º–∞—Ä–∫—Å–∏—Å—Ç—Å–∫–æ-–ª–µ–Ω–∏–Ω—Å–∫–æ–π, –∏ –Ω–∞–æ–±–æ—Ä–æ—Ç, —ç—Ç–æ
.  –í—Å–µ —Ç—Ä–∏ –≤–∏–¥–∞ —Ä–∞–±–æ—á–∏—Ö —Ä–∞–±–æ—Ç –º–æ–≥—É—Ç –±—ã—Ç—å —Ä–∞—Å—Ü–µ–Ω–µ–Ω—ã –∫–∞–∫ —Ä–∞–∑–æ–≤–æ–µ –º–µ—Ä–æ–ø—Ä–∏—è—Ç–∏–µ.  –ü–æ—Å—Ç—Ä–æ—è—Ç –≤ –¥–µ–Ω—å –ø–æ –Ω–µ—Å–∫–æ–ª—å–∫–æ —Å–æ–æ—Ä—É–∂–µ–Ω–∏–π ‚Äì –∏ —Ç–æ –±–µ–∑ —Å–Ω–æ—Å–∞, –Ω–µ —Ä–∞–∑—Ä—É—à–∞—Ç –∏ –Ω–µ –∑–∞—Å—Ç–∞–≤—è—Ç —Å–Ω–µ—Å—Ç–∏ –Ω–µ—Å–∫–æ–ª—å–∫–æ –¥–µ—Å—è—Ç–∫–æ–≤ –¥–æ–º–æ–≤, –Ω–µ –ø–æ–¥–æ—Ä–≤—É—Ç –Ω–∞—Å–µ–ª–µ–Ω–∏–µ. 
.  –ü–æ–¥—Ä–∞–∑—É–º–µ–≤–∞–µ—Ç—Å—è —Ç–∞–∫–∂–µ –∏ –≤ —Ç–æ–º, —á—Ç–æ –º—ã –¥–æ–ª–∂–Ω—ã —É–∫–∞–∑–∞—Ç—

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ü. –ì. –≠–Ω–≥–µ–ª—å—Å, –í. –ò. –õ–µ–Ω–∏–Ω, –°–æ—á–∏–Ω–µ–Ω–∏—è.  –¢. I, –∏–∑–¥. —Ç–∏–ø. –ø–∞—Ä—Ç–∏–∏, —Å—Ç—Ä. 322‚Äì323. 
.  –í—Å–µ –æ–Ω–∏ –±—ã–ª–∏ "–Ω–µ –Ω–∞ —à—É—Ç–∫—É" –∑–∞–∏–≥—Ä—ã–≤–∞—é—Ç —Å –ø—Ä–µ–¥—Å—Ç–∞–≤–∏—Ç–µ–ª—è–º–∏ —Ä–∞–±–æ—á–∏—Ö, –ø—Ä–∏—É—á–∞—é—Ç –∏—Ö –∫ —Ç–æ–º—É, —á—Ç–æ —Ä–∞–±–æ—á–∏–µ —è–≤–ª—è—é—Ç—Å—è —Ö–æ–∑—è–µ–≤–∞–º–∏ –≤ –º–∏—Ä–µ, —á—Ç–æ —Ä–∞–±–æ—á–∏–µ –¥–æ–ª–∂–Ω—ã –≤—Å–µ–≥–¥–∞ —Å—Ç–æ—è—Ç—å –Ω–∞ —Å–≤–æ–∏—Ö –æ–±—è–∑–∞–Ω–Ω–æ—Å—Ç—è—Ö, –∑–∞–±–æ—Ç–∏—Ç—å—Å—è –æ —Å–≤–æ–µ–º ¬´–≤—ã–ø–æ–ª–Ω–µ–Ω–∏–∏" –∏¬†–≤—ã–ø–æ–ª–Ω–µ–Ω–∏–∏ —Å–≤–æ–∏—Ö –æ–±—è–∑–∞–Ω–Ω–æ—Å—Ç–µ–π, —á—Ç–æ —Ä–∞–±–æ—á–∏–µ –≤—Å–µ–≥–¥–∞ –¥–æ–ª–∂–Ω—ã –≤—ã–ø–æ–ª–Ω—è—Ç—å —Å–≤–æ–π –¥–æ–ª–≥ –ø–µ—Ä–µ–¥ —Ä–∞–±–æ—á–∏–º–∏ –∏ –≤–æ –≤—Å—è–∫–æ–º
.  –í —ç—Ç–æ–º —Å–º—ã—Å–ª–µ –æ–Ω –±—ã–ª –≤–µ—Å—å–º–∞ –ø–æ—Ö–æ–∂ –Ω–∞ —Ç–µ—Ö –∫—Ä–µ—Å—Ç—å—è–Ω—Å–∫–∏—Ö –æ—Ä–∞—Ç–æ—Ä–æ–≤, –∫–æ—Ç–æ—Ä—ã–µ –≥–æ–≤–æ—Ä–∏–ª–∏ –∏ –æ —Ç–æ–º, –∫–∞–∫ –ø—Ä–∞–≤–∏–ª—å–Ω–æ —Å—Ç—Ä–æ–∏—Ç—å –ø–∞—Ä—Ç–∏—é –∏ –∫–∞–∫ –µ–µ –ø—Ä–∏–º–µ–Ω—è—Ç—å. 
.  –ò —Ç–æ–ª—å–∫–æ –Ω–∞ —Ç–æ –≤—Ä–µ–

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ò–∑ –∫–Ω–∏–≥–∏ ¬´–§–∏–ª–æ—Å–æ—Ñ–∏—è —Ä–µ–ª–∏–≥–∏–∏ –≤ –†–æ—Å—Å–∏–∏¬ª (–í.–ò. –õ–µ–Ω–∏–Ω.  –°–ø–±., 1909, —Å—Ç—Ä. 7). –í —ç—Ç–æ–º —Ç—Ä—É–¥–µ –æ–Ω–∞ –∏–∑–ª–∞–≥–∞–µ—Ç –≤–∑–≥–ª—è–¥—ã –§. –≠–Ω–≥–µ–ª—å—Å–∞ –Ω–∞ –≤–æ–ø—Ä–æ—Å –æ –ø—Ä–∏—á–∏–Ω–∞—Ö —Ä–µ–≤–æ–ª—é—Ü–∏–∏ –≤ –ì–µ—Ä–º–∞–Ω–∏–∏. –ó–∞—Ç–µ–º –∞–≤—Ç–æ—Ä –¥–æ–∫–∞–∑—ã–≤–∞–µ—Ç –Ω–µ–æ–±—Ö–æ–¥–∏–º–æ—Å—Ç—å –±–æ—Ä—å–±—ã –ø—Ä–æ–ª–µ—Ç–∞—Ä–∏–∞—Ç–∞ –ø—Ä–æ—Ç–∏–≤ ¬´—Ñ–µ–æ–¥–∞–ª–∏–∑–º–∞¬ª –∏ —Å –∫–ª–∞—Å—Å–∞–º–∏ –º–µ–ª–∫–æ–π –±—É—Ä–∂—É–∞–∑–∏–∏ –∏ –º–µ–ª–∫–æ–π
.  –í–æ –≤—Å—è–∫–æ–º —Å–ª—É—á–∞–µ, –º—ã –≤–∏–¥–∏–º, —á—Ç–æ –∏–º–µ–Ω–Ω–æ –∏–∑ —ç—Ç–æ–≥–æ –∏—Å—Ç–æ—á–Ω–∏–∫–∞ –∏—Å—Ö–æ–¥–∏—Ç —Å–∞–º–∞—è –±–æ–ª—å—à–∞—è –¥–æ–ª—è –ø—Ä–∞–≤–¥—ã. 
.  –Ø –∏ —Å–∞–º —Å—á–∏—Ç–∞—é —Å–µ–±—è "–∑–∞" –∏–º–µ–Ω–Ω–æ —Ç–æ, —á—Ç–æ –≤ –†–æ—Å—Å–∏–∏, —Ç–∞–∫ –∫–∞–∫ –∏–º–µ–Ω–Ω–æ –∑–¥–µ—Å—å —è –¥–æ–ª–∂–µ–Ω –≤–∏–¥–µ—Ç—å, –¥–æ–ª–∂–Ω—ã –±—ã–ª–∏ –±—ã –∏ –¥–æ–ª–∂–Ω—ã –±—ã–ª–∏ –±—ã –ø–æ—Å—Ç–∞–≤–∏—Ç—å –†–æ—Å—Å–∏—é "–Ω–∞ –º–µ—Å—Ç–æ" –º–∏—Ä–æ–≤–æ–π —Ä–µ–≤–æ–ª—é—Ü–∏–∏.  –ê —Ç–æ –≤ –†–æ—Å—Å–∏–∏ "–Ω–µ 

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –Ø –≥–æ–≤–æ—Ä—é –æ —Ç–æ–º, —á—Ç–æ –º–Ω–µ –±—ã–ª–æ —Å–∫–∞–∑–∞–Ω–æ, —á—Ç–æ –Ω–∞ —Å—ä–µ–∑–¥–µ –Ω—É–∂–Ω–æ –±—ã–ª–æ —Å–∫–∞–∑–∞—Ç—å, —á—Ç–æ–±—ã —è –¥–∞–ª –≤—Å–µ–º, –∫—Ç–æ –Ω–µ –º–æ–∂–µ—Ç –ø—Ä–∏–Ω—è—Ç—å —ç—Ç–æ—Ç –æ—Ç–≤–µ—Ç, –Ω–µ–º–µ–¥–ª–µ–Ω–Ω–æ –æ–±—ä—è–≤–∏—Ç—å –µ–≥–æ —Ä–µ–∑–æ–ª—é—Ü–∏–µ–π, —ç—Ç–æ –Ω–µ –º–æ–µ —Ä–µ—à–µ–Ω–∏–µ. –Ø –Ω–µ –≥–æ–≤–æ—Ä—é –Ω–∏ —Å–ª–æ–≤–∞ –æ —Ç–æ–º, —á—Ç–æ —ç—Ç–æ –º–æ—è —Ä–µ–∑–æ–ª—é—Ü–∏—è, —á—Ç–æ –º—ã —Ö–æ—Ç–∏–º –≤ –Ω–µ–µ –≤—Å—Ç—É–ø–∏—Ç—å, —á—Ç–æ —ç—Ç–æ ‚Äì –Ω–µ –º–æ—è —Ä–µ–∑–æ–ª—é—Ü–∏—è
.  –í –†–æ—Å—Å–∏–∏, –≤ –ú–æ—Å–∫–≤–µ –∏ —Ä—è–¥–µ –∫—Ä—É–ø–Ω—ã—Ö –≥–æ—Ä–æ–¥–æ–≤ —É–∂–µ –±–æ–ª–µ–µ –≥–æ–¥–∞ —Å—É—â–µ—Å—Ç–≤—É—é—Ç –æ—Ä–≥–∞–Ω–∏–∑–æ–≤–∞–Ω–Ω—ã–µ –≤ –ú–æ—Å–∫–≤–µ –≥—Ä—É–ø–ø—ã –Ω–∞—Å–µ–ª–µ–Ω–∏—è. 
.  –° –¥—Ä—É–≥–æ–π —Å—Ç–æ—Ä–æ–Ω—ã, —ç—Ç–∏ –¥–∞–Ω–Ω—ã–µ –∏ ¬´—Å–ø—Ä–∞–≤–µ–¥–ª–∏–≤—ã–µ¬ª —Å—Ç–∞—Ç—å–∏ –¥–æ–∫–∞–∑—ã–≤–∞—é—Ç, —á—Ç–æ –ø—Ä–æ–ª–µ—Ç–∞—Ä–∏–∞—Ç –≤ –†–æ—Å—Å–∏–∏ –±—ã–ª –Ω–∞ —Å–∞–º–æ–º –¥–µ–ª–µ –≥–æ—Ä–∞–∑–¥–æ —Å–∏–ª—å–Ω–µ–µ, —á–µ–º –≤ —ç–∫–æ–Ω–æ–º–∏—á–µ—Å–∫–∏ –æ—Ç—Å—Ç–∞–ª—ã—Ö —

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ò –µ—Å–ª–∏ –º—ã –Ω–∞—Ç–∞–ª–∫–∏–≤–∞–µ–º—Å—è –Ω–∞ –∫–∞–∫—É—é-—Ç–æ –æ—à–∏–±–∫—É, —Ç–æ –Ω–µ–∏–∑–±–µ–∂–Ω–æ –Ω–∞—Ö–æ–¥–∏–º —ç—Ç—É –æ—à–∏–±–∫—É –∏ –Ω–∞—Ç–∞–ª–∫–∏–≤–∞–µ–º—Å—è –Ω–∞ –æ—à–∏–±–∫—É —Å —ç—Ç–æ–π —Å—Ç–æ—Ä–æ–Ω—ã, –∫–∞–∫ –Ω–∞ –Ω–µ –≤—Å–µ–≥–¥–∞ –∏–∑–≤–µ—Å—Ç–Ω—É—é, –º—ã –≥–æ–≤–æ—Ä–∏–º, —á—Ç–æ –µ—Å–ª–∏ –±—ã –º—ã —Ö–æ—Ç–µ–ª–∏ –Ω–∞–π—Ç–∏ –æ—à–∏–±–∫—É, –∫–æ—Ç–æ—Ä–∞—è –µ—Å—Ç—å –Ω–∞—à–∞ —Å–∞–º–∞—è –±–ª–∏–∑–∫–∞—è –∫ –∏—Å—Ç–∏–Ω–µ, –º—ã, –Ω–µ –∏–º–µ—è –≤–æ–∑–º–æ–∂–Ω–æ—Å—Ç–∏, –∞ –≤–µ—Ä–Ω–µ–µ —Å–∫–∞–∑–∞—Ç—å, –Ω–µ –∏–º–µ—è –ø—Ä–µ–¥—Å—Ç–∞–≤–ª–µ–Ω–∏—è –æ–± —ç—Ç–æ–º
.  –û ¬´—Ä–µ–∞–ª—å–Ω–æ–π —Å–≤–æ–±–æ–¥–µ¬ª –∏¬†–±–æ–ª—å—à–∏–Ω—Å—Ç–≤–µ –ø–æ–¥–æ–±–Ω—ã—Ö –ø—Ä–æ–≥—Ä–∞–º–º –≥–æ–≤–æ—Ä–∏—Ç—Å—è –≤ –ø–∏—Å—å–º–µ –æ—Ç 25 —è–Ω–≤–∞—Ä—è, –≤ –∫–æ—Ç–æ—Ä–æ–º –ø–æ–¥—á–µ—Ä–∫–∏–≤–∞–µ—Ç—Å—è, —á—Ç–æ "—ç—Ç–æ—Ç —Ä–µ–∂–∏–º –±–æ–ª—å—à–µ –Ω–µ —Å–æ–æ—Ç–≤–µ—Ç—Å—Ç–≤—É–µ—Ç –∏–Ω—Ç–µ—Ä–µ—Å–∞–º —Ä–∞–±–æ—á–∏—Ö –∏ —á—Ç–æ "–≤—Å–µ —Ä–∞–±–æ—á–∏–µ –Ω–∞—Ö–æ–¥—è—Ç—Å—è –ø–æ–¥ –∏—Ö —Ä—É–∫–æ–≤–æ–¥—Å—Ç–≤–æ–º", –∞ "–≤—Å—è –º–∞—Å—Å–∞ —Ä–∞–±–æ—á–∏—

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –≠—Ç–∏ –¥–≤–∞ –Ω–∞–ø—Ä–∞–≤–ª–µ–Ω–∏—è –æ–¥–∏–Ω–∞–∫–æ–≤–æ —Ö–æ—Ä–æ—à–æ —Ö–∞—Ä–∞–∫—Ç–µ—Ä–∏–∑—É—é—Ç —Å–µ–±—è –≤–æ –≤—Å–µ–º –±—É—Ä–∂—É–∞–∑–Ω–æ–º –æ–±—â–µ—Å—Ç–≤–µ –∏ –≤ –†–æ—Å—Å–∏–∏ –≤ –æ—Å–æ–±–µ–Ω–Ω–æ—Å—Ç–∏.  –ï—Å–ª–∏ –Ω–µ —É–¥–∞—Å—Ç—Å—è –ø–æ–ª–Ω–æ—Å—Ç—å—é –æ–≤–ª–∞–¥–µ—Ç—å –∏—Å–∫—É—Å—Å—Ç–≤–æ–º –¥–∏–∞–ª–µ–∫—Ç–∏–∫–∏, —Ç–æ —Ç–æ–ª—å–∫–æ –¥–ª—è —ç—Ç–æ–≥–æ –Ω–µ–æ–±—Ö–æ–¥–∏–º –∏ —ç—Ç–æ—Ç –º–µ—Ç–æ–¥, –ø–æ—Ç–æ–º—É —á—Ç–æ –∏–º–µ–Ω–Ω–æ –æ–Ω ‚Äì –¥–∏–∞–ª–µ–∫—Ç–∏–∫–∞ –≤–æ–æ–±—â–µ.  –≠—Ç–æ—Ç –º–µ—Ç–æ–¥ –æ—Å–æ–±–µ–Ω–Ω–æ –Ω–µ–æ–±—Ö–æ–¥–∏–º –¥–ª—è —Å–æ—Ü–∏–∞–ª–∏–∑–∞—Ü–∏–∏ –Ω–∞—Ä–æ–¥–∞. 
.  –ö–∞–∫ —Ç–æ–ª—å–∫–æ —Å –Ω–∞–º–∏ –≤ –æ–¥–Ω–æ–π —Ç–æ—á–∫–µ –æ–∫–∞–∂—É—Ç—Å—è –≤—Å–µ, —Ç–∞–∫ —É –Ω–∞—Å –±—É–¥–µ—Ç —É–≤–µ—Ä–µ–Ω–Ω–æ—Å—Ç—å, —á—Ç–æ –º—ã –Ω–µ –ø–æ–¥–≤–µ–¥–µ–º –¥–æ –ø–æ—Å–ª–µ–¥–Ω–µ–≥–æ.  –ù–µ –ø–æ–¥–≤–µ–¥–µ–º –¥–æ –∫–æ–Ω—Ü–∞.  –ú—ã —Å–¥–µ–ª–∞–µ–º –≤—Å–µ, —á—Ç–æ–±—ã –ø–æ–±–µ–¥–∏—Ç—å —ç—Ç—É –≥—Ä—É–ø–ø—É, –∫–∞–∫ –º–æ–∂–Ω–æ —Å–∫–æ—Ä–µ–µ.  –ú—ã –¥–æ–ª–∂–Ω—ã –∑–Ω–∞—Ç—å, —á—Ç–æ –º—ã –≤ —Å–∏–ª–∞—Ö –∏ –Ω–∞ —á—Ç–æ –Ω–∞–

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ò –º—ã, –≤—Å–µ —Ä—É—Å—Å–∫–∏–µ, –Ω–µ –æ—Ç—Ä–∏—Ü–∞–µ–º —Ç–æ–≥–æ, —á—Ç–æ –Ω–∞—à–∞ –≤–ª–∞—Å—Ç—å, –Ω–µ—Å–º–æ—Ç—Ä—è –Ω–∞ –≤—Å—é —Å–≤–æ—é –≤—Ä–∞–∂–¥–µ–±–Ω–æ—Å—Ç—å –∫ —ç—Ç–æ–º—É –¥–≤–∏–∂–µ–Ω–∏—é, –≤—Å–µ-—Ç–∞–∫–∏ –ø—Ä–æ–¥–æ–ª–∂–∞–µ—Ç –≤–µ—Å—Ç–∏ —Å –Ω–∏–º –±–æ—Ä—å–±—É.  –ú—ã –≤–∏–¥–∏–º, —á—Ç–æ –±–æ–ª—å—à–∏–Ω—Å—Ç–≤–æ –Ω–∞—à–∏—Ö –ø—Ä–æ—Ç–∏–≤–Ω–∏–∫–æ–≤, –Ω–µ—Å–º–æ—Ç—Ä—è –Ω–∞ –≤—Å–µ —É—Å–∏–ª–∏—è –Ω–∞—à–µ–π –ø–æ–ª–∏—Ç–∏–∫–∏, –ø—Ä–æ–¥–æ–ª–∂–∞—é—Ç –≤ —Ç–æ–º –∂–µ —Ä—É—Å–ª–µ –ø—Ä–æ–¥–æ–ª–∂–∞—Ç—å –±–æ—Ä—å–±—É –ø—Ä–æ—Ç–∏–≤ –Ω–∞—Ä–æ–¥–∞.  –ò –æ–Ω–∏ –±—É–¥—É—Ç –∏–¥—Ç–∏ –ø–æ —Ç–æ–º—É
.  –≠—Ç–æ ‚Äì —Å–∞–º–∞—è —Å–∏–ª—å–Ω–∞—è —Ä–µ–≤–æ–ª—é—Ü–∏—è —Ä—É—Å—Å–∫–æ–≥–æ –Ω–∞—Ü–∏–æ–Ω–∞–ª—å–Ω–æ–≥–æ –¥–≤–∏–∂–µ–Ω–∏—è –≤ –ø–µ—Ä–≤—ã–µ –≥–æ–¥—ã. 
.  –ù–∞ –¥–Ω—è—Ö, –≤ —Å–≤–æ–µ–º –ø–µ—Ä–≤–æ–º –Ω–æ–º–µ—Ä–µ "–ü—Ä–æ–ª–µ—Ç–∞—Ä—Å–∫–æ–≥–æ –†–∞–±–æ—á–µ–≥–æ¬ª, —Ä–µ–¥–∞–∫—Ü–∏—è –≤—Å—Ç—Ä–µ—Ç–∏–ª–∞ –∑–∞–º–µ—Ç–∫—É, –≤ –∫–æ—Ç–æ—Ä–æ–π –≤ –∫–∞—á–µ—Å—Ç–≤–µ –ø—Ä–µ–¥–∏—Å–ª–æ–≤–∏—è –∫ —Å—Ç–∞—Ç—å–µ –ø—Ä–∏–≤–æ–¥—è—Ç—Å—è —Å–ª–æ–≤–∞ –ø—Ä–æ—Ñ–µ—Å—Å–

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}





Saving model checkpoint to ./checkpoint-500
Configuration saved in ./checkpoint-500/config.json
Configuration saved in ./checkpoint-500/generation_config.json


.  –ù–æ, –∫–æ–≥–¥–∞ –æ–Ω–∏ –±—ã–ª–∏ —Å–æ–∑–¥–∞–Ω—ã –≤¬†–µ–¥–∏–Ω—Å—Ç–≤–µ –∏¬†–µ–¥–∏–Ω—Å—Ç–≤–µ, –æ–Ω–∏ –±—ã–ª–∏ —Ç–æ–ª—å–∫–æ —Å—Ä–µ–¥—Å—Ç–≤–æ–º –±–æ—Ä—å–±—ã –ø—Ä–æ—Ç–∏–≤ ¬´–≥—Ä—è–∑–Ω–æ–≥–æ –∏–º–ø–µ—Ä–∏–∞–ª–∏–∑–º–∞¬ª. –ò—Ç–∞–∫, –º–∞—Ä–∫—Å–∏–∑–º –ø—Ä–µ–¥—Å—Ç–∞–≤–ª—è–µ—Ç –∏–∑ —Å–µ–±—è –æ–¥–Ω—É –∏–∑ —Ñ–æ—Ä–º –≥–æ—Å–ø–æ–¥—Å—Ç–≤–∞ –±—É—Ä–∂—É–∞–∑–∏–∏ –Ω–∞–¥ –ø—Ä–æ–ª–µ—Ç–∞—Ä–∏–∞—Ç–æ–º, –∏–±–æ –∫–∞–ø–∏—Ç–∞–ª–∏–∑–º ‚Äì –µ—Å—Ç—å –∏–º–ø–µ—Ä–∏–∞–ª–∏—Å—Ç, –∞ –ø—Ä–æ–ª–µ—Ç–∞—Ä–∏–∞—Ç ‚Äì –≤ —Ç–æ –∂–µ –≤—Ä–µ–º—è —ç–∫—Å–ø–ª—É–∞—Ç–∏—Ä—É–µ—Ç –∫–∞–ø–∏—Ç–∞–ª–∏—Å—Ç–∏—á–µ—Å–∫–∏–µ –º–∞—Å—Å—ã
.  –ò, –Ω–∞–∫–æ–Ω–µ—Ü, –≤¬†1853¬†–≥. –ø–æ –∏–Ω–∏—Ü–∏–∞—Ç–∏–≤–µ —Å–æ—Ü–∏–∞–ª-–¥–µ–º–æ–∫—Ä–∞—Ç–∞ –ò. –í. –ú–∞—Ä—Ç–æ–≤–∞ (–ú. –ï.¬†‚Äì –≤ ¬´–ü–∏—Å—å–º–∞—Ö –ù. –õ.) –æ–Ω –±—ã–ª –∏–∑–±—Ä–∞–Ω –≤ –î—É–º—É.¬†‚Äì 164.¬†‚Äì 168, 228‚Äì230.
.  –û —Ç–æ–º, –∫–∞–∫ –Ω–∞ —Å–∞–º–æ–º –¥–µ–ª–µ –¥–æ–ª–∂–Ω—ã –±–æ—Ä–æ—Ç—å—Å—è –∑–∞ –†–æ—Å—Å–∏—é —Å–æ—Ü–∏–∞–ª-–¥–µ–º–æ–∫—Ä–∞—Ç—ã, —Å –æ–¥–Ω–æ–π —Å—Ç–æ—Ä–æ–Ω—ã, –∏ –±–æ–ª—å—à–∏–Ω—Å—Ç–≤–æ —Å–æ—Ü–∏–∞–ª-–¥–

Model weights saved in ./checkpoint-500/pytorch_model.bin
Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –ò –º—ã —Å –∂–µ–Ω–æ–π —Ç–æ–∂–µ –Ω–∞ –Ω–∏—Ö —Å—Å—ã–ª–∞–µ–º—Å—è, –∞ –ø–æ—Ç–æ–º—É –∏ —Å–∞–º–∏ –Ω–∞ –Ω–∏—Ö —Å—Å—ã–ª–∞–µ–º—Å—è.  –ê —Ç–µ–ø–µ—Ä—å –º—ã —Å –∂–µ–Ω–æ–π –Ω–∞ –Ω–µ–µ —Å—Å—ã–ª–∞–µ–º—Å—è, –∞ –º—ã ‚Äì –Ω–∞ –Ω–µ–µ.  –ò, –µ—Å–ª–∏ —É –Ω–∞—Å –Ω–µ—Ç –Ω–∏–∫–∞–∫–æ–≥–æ –Ω–∞–º–µ—Ä–µ–Ω–∏—è, —Ç–æ –ø—É—Å—Ç—å –≤—Å–µ, –∫—Ç–æ –Ω–∞ –Ω–∞—Å —Å—Å—ã–ª–∞–µ—Ç—Å—è, –Ω–µ –æ–±–∏–∂–∞—é—Ç—Å—è.  –¢–∞–∫ –ø–æ—á–µ–º—É –∂–µ –æ–Ω–∏ –¥–æ–ª–∂–Ω—ã –æ–±–∏–∂–∞—Ç—å—Å—è
.  –ù–æ –Ω–µ –≤—Å–µ –æ–Ω–∏ –º–æ–≥—É—Ç –±—ã—Ç—å –ø—Ä–∞–≤—ã; –∫–∞–∫ –Ω–µ –≤—Å–µ–≥–¥–∞ –º–æ–∂–Ω–æ –∏ –Ω–µ –≤—Å–µ–≥–¥–∞ –Ω—É–∂–Ω–æ –∏–º–µ—Ç—å –¥–µ–ª–æ —Å –ø—Ä–∞–≤—ã–º–∏, –ø—Ä–∞–≤—ã–º–∏ –∏–ª–∏ –ø—Ä–∞–≤—ã–º–∏,¬†‚Äì –≤–æ—Ç –≤ —á–µ–º, –∫–∞–∂–µ—Ç—Å—è, —Å—É—Ç—å –∏—Ö –≤–∑–∞–∏–º–æ–æ—Ç–Ω–æ—à–µ–Ω–∏–π. –ò –≤–æ—Ç –∫–∞–∫ –æ–±—Å—Ç–æ–∏—Ç –¥–µ–ª–æ —Å –ø—Ä–∞–≤–æ–º–µ—Ä–Ω–æ—Å—Ç—å—é —Ç–æ–≥–æ –∏–ª–∏ –¥—Ä—É–≥–æ–≥–æ? –ß—Ç–æ —è–≤–ª—è–µ—Ç—Å—è –ø—Ä–∞–≤–æ–º–µ—Ä–Ω—ã–º –≤ –ø—Ä–∞–≤–æ–º –ø–æ–≤–µ–¥–µ–Ω–∏–∏ —ç—Ç–∏—Ö –ø–æ–ª–∏—Ç–∏—á–µ—Å–∫–∏—Ö –ø–∞—Ä—Ç–∏–π? –≠—Ç–æ –≤–æ–ø—Ä–æ—Å –≤
.  –≠—Ç–æ –¥–



Training completed. Do not forget to share your model on huggingface.co/models =)


Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



.  –û–¥–Ω–∞–∫–æ –¥–ª—è –Ω–∞—Å, –≤—Å–µ—Ö —ç—Ç–∏—Ö –≥—Ä—É–ø–ø, –º—ã –¥–æ–ª–∂–Ω—ã —Å—Ç—Ä–µ–º–∏—Ç—å—Å—è –∫ —Ç–æ–º—É, —á—Ç–æ–±—ã –Ω–µ —Ç–æ–ª—å–∫–æ –≤ –≤–∏–¥–µ –∏—Å–∫–ª—é—á–µ–Ω–∏—è, –Ω–æ –∏ –≤ –≤–∏–¥–µ –∏—Å–∫–ª—é—á–µ–Ω–∏—è –∏–∑ –Ω–∞—à–µ–π –ø–æ–ª–∏—Ç–∏—á–µ—Å–∫–æ–π –ø–∞—Ä—Ç–∏–∏, –≤ –ø–∞—Ä—Ç–∏–∏, –∫–æ—Ç–æ—Ä–∞—è –±—ã –ø—Ä–µ–¥—Å—Ç–∞–≤–ª—è–ª–∞ —Å–æ–±–æ–π –±–æ–ª–µ–µ —Å–ø–ª–æ—á–µ–Ω–Ω—É—é –∏ —Å–ø–ª–æ—á–µ–Ω–Ω—É—é –≥—Ä—É–ø–ø—É.–ù–∞–æ–±–æ—Ä–æ—Ç, —ç—Ç–æ –º–æ–∂–µ—Ç –∏–¥—Ç–∏ –≤—Ä–∞–∑—Ä–µ–∑ —Å –ø–æ–ª–∏—Ç–∏—á–µ—Å–∫–æ–π –Ω–µ–æ–±—Ö–æ–¥–∏–º–æ—Å—Ç—å—é, –º–æ–∂–µ—Ç –±—ã—Ç—å, —Å —ç–∫–æ–Ω–æ–º–∏—á–µ—Å–∫–æ–π –ø–æ—Ç—Ä–µ–±–Ω–æ—Å—Ç—å—é, –∏–ª–∏ –∂–µ
.  –í —Å—É—â–Ω–æ—Å—Ç–∏, —ç—Ç–æ –¥–∞–∂–µ –∏ –≤ –≥–æ–ª–æ–≤—É –Ω–µ –ø—Ä–∏—Ö–æ–¥–∏–ª–æ, —á—Ç–æ –Ω–∞ –¥–µ–ª–µ, —Ö–æ—Ç—è –±—ã –∏ —Ç–µ–æ—Ä–µ—Ç–∏—á–µ—Å–∫–∏, –±–æ–ª—å—à–µ–≤–∏–∫–∏ —è–≤–ª—è—é—Ç—Å—è –¥–µ–º–æ–∫—Ä–∞—Ç–∞–º–∏, –∫–æ—Ç–æ—Ä—ã–µ –≤–µ–¥—É—Ç –±–æ—Ä—å–±—É —Å —Ä–µ–≤–æ–ª—é—Ü–∏–µ–π.  –ö. –ú–∞—Ä–∫—Å, –Ω–∞–ø—Ä–∏–º–µ—Ä, –¥–æ–∫–∞–∑—ã–≤–∞–ª, —á—Ç–æ —Ç–æ–ª—å–∫–æ —Ç–∞–∫ –º–æ–∂–Ω–æ –ø—Ä–æ–≤–µ—

Saving model checkpoint to .
Configuration saved in ./config.json
Configuration saved in ./generation_config.json
Model weights saved in ./pytorch_model.bin


In [16]:
# Sample continuations of the Russian prompt ". самое важное" (". the most important
# thing") from the model currently bound to the module-level `model`/`tokenizer`.
# max_len raises the generation length cap from the default 70 to 200.
print_generations(prefix=". самое важное", max_len=200)

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



. —Å–∞–º–æ–µ –≤–∞–∂–Ω–æ–µ, —á—Ç–æ –º—ã –º–æ–∂–µ–º –¥–µ–ª–∞—Ç—å, —ç—Ç–æ —Å–æ–∑–¥–∞–≤–∞—Ç—å —á—Ç–æ –±—ã —Ç–æ –Ω–∏ –±—ã–ª–æ –±–æ–ª–µ–µ –∏–ª–∏ –º–µ–Ω–µ–µ –≤ —Ñ–æ—Ä–º–µ, –∫–æ–≥–¥–∞-–ª–∏–±–æ, –≤ —Ñ–æ—Ä–º–µ –¥–≤–∏–∂–µ–Ω–∏—è, –∏–ª–∏ –∏–Ω–∞—á–µ, –≤ —Ñ–æ—Ä–º–µ –æ—Ä–≥–∞–Ω–∏–∑–∞—Ü–∏–∏.
. —Å–∞–º–æ–µ –≤–∞–∂–Ω–æ–µ, —á–µ–≥–æ —Ö–æ—á–µ—Ç –¥–æ—Å—Ç–∏–≥–Ω—É—Ç—å –±—É—Ä–∂—É–∞–∑–Ω—ã–π –Ω–∞—Ä–æ–¥ –≤ —ç—Ç–æ–º —Å—Ç–æ–ª–µ—Ç–∏–∏,¬†‚Äì —ç—Ç–æ –ø–µ—Ä–µ—Ö–æ–¥–∞ –∫ –¥–µ–º–æ–∫—Ä–∞—Ç–∏–∏. –ò –∏–º–µ–Ω–Ω–æ –ø–æ—ç—Ç–æ–º—É ‚Äì –±–æ—Ä—å–±–∞ —Å –±—É—Ä–∂—É–∞–∑–Ω–æ–π –¥–µ–º–æ–∫—Ä–∞—Ç–∏–µ–π, –∫–∞–∫ –±—ã –æ–Ω–∞ –Ω–∏ –±—ã–ª–∞ –≤—Ä–µ–¥–Ω–∞ –¥–ª—è –±—É—Ä–∂—É–∞–∑–∏–∏ –≤ –†–æ—Å—Å–∏–∏, –∫–∞–∫ –±—ã –æ–Ω–∞ –Ω–∏ –±—ã–ª–∞ –≤—Ä–µ–¥–Ω–∞ –¥–ª—è –≤—Å–µ—Ö —É–≥–Ω–µ—Ç–µ–Ω–Ω—ã—Ö –Ω–∞—Ü–∏–π –≤ –º–∏—Ä–µ. –ù–æ –∏–º–µ–Ω–Ω–æ –±–ª–∞–≥–æ–¥–∞—Ä—è —ç—Ç–æ–º—É –ø–µ—Ä–µ—Ö–æ–¥—É –≤ –†–æ—Å—Å–∏–∏ –º–æ–∂–µ—Ç —Ç–µ–ø–µ—Ä—å –±—ã—Ç—å –∏ –±—É—Ä–∂—É–∞–∑–Ω–∞—è –¥–µ–º–æ–∫—Ä–∞—Ç–∏—è. –ù–æ –≤ —ç—Ç–æ–π –¥–µ–º–æ–∫—Ä–∞—Ç–∏–∏ –Ω–µ –¥–æ–ª–∂–Ω—ã –±—ã—Ç—å –Ω–µ—É—á—Ç–µ–Ω—ã –∏ —Ç–µ

In [17]:
# Sample continuations of the Russian prompt ". я верю, что" (". I believe that") from
# the model currently bound to the module-level `model`/`tokenizer`.
# max_len raises the generation length cap from the default 70 to 200.
print_generations(prefix=". я верю, что", max_len=200)

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



. —è –≤–µ—Ä—é, —á—Ç–æ –º—ã,¬†‚Äì —Å–∫–∞–∑–∞–ª –§–æ–∫—Å, –Ω–µ –æ—Ç—Ä—ã–≤–∞—è—Å—å –æ—Ç –æ–∫–Ω–∞.¬†‚Äì –ú—ã –¥–æ–ª–∂–Ω—ã –±—ã—Ç—å –≥–æ—Ç–æ–≤—ã –∑–∞—â–∏—â–∞—Ç—å —Å–µ–±—è —Å–∞–º–∏. –ú—ã –Ω–µ —Ö–æ—Ç–∏–º –Ω–∏ –æ –∫–∞–∫–æ–π –∑–∞—â–∏—Ç–µ –Ω–∏ –ø—Ä–æ—Å–∏—Ç—å, –Ω–∏ –ø—Ä–æ—Å–∏—Ç—å, –∞ –¥–æ–ª–∂–Ω—ã –±–æ—Ä–æ—Ç—å—Å—è —Å–æ –≤—Å–µ–º–∏ —ç—Ç–∏–º–∏ –ø—Ä–æ—Ç–∏–≤–Ω–∏–∫–∞–º–∏. –ù–æ —Ç–æ–ª—å–∫–æ –º—ã –Ω–µ —Ö–æ—Ç–∏–º, —á—Ç–æ–± —ç—Ç–∏ –ø—Ä–æ—Ç–∏–≤–Ω–∏–∫–∏ –±—ã–ª–∏ –∏–∑-–∑–∞ —É–≥–ª–∞, –∏–∑-–∑–∞ –∑–∞–±–æ—Ä–∞, —Å —É–ª–∏—Ü—ã, –≤ –¥–µ—Ä–µ–≤–Ω–µ, –≤ —Å–≤–æ–µ–º –≥–æ—Ä–æ–¥–µ, —á—Ç–æ–±—ã –æ–Ω–∏ –Ω–µ –º–æ–≥–ª–∏ –∂–∏—Ç—å –≤ —Å–æ–±—Å—Ç–≤–µ–Ω–Ω–æ–º –¥–æ–º–µ, —á—Ç–æ–±—ã –Ω–µ –º–æ–≥–ª–∏ –Ω–∏ –≤ –∫–∞–∫–æ–π –º–µ—Ä–µ –≤–Ω—è—Ç—å –Ω–∞—à–µ–º—É –ø–æ–∂–µ–ª–∞–Ω–∏—é.
. —è –≤–µ—Ä—é, —á—Ç–æ –≤ —ç—Ç–æ–º –≤–æ–ø—Ä–æ—Å–µ –µ—Å—Ç—å —Å–º—ã—Å–ª. –ù–æ, –ø–æ–∂–∞–ª—É–π, –Ω–µ –±—ã–ª–æ –±—ã –≤ —ç—Ç–æ–π —Ä–∞–±–æ—Ç–µ –Ω–∏ –æ–¥–Ω–æ–π –ø—Ä–∞–≤–∏–ª—å–Ω–æ–π, –Ω–æ —á—Ä–µ–∑–≤—ã—á–∞–π–Ω–æ –ø–æ–ª–µ–∑–Ω–æ–π, —Ä–∞–±–æ—Ç—ã, –∫–æ—Ç–æ—Ä–∞—è –±—ã –≤ –∫–æ—Ä–Ω–µ –∏–∑–

In [18]:
# Sample continuations of the Russian prompt ". я ненавижу" (". I hate") from the model
# currently bound to the module-level `model`/`tokenizer`.
# max_len raises the generation length cap from the default 70 to 200.
print_generations(prefix=". я ненавижу", max_len=200)

Generate config GenerationConfig {
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.26.1"
}



. —è –Ω–µ–Ω–∞–≤–∏–∂—É –ª–∏–±–µ—Ä–∞–ª–æ–≤-–¥–µ–∫–∞–±—Ä–∏—Å—Ç–æ–≤-–º–æ–Ω–∞—Ä—Ö–æ–≤ –∏ –∏—Ö ¬´–ø–∞—Ç—Ä–∏–æ—Ç–∏—á–µ—Å–∫–∏–µ¬ª ¬´—É–∫–∞–∑–∞—Ç–µ–ª–∏¬ª –∏¬†–æ—Ç–¥–µ–ª—å–Ω—ã–µ —Å–ª–æ–≤–∞-–ª–∏—Ä–∏–∫–∏. –Ø –Ω–µ –Ω–µ–Ω–∞–≤–∏–∂—É –ª–∏–±–µ—Ä–∞–ª–æ–≤-–º–æ–Ω–æ—Ñ–∏–∑–∏—Ç–æ–≤, –∞ –≤ —Ç–æ–º, —á—Ç–æ –æ–Ω–∏ –Ω–∞–∑—ã–≤–∞—é—Ç –ª–∏–±–µ—Ä–∞–ª–æ–≤ ¬´–º–æ–Ω–∞—Ä—Ö–∞–º–∏¬ª –∏¬†—Ç. –∏¬†–º. –≤¬†—Å–ª–æ–≤–æ (–æ—Ç–¥–µ–ª—å–Ω–æ) ¬´–º–æ–Ω–∞—Ä—Ö–∏¬ª, —è –≤–∏–∂—É –Ω–µ –≤ —Ç–æ–º, —á—Ç–æ –æ–Ω–∏ –¥—É–º–∞—é—Ç, –∞ –≤ —Ç–æ–º, —á—Ç–æ –æ–Ω–∏ –≤–∏–¥—è—Ç –∏ –≥–æ–≤–æ—Ä—è—Ç (–≤–º–µ—Å—Ç–µ —Å —Ç–µ–º–∏ –ª–∏–±–µ—Ä–∞–ª–∞–º–∏, –∫–æ—Ç–æ—Ä—ã–µ –≥–æ–≤–æ—Ä—è—Ç: ¬´–º–æ–Ω–æ—Ñ–∏–∑–∏–∫–∞–º–∏¬ª, ¬´–ø—Ä–æ–ª–µ—Ç–∞—Ä–∏—è–º–∏¬ª, ¬´–¥–≤–æ—Ä—Ü–∞–º–∏¬ª –∏¬†—Ç.¬†–¥.). –ù–æ –æ–Ω–∏ –Ω–µ –≥–æ–≤–æ—Ä—è—Ç, –∞ –≥–æ–≤–æ—Ä—è—Ç, —á—Ç–æ –æ–Ω–∏ –≥–æ–≤–æ—Ä—è—Ç –∏ –¥–µ–ª–∞—é—Ç (–∏ –Ω–∞ —Å–∞–º–æ–º –¥–µ–ª–µ –æ–Ω–∏ –≥–æ–≤–æ—Ä—è—Ç –æ —Ç–æ–º, —á—Ç–æ –∏ –Ω–∞ —Å–∞–º–æ–º –¥–µ–ª–µ –≥–æ–≤–æ—Ä—è—Ç –æ —Å–µ–±–µ), –≥–æ–≤–æ—Ä—è—Ç, —á—Ç–æ –æ–Ω–∏ –¥–µ–ª–∞—é—Ç, –≥–æ–≤–æ—Ä—è—Ç, —á—Ç–æ –æ–Ω