In [None]:
!pip install -q -U transformer

In [None]:
import csv
from typing import Tuple
from transformers import (
    AutoModelForCausalLM,
    AutoTokenizer,
    PreTrainedModel,
    PreTrainedTokenizer
)

def load_model_and_tokenizer(model_name_or_path: str) -> Tuple[PreTrainedModel, PreTrainedTokenizer]:
    """Load a causal language model together with its tokenizer.

    Args:
        model_name_or_path: Identifier or path forwarded unchanged to both
            ``from_pretrained`` calls.

    Returns:
        A ``(model, tokenizer)`` tuple. When the tokenizer ships without a
        padding token, its end-of-sequence token is registered as the padding
        token before returning.

    Raises:
        RuntimeError: If any step fails. The original exception is attached
            as ``__cause__`` so the underlying traceback is preserved.
    """
    try:
        # NOTE(review): trust_remote_code=True lets the model repository run
        # its own Python code at load time; only use it with sources you trust.
        model = AutoModelForCausalLM.from_pretrained(model_name_or_path, trust_remote_code=True)
        tokenizer = AutoTokenizer.from_pretrained(model_name_or_path, trust_remote_code=True)

        # Reuse EOS as the padding token when the tokenizer defines none.
        if tokenizer.pad_token is None:
            tokenizer.add_special_tokens({'pad_token': tokenizer.eos_token})

        return model, tokenizer
    except Exception as e:
        # Chain explicitly so the root cause is reported as the direct cause.
        raise RuntimeError(f"Failed to load model and tokenizer: {e}") from e

def generate_text(
    model: PreTrainedModel,
    tokenizer: PreTrainedTokenizer,
    prompt: str,
    max_length: int = 100,
    temperature: float = 0.9
) -> str:
    """Sample a continuation of ``prompt`` and return the decoded sequence.

    Args:
        model: Model whose ``generate`` method is used for sampling.
        tokenizer: Tokenizer used to encode the prompt and decode the result.
        prompt: Text to continue.
        max_length: Forwarded to ``generate`` as ``max_length``. This limit is
            on the total sequence (prompt tokens plus new tokens), so the
            prompt must be shorter than it for anything to be generated.
        temperature: Sampling temperature forwarded to ``generate``.

    Returns:
        The first generated sequence decoded to text. The decoded text is the
        whole sequence, i.e. it starts with the prompt tokens, and special
        tokens are not stripped.
    """
    # Keep the attention mask alongside the ids and place both on the same
    # device as the model.
    encoded = tokenizer(prompt, return_tensors="pt").to(model.device)

    # Pass an explicit padding id; fall back to EOS when none is configured.
    pad_token_id = tokenizer.pad_token_id
    if pad_token_id is None:
        pad_token_id = tokenizer.eos_token_id

    gen_tokens = model.generate(
        encoded["input_ids"],
        attention_mask=encoded["attention_mask"],
        do_sample=True,
        temperature=temperature,
        max_length=max_length,
        pad_token_id=pad_token_id
    )

    gen_text = tokenizer.batch_decode(gen_tokens)[0]

    return gen_text

# Load the model and tokenizer once
model_name_or_path = "gpt2"
model, tokenizer = load_model_and_tokenizer(model_name_or_path)

# Specify the number of iterations to generate text
num_iterations = 100
file_csv='output2.csv'
# Number of tokens the answer may add on top of its (long) prompt
answer_new_tokens = 100

# The question prompt never changes, so build it once outside the loop.
prompt_Q = " Generate unique coding questions in C, C++, and Python that focus on time and memory optimization, as well as advanced research topics. Please provide one question for each programming language. Note every time new question novel (first time people see in this earth) "

# Generate text and write to CSV file
with open(file_csv, mode='w', newline='', encoding='utf-8') as csvfile:
    fieldnames = ['prompt', 'generated_text']
    writer = csv.DictWriter(csvfile, fieldnames=fieldnames)
    writer.writeheader()

    for _ in range(num_iterations):
        # `Question` is the full decoded sequence (question prompt + continuation).
        Question = generate_text(model, tokenizer, prompt_Q)
        prompt_A=f'Compose a series of interconnected thoughts in a chain of thoughts format, demonstrating your expertise in advanced computer science and advanced higher mathematical skills.  {Question }'
        # `max_length` counts the prompt tokens too, and the answer prompt
        # embeds the whole question text. A fixed limit of 100 would leave no
        # room to generate, so size the limit from the actual prompt length.
        answer_max_length = len(tokenizer(prompt_A).input_ids) + answer_new_tokens
        Answer = generate_text(model, tokenizer, prompt_A, max_length=answer_max_length)
        writer.writerow({'prompt': Question, 'generated_text': Answer})


In [None]:
pip  install einops

In [None]:
import csv
from typing import Tuple
from transformers import (
    AutoModelForCausalLM,
    AutoTokenizer,
    PreTrainedModel,
    PreTrainedTokenizer
)

def load_model_and_tokenizer(model_name_or_path: str) -> Tuple[PreTrainedModel, PreTrainedTokenizer]:
    """Load a causal language model together with its tokenizer.

    Args:
        model_name_or_path: Identifier or path forwarded unchanged to both
            ``from_pretrained`` calls.

    Returns:
        A ``(model, tokenizer)`` tuple. When the tokenizer ships without a
        padding token, its end-of-sequence token is registered as the padding
        token before returning.

    Raises:
        RuntimeError: If any step fails. The original exception is attached
            as ``__cause__`` so the underlying traceback is preserved.
    """
    try:
        # NOTE(review): trust_remote_code=True lets the model repository run
        # its own Python code at load time; only use it with sources you trust.
        model = AutoModelForCausalLM.from_pretrained(model_name_or_path, trust_remote_code=True)
        tokenizer = AutoTokenizer.from_pretrained(model_name_or_path, trust_remote_code=True)

        # Reuse EOS as the padding token when the tokenizer defines none.
        if tokenizer.pad_token is None:
            tokenizer.add_special_tokens({'pad_token': tokenizer.eos_token})

        return model, tokenizer
    except Exception as e:
        # Chain explicitly so the root cause is reported as the direct cause.
        raise RuntimeError(f"Failed to load model and tokenizer: {e}") from e

def generate_text(
    model: PreTrainedModel,
    tokenizer: PreTrainedTokenizer,
    prompt: str,
    max_length: int = 100,
    temperature: float = 0.9
) -> str:
    """Sample a continuation of ``prompt`` and return the decoded sequence.

    Args:
        model: Model whose ``generate`` method is used for sampling.
        tokenizer: Tokenizer used to encode the prompt and decode the result.
        prompt: Text to continue.
        max_length: Forwarded to ``generate`` as ``max_length``. This limit is
            on the total sequence (prompt tokens plus new tokens), so the
            prompt must be shorter than it for anything to be generated.
        temperature: Sampling temperature forwarded to ``generate``.

    Returns:
        The first generated sequence decoded to text. The decoded text is the
        whole sequence, i.e. it starts with the prompt tokens, and special
        tokens are not stripped.
    """
    # Keep the attention mask alongside the ids and place both on the same
    # device as the model.
    encoded = tokenizer(prompt, return_tensors="pt").to(model.device)

    # Pass an explicit padding id; fall back to EOS when none is configured.
    pad_token_id = tokenizer.pad_token_id
    if pad_token_id is None:
        pad_token_id = tokenizer.eos_token_id

    gen_tokens = model.generate(
        encoded["input_ids"],
        attention_mask=encoded["attention_mask"],
        do_sample=True,
        temperature=temperature,
        max_length=max_length,
        pad_token_id=pad_token_id
    )

    gen_text = tokenizer.batch_decode(gen_tokens)[0]

    return gen_text

# Load the model and tokenizer once
model_name_or_path = "microsoft/phi-2"
model, tokenizer = load_model_and_tokenizer(model_name_or_path)

# Specify the number of iterations to generate text
num_iterations = 100
file_csv='output3.csv'
# Number of tokens the answer may add on top of its (long) prompt
answer_new_tokens = 100

# The question prompt never changes, so build it once outside the loop.
prompt_Q = " Generate unique coding questions in C, C++, and Python that focus on time and memory optimization, as well as advanced research topics. Please provide one question for each programming language. Note every time new question novel (first time people see in this earth) "

# Generate text and write to CSV file
with open(file_csv, mode='w', newline='', encoding='utf-8') as csvfile:
    fieldnames = ['prompt', 'generated_text']
    writer = csv.DictWriter(csvfile, fieldnames=fieldnames)
    writer.writeheader()

    for _ in range(num_iterations):
        # `Question` is the full decoded sequence (question prompt + continuation).
        Question = generate_text(model, tokenizer, prompt_Q)
        prompt_A=f'Compose a series of interconnected thoughts in a chain of thoughts format, demonstrating your expertise in advanced computer science and advanced higher mathematical skills.  {Question }'
        # `max_length` counts the prompt tokens too, and the answer prompt
        # embeds the whole question text. A fixed limit of 100 would leave no
        # room to generate, so size the limit from the actual prompt length.
        answer_max_length = len(tokenizer(prompt_A).input_ids) + answer_new_tokens
        Answer = generate_text(model, tokenizer, prompt_A, max_length=answer_max_length)
        writer.writerow({'prompt': Question, 'generated_text': Answer})


In [None]:
from transformers import AutoModelForCausalLM, AutoTokenizer

# Load the Mistral 7B model and tokenizer
model_name = "mistralai/Mistral-7B-v0.1"
model = AutoModelForCausalLM.from_pretrained(model_name)
tokenizer = AutoTokenizer.from_pretrained(model_name)

# Define the prompt or input text
prompt = "Your prompt goes here."

# Tokenize with the call interface so the attention mask is kept alongside
# the ids, and place both on the same device as the model.
encoded = tokenizer(prompt, return_tensors="pt").to(model.device)
input_ids = encoded["input_ids"]

# Generate text using the Mistral 7B model.
# `max_length` bounds prompt tokens plus generated tokens.
output = model.generate(
    input_ids,
    attention_mask=encoded["attention_mask"],
    max_length=8000,
    # Explicit padding id: use the tokenizer's pad token, or EOS when none is set.
    pad_token_id=(
        tokenizer.pad_token_id
        if tokenizer.pad_token_id is not None
        else tokenizer.eos_token_id
    ),
)

# Retrieve the generated text
generated_text = tokenizer.decode(output[0], skip_special_tokens=True)

print(generated_text)
