In [None]:
from IPython.display import Audio
from scipy.io.wavfile import write as write_wav
from clone.generation import SAMPLE_RATE, preload_models, codec_decode, generate_coarse, generate_fine, generate_text_semantic

In [None]:
# Root folder on Google Drive that holds the fine-tuned checkpoints. All three
# paths below are derived from it, so relocating the weights is a one-line edit.
WEIGHTS_DIR = "/content/drive/MyDrive/Capstone Dataset(Input and Output)/Model Weights"

# Set any of these to None if you don't want to use the fine-tuned weights for that stage.
semantic_path = f"{WEIGHTS_DIR}/semantic_output_100epochs/semantic_prompt.bin"
coarse_path = f"{WEIGHTS_DIR}/coarse_output_100epochs/coarse_prompt.bin"
fine_path = f"{WEIGHTS_DIR}/fine_output_100epochs/fine_prompt.bin"

In [None]:
# Gather every loader option in one mapping, grouped by pipeline stage, then
# pass the whole set to preload_models in a single call.
preload_options = {
    # text -> semantic stage (uses the checkpoint at semantic_path)
    "text_use_gpu": True,
    "text_use_small": False,
    "text_model_path": semantic_path,
    # coarse stage (uses the checkpoint at coarse_path)
    "coarse_use_gpu": True,
    "coarse_use_small": False,
    "coarse_model_path": coarse_path,
    # fine stage (uses the checkpoint at fine_path)
    "fine_use_gpu": True,
    "fine_use_small": False,
    "fine_model_path": fine_path,
    # codec and loader-wide options
    "codec_use_gpu": True,
    "force_reload": False,
    "path": "models",
}
preload_models(**preload_options)


In [None]:
def generate_with_settings(
    text_prompt,
    semantic_temp=0.7,
    semantic_top_k=50,
    semantic_top_p=0.95,
    coarse_temp=0.7,
    coarse_top_k=50,
    coarse_top_p=0.95,
    fine_temp=0.5,
    voice_name=None,
    use_semantic_history_prompt=False,
    use_coarse_history_prompt=True,
    use_fine_history_prompt=True,
    output_full=False,
):
    """Run the semantic -> coarse -> fine -> decode chain with per-stage settings.

    Args:
        text_prompt: Text handed to ``generate_text_semantic``.
        semantic_temp, semantic_top_k, semantic_top_p: Forwarded to
            ``generate_text_semantic`` as ``temp`` / ``top_k`` / ``top_p``.
        coarse_temp, coarse_top_k, coarse_top_p: Forwarded to
            ``generate_coarse`` as ``temp`` / ``top_k`` / ``top_p``.
        fine_temp: Forwarded to ``generate_fine`` as ``temp``.
        voice_name: Value used as ``history_prompt`` for each stage whose
            ``use_*_history_prompt`` flag is truthy; other stages get ``None``.
        use_semantic_history_prompt: Whether the semantic stage receives
            ``voice_name``.
        use_coarse_history_prompt: Whether the coarse stage receives
            ``voice_name``.
        use_fine_history_prompt: Whether the fine stage receives ``voice_name``.
        output_full: When truthy, also return the intermediate stage outputs.

    Returns:
        The result of ``codec_decode`` on the fine-stage output. If
        ``output_full`` is truthy, a ``(stages, decoded)`` tuple instead, where
        ``stages`` is a dict with keys ``'semantic_prompt'``,
        ``'coarse_prompt'`` and ``'fine_prompt'``.
    """

    def _history_for(stage_enabled):
        # A stage only sees the voice prompt when its flag is switched on.
        return voice_name if stage_enabled else None

    semantic_tokens = generate_text_semantic(
        text_prompt,
        history_prompt=_history_for(use_semantic_history_prompt),
        temp=semantic_temp,
        top_k=semantic_top_k,
        top_p=semantic_top_p,
    )
    coarse_tokens = generate_coarse(
        semantic_tokens,
        history_prompt=_history_for(use_coarse_history_prompt),
        temp=coarse_temp,
        top_k=coarse_top_k,
        top_p=coarse_top_p,
    )
    fine_tokens = generate_fine(
        coarse_tokens,
        history_prompt=_history_for(use_fine_history_prompt),
        temp=fine_temp,
    )

    decoded = codec_decode(fine_tokens)
    if not output_full:
        return decoded

    stages = {
        'semantic_prompt': semantic_tokens,
        'coarse_prompt': coarse_tokens,
        'fine_prompt': fine_tokens,
    }
    return stages, decoded

## Single-clip audio inference from the dataset (train, valid, or test)

Recommended: run one of the cells below instead of the full-output inference.

In [None]:
# text_prompt = "lets see some examples so first right is above the domain adaptation so in this slide we will see our."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide3_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide3_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "we have another kind of datasets in the medical field for example we have the t one images and we have the flare images if we."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide3_0070-0080.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide3_0070-0080.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "and I will introduce one more of the previous that I developed out of those examples thats exactly how manifold."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide4_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide4_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "in this case its just a sixteen and theres a out is the outer is just about you know one the shape of your brain structure."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide5_0030-0040.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide5_0030-0040.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "different causes of the diseases if it is one it means normal if it is two it means its abnormal so sometimes you."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide7_0020-0030.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide7_0020-0030.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "left hand you see a lot of like noise you just you know bring it over but on your right hand once you get the denoised."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide9_0010-0020.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide9_0010-0020.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "here right and the same on the left hand the this figure is about noisy mixing birds by the right hand there are two different colors so."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide10_0010-0020.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide10_0010-0020.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "and there is this one is a very pretty big."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide11_0040-0042.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide11_0040-0042.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "and then this here is just our canvas page and then you can feel free to have some discussions online."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide13_0030-0039.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide13_0030-0039.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "in the office after any kind of questions okay."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide15_0030-0034.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide15_0030-0034.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# Identifier of the clip being synthesized. The output WAV and the voice-prompt
# token file are both named after it, so both paths are derived from this one
# value and cannot drift apart when the cell is edited for another clip.
clip_id = "clip_slide18_0040-0050"

text_prompt = "its about thirty percentage for that reason your final project is like your first semester first year come to my office talk to me to."
filepath = f"/content/drive/MyDrive/output/test_inference_output/{clip_id}.wav" # change this to your desired output path
voice_prompt_path = f"/content/drive/MyDrive/Course_Audio/tokens/{clip_id}.npz"

# The voice prompt is passed to the coarse and fine stages only; the semantic
# stage runs without a history prompt.
audio_array = generate_with_settings(
    text_prompt,
    semantic_temp=0.80,
    semantic_top_k=50,
    semantic_top_p=0.99,
    coarse_temp=0.80,
    coarse_top_k=50,
    coarse_top_p=0.95,
    fine_temp=0.70,
    voice_name=voice_prompt_path,
    use_semantic_history_prompt=False,
    use_coarse_history_prompt=True,
    use_fine_history_prompt=True,
    output_full=False
)

# Save the generated audio to `filepath` at the pipeline's sample rate.
write_wav(filepath, SAMPLE_RATE, audio_array)
print("--------------------------------------------")

# Uncomment to play the result inline in the notebook:
# Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "yes we depending on your guys if you guys sound like, other at the most I would like to say two students per group."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide18_0130-0140.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide18_0130-0140.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "and data pre processing in the third way we are talking about the classification after that we will talk about some regression and list."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide20_0010-0020.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide20_0010-0020.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "we have like neural network Anselm method and we are finished about the horse method I'll have to emphasize that soon."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide20_0060-0070.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide20_0060-0070.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "the final project professor yes let's go try to find it in our syllabus again so here is all the content that I will cover."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide20_0130-0140.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide20_0130-0140.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "are all the projects independent for that or like a teamwork professor you mean the homework student wanna know the project project."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide20_0160-0170.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide20_0160-0170.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "in your interview how you will implement the scale these kinds of algorithms like Gaussian Mixture Model how you will implement."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide20_0220-0230.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide20_0220-0230.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "immediately implemented and you definitely have a good impression of them so now the might need some might hire you immediately hopefully okay."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide20_0250-0260.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide20_0250-0260.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "what about the other source this is so yeah it's still kinda often what about the other source of of from online students."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide22_0040-0050.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide22_0040-0050.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "so first of all was the perceptron of we also say it as representation so in AI perceptron."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide24_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide24_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "but what about learning so the learning is the ability of a system to improve its behavior based on experience so."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide25_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide25_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "level and applying it at other level so then another question so among those four different aspects which."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide27_0020-0030.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide27_0020-0030.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Answer."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide27_0080-0082.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide27_0080-0082.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "verification and validation is more like you like your phone."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide29_0030-0040.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide29_0030-0040.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "especially the amount that data labeling is a big challenge for all existing machine learning for those you definitely need to provide feed."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide29_0100-0110.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide29_0100-0110.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "interaction the HCI and Israeli would like a little bit longer time than single computer models but you know."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide29_0160-0170.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide29_0160-0170.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "label the input data so then one features and labels professor feature and labels cn that's yes exactly."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide30_0060-0070.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide30_0060-0070.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "you've got some stock price predictions so the stock price on your level our levels of it right giving you."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide30_0130-0140.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide30_0130-0140.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "of that in the nineteen sixties like the earliest offer network it's called perception as it was born at that time."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide32_0020-0030.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide32_0020-0030.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "finding some tasks and learning some reinforcement learning and inductive logic programming etcetera."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide33_0020-0028.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide33_0020-0028.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "about two years ago in the two thousand tens in that stage and like deep learning is rarely and becomes popular right."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide34_0030-0040.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide34_0030-0040.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "so this is about the intuition of showing how it handles themselves actually there are no specific features that."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide37_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide37_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "yes right what about the world and that's about our children so really humanness learn from experience."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide37_0060-0070.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide37_0060-0070.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "model is bigger professor yes that's very good spectrum what about some thoughts about you guys use tradition."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide38_0030-0040.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide38_0030-0040.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "sum of if a statement and a check if that's related to a cat or not professor good you have a similar."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide38_0100-0110.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide38_0100-0110.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "we want to detect the shape we want to detect the length and we have so many different if else statements so finally to decide."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide39_0030-0040.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide39_0030-0040.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "very challenging I mean different shape strange shape somehow has a cat more like water it can be in any shape right."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide41_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide41_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "so now we talk about the questions some what is machine learning and this is very important the early stage of computer."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide43_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide43_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "because we are human beings right and we are we were lazy we don't we cannot do everything we want some computers."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide44_0020-0030.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide44_0020-0030.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "the next question is why study machine learning why is it important here's the case in that we want to develop a better computer system."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide46_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide46_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# Inference run for clip_slide46_0060-0070: synthesize the transcript below and save it as a WAV file.
filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide46_0060-0070.wav" # change this to your desired output path
text_prompt = "users for example personalized news the mailing filtering for example sometimes you have some app."

# voice_name is forwarded as the history prompt to the coarse and fine stages only;
# the semantic stage runs without one (use_semantic_history_prompt=False).
audio_array = generate_with_settings(
    text_prompt,
    voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide46_0060-0070.npz",
    # semantic stage sampling
    semantic_temp=0.8, semantic_top_k=50, semantic_top_p=0.99,
    use_semantic_history_prompt=False,
    # coarse stage sampling
    coarse_temp=0.8, coarse_top_k=50, coarse_top_p=0.95,
    use_coarse_history_prompt=True,
    # fine stage sampling
    fine_temp=0.7,
    use_fine_history_prompt=True,
    output_full=False,
)

# Persist the generated audio, then print a separator so consecutive runs are easy to tell apart in the output.
write_wav(filename=filepath, rate=SAMPLE_RATE, data=audio_array)
print("--------------------------------------------")

# Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "learn is not intelligent so actually without learning everything is new right a system that cannot learn is not efficient because it."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide47_0010-0020.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide47_0010-0020.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "you will try to use machine learning for example in the speech recognition for example you will use siri and ask her to do."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide48_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide48_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "and also we can recognize handwritten digits for example this kind of very weird right it's it is weird right."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide51_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide51_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "been there before right who can use some robot machine help us be explored first right."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide54_0010-0017.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide54_0010-0017.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# Inference run for clip_slide56_0000-0010: synthesize the transcript below and save it as a WAV file.
filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide56_0000-0010.wav" # change this to your desired output path
text_prompt = "another trend is about why machine learning models are so popular right because there are so many places that we needed to use machine learning."

# voice_name is forwarded as the history prompt to the coarse and fine stages only;
# the semantic stage runs without one (use_semantic_history_prompt=False).
audio_array = generate_with_settings(
    text_prompt,
    voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide56_0000-0010.npz",
    # semantic stage sampling
    semantic_temp=0.8, semantic_top_k=50, semantic_top_p=0.99,
    use_semantic_history_prompt=False,
    # coarse stage sampling
    coarse_temp=0.8, coarse_top_k=50, coarse_top_p=0.95,
    use_coarse_history_prompt=True,
    # fine stage sampling
    fine_temp=0.7,
    use_fine_history_prompt=True,
    output_full=False,
)

# Persist the generated audio, then print a separator so consecutive runs are easy to tell apart in the output.
write_wav(filename=filepath, rate=SAMPLE_RATE, data=audio_array)
print("--------------------------------------------")

# Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "to use machine learning and this is the key reason why machine learning nowadays is so popular and important."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide56_0090-0097.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide56_0090-0097.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "learning we have we will use labeled dataset right as the unsupervised learning just to discover patterns in unlabeled dataset."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide58_0020-0030.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide58_0020-0030.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "had a semi supervised another count between those ones as a majority we have three those three different categories for example is."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide59_0010-0020.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide59_0010-0020.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "unlabeled data is a traditional sense is a reinforcement learning an agent learns via its interactions with any environment."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide59_0050-0060.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide59_0050-0060.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "the perception especially about logistic regression I think all of you should know about from your first semester right."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide60_0010-0020.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide60_0010-0020.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "the non parametric models they just they need just that those models vary depending on dataset they don't care."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide60_0070-0080.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide60_0070-0080.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "for majority of those kinds of methods we will cover the rest of the semester you will see about that."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide60_0120-0128.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide60_0120-0128.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "predictor labels right however why important the process is called feature extraction well done."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide62_0050-0060.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide62_0050-0060.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "method to extract some key features from data so here it is the images the key feature"
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide62_0100-0110.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide62_0100-0110.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "you will get more sense of it."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide62_0160-0163.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide62_0160-0163.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "based on some clustering method right for example that like some knn k nearest neighbor you will probably choose."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide63_0040-0050.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide63_0040-0050.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "those two different classes this is cool called unsupervised learning."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide63_0090-0097.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide63_0090-0097.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "anyway you guys will learn more details that in the AI artificial intelligence class or reinforcement learning class and specifically for."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide64_0090-0100.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide64_0090-0100.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# Inference run for clip_slide65_0010-0020: synthesize the transcript below and save it as a WAV file.
filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide65_0010-0020.wav" # change this to your desired output path
text_prompt = "we only utilize a kind of traditional machine learning models for example I like the decision tree the SVM the KNN the MLP."

# voice_name is forwarded as the history prompt to the coarse and fine stages only;
# the semantic stage runs without one (use_semantic_history_prompt=False).
audio_array = generate_with_settings(
    text_prompt,
    voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide65_0010-0020.npz",
    # semantic stage sampling
    semantic_temp=0.8, semantic_top_k=50, semantic_top_p=0.99,
    use_semantic_history_prompt=False,
    # coarse stage sampling
    coarse_temp=0.8, coarse_top_k=50, coarse_top_p=0.95,
    use_coarse_history_prompt=True,
    # fine stage sampling
    fine_temp=0.7,
    use_fine_history_prompt=True,
    output_full=False,
)

# Persist the generated audio, then print a separator so consecutive runs are easy to tell apart in the output.
write_wav(filename=filepath, rate=SAMPLE_RATE, data=audio_array)
print("--------------------------------------------")

# Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "works support vector machine and the symbolic functions we have decision trees processional logic rules for the first."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide66_0010-0020.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide66_0010-0020.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "for example this is very about the medical diseases diagnosis is left for about this image any idea about this image."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide68_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide68_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "your eyes where is your nose where is your mouse right it's funny areas right it's really about personal identification so."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide69_0010-0020.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide69_0010-0020.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "just tries to shoot a posture."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide71_0010-0012.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide71_0010-0012.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "right and theres thats theres some repetitive tasks for some tasks that you will repeatedly do it so."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide76_0030-0040.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide76_0030-0040.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "example like packaging the first need is to recollect objects so then you can package those objects."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide77_0020-0028.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide77_0020-0028.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "and also about military suits or about this case try to do some detections some problem of it."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide82_0010-0018.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide82_0010-0018.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "you do not want to break it either to break the object or to break the robot itself what about this cleaner."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide84_0040-0050.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide84_0040-0050.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "and this is a famous sentence from Birgitte that a breakthrough in machine learning will be worth ten microsofts is that."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide87_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide87_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "for example you guys have such a lot of those questions like machine learning and then thats the key reason you guys need to start in this."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide89_0040-0050.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide89_0040-0050.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "remind this class I will require you guys also to provide some answers from chat gpt answers okay so basically which means that."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide90_0040-0050.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide90_0040-0050.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "so for example here is the example from me from me and since this is for the examples from the chat gpt but the question what is."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide91_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide91_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "well you cannot beat a machine right you cannot beat the a chat gpt with a good answer right try to avoid that okay others probably."
# filepath = "/content/drive/MyDrive/output/test_inference_output/clip_slide91_0070-0080.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide91_0070-0080.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "so next I want to briefly mention about the history of the machine learning."
# filepath = "/content/drive/MyDrive/output/test_inference_output/slide31.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/slide31.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "and also you know about the space robot that I mentioned before to try to explore the mars right."
# filepath = "/content/drive/MyDrive/output/test_inference_output/slide83.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/slide83.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

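### Validation Inference

Each cell below handles one validation clip: it synthesizes the clip's transcript with `generate_with_settings`, using the clip's token file (`Course_Audio/tokens/<clip>.npz`) as the voice prompt, and writes the audio to `output/validation_inference_output/<clip>.wav`. Uncomment a cell to run it.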

In [None]:
# text_prompt = "Directions. So first of all, I will majorly talk about my papers. I'll focus on transfer learning. So Especially, I focused on."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide2_0020-0030.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide2_0020-0030.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Outline of the clipart domain. So now you will observe the difference between those two domains if you apply this on existing machine learning models."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide3_0040-0050.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide3_0040-0050.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "A very good accurate result because you see the difference between your tumor images and the flare images are even worse, your system."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide3_0090-0100.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide3_0090-0100.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Shoes, how monkey changes in the interviewer working human being. Right? So this corresponding to those plan."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide4_0020-0030.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide4_0020-0030.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "And, specifically, we are reluctant to the outcome of diseases. If you found that your Cox group time is very small."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide5_0050-0060.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide5_0050-0060.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Just a few of them can get diseases, but then later, you will see some of a lot of them."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide7_0040-0046.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide7_0040-0046.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "The yellow color means the birdsong one, here, and the blue color means the birdsong two. So this is becomes."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide10_0020-0030.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide10_0020-0030.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Is our final scores. Right?"
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide12_0030-0033.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide12_0030-0033.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Of you guys, but not the, all of you. I did not speak in this matter, and then see you guys to come. Feel free to stop your."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide15_0020-0030.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide15_0020-0030.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "I will get it. But finally, I will only select the highest selection of them for your final grade. And lastly, it's about the final project."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide18_0030-0040.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide18_0030-0040.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "And I think any of you are from the first semester? No? It's from the second semester. You should know about this."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide19_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide19_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "To implement or reimplement this decision tree from scratch. So so then during this this homework you."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide20_0100-0110.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide20_0100-0110.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Professor, so here, in the big picture of machine learning, just a particular way, we are start from artificial"
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide22_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide22_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "So we will talk about AI a little bit for other differences between AI and the machine learning has already noticed in in this."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide22_0090-0100.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide22_0090-0100.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "But the reasoning reasoning is a way to infer facts from existing data it is a general process of thinking rationally"
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide26_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide26_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "So what about the bottleneck of the AI? So actually it's just about abstraction and reasoning, the key reasoning is about for the."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide28_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide28_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Robust AI is the AI only here just mentioned like of five different aspects like the."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide29_0020-0030.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide29_0020-0030.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Professor, now let's talk about what is different between AI and the machine learning. So you already noticed that machine learning is just a branch."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide30_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide30_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Have another kind of labeled datasets, but we will use this this time, and we will try to use trained machine learning models based on training stage. We."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide30_0150-0160.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide30_0150-0160.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Ago, but that is in the nineteen fifties. The first light of machine learning is very related to the trick player. So."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide32_0010-0020.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide32_0010-0020.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Your your time series data and the year, another stage of of machine learning is called prediction or called the test stage. We."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide30_0140-0150.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide30_0140-0150.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "In the nineteen seventees, we also have other common algorithms."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide32_0040-0046.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide32_0040-0046.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "so um, is going to increase that economy."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide34_0050-0055.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide34_0050-0055.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "The human mind is a set of cognitive, gadgets and, supposed to learn."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide36_0030-0039.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide36_0030-0039.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "We probably noticed that our eyes can take an image like every two hundred milliseconds and we have."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide37_0030-0040.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide37_0030-0040.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "And then another good question about how machine learning is different from traditional programming. Here's an example here. If I."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide38_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide38_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "We really talk about some in the early stage without computer vision problems, but what the kind of."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide38_0050-0060.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide38_0050-0060.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Solution to your classmates so let's see student 3 can I say something? Professor, professor, do you have another?"
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide38_0110-0120.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide38_0110-0120.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Whether that is correct, but one question is, is that enough? How many those standard if if else statements do need to."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide39_0040-0050.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide39_0040-0050.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "You have more and more data, definitely, your machine learning algorithm can output a good accuracy, but we are hearing about that."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide42_0020-0030.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide42_0020-0030.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "If you have your own dataset, dataset especially in industry, every company even has their own dataset. Right?"
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide46_0030-0040.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide46_0030-0040.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "And also, in the video recognition with machine learning to try to recognize whether this is a dog or whether that is."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide49_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide49_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Is really not a corpuscle sum. Remember, my previous slide is this part is really about corpuscle sum, this part and this part. So."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide55_0010-0020.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide55_0010-0020.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Another class for the artificial intelligence. Probably, I will teach it next semester. It depends on whether it is we have a lot we have."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide57_0010-0020.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide57_0010-0020.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Is this slide is more about it's just classified into three. And in the previous slide, we."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide59_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide59_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "About this logistic regression, about the support vector machine, SVM, and also about the neural networks. So all of those."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide60_0020-0030.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide60_0020-0030.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Dimensionality. The dimensionality reduction mentioned, like the PCA, like factor analysis, and so on. All of those are some."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide61_0020-0030.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide61_0020-0030.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Extra features. But in your another different, learning class, we will talk about how to extract those deep features or the traditional features."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide62_0130-0140.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide62_0130-0140.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Step. Right? You'll make some reward. You will get some scores or you will lost the scores. So that is probably reward here. But."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide64_0080-0090.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide64_0080-0090.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "All the predictive logic, and we have for the instant based functions. We have k nearest neighbor, and we have the case based."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide66_0020-0030.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide66_0020-0030.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "To unlock home using your finger. Right? In the early world, the windows like two thousand six and something like that."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide70_0010-0020.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide70_0010-0020.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Of some labels of those different objects like the cars, the roads, the trees. Right? All different kinds of labels. Yes?"
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide72_0010-0019.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide72_0010-0019.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "She'll learning to do that."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide74_0010-0012.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide74_0010-0012.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# Generate speech for one validation clip and save it as a WAV file.
#
# The clip id is declared once and both the voice-prompt (.npz) path and the
# output (.wav) path are derived from it, so the two cannot drift apart when
# this cell is copied for another clip.
clip_name = "clip_slide77_0010-0020"
text_prompt = "Material handling, some like packaging, machine loading, all kinds of different robotics. They have some machine learning algorithm inside for."

# change these to your desired output / voice-prompt locations
filepath = f"/content/drive/MyDrive/output/validation_inference_output/{clip_name}.wav"
voice_prompt_path = f"/content/drive/MyDrive/Course_Audio/tokens/{clip_name}.npz"

audio_array = generate_with_settings(
    text_prompt,
    # sampling settings for the semantic (text -> semantic tokens) stage
    semantic_temp=0.80,
    semantic_top_k=50,
    semantic_top_p=0.99,
    # sampling settings for the coarse stage
    coarse_temp=0.80,
    coarse_top_k=50,
    coarse_top_p=0.95,
    # sampling temperature for the fine stage
    fine_temp=0.70,
    voice_name=voice_prompt_path,
    # The voice prompt is passed as history to the coarse and fine stages only;
    # the semantic stage runs with history_prompt=None.
    use_semantic_history_prompt=False,
    use_coarse_history_prompt=True,
    use_fine_history_prompt=True,
    output_full=False
)

write_wav(filepath, SAMPLE_RATE, audio_array)
print("--------------------------------------------")

# Uncomment to listen to the result inline:
# Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "By others. So many inspections and blah blah as they assume can some kind of robotics you might have already."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide84_0010-0020.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide84_0010-0020.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Here's about your heart rate or some kind of measurement. All the all of them are machines. Right?"
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide85_0020-0027.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide85_0020-0027.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "And you you definitely have more chance to get those three parts I list For example, the artificial intelligence engineering, some machine learning engineer."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide89_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide89_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Some come some sentences copy from online. You will probably have some trouble with that. I think you guys have already."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide90_0090-0100.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide90_0090-0100.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "That's about my last slide. I hope you guys have can any question re regarding the to any questions. Okay? Okay?"
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide91_0080-0089.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide91_0080-0089.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "So, here's just about some automotive kind of machine here."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/slide79.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/slide79.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Explain what is domain adaptation mean here. Next, I'm interested in manifold."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide2_0030-0040.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide2_0030-0040.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Between your source domain and the target domain. So here, for example, those last three objects are from product domain, and here is just about."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide3_0030-0040.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide3_0030-0040.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "The images and the task. Right? And then this is the problem of the domain adaptation that we want to mitigate. The difference between our training and our test."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide3_0110-0120.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide3_0110-0120.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "So here, it's especially referred to the corpuscle sum, which is one of our brain structures that is related to your."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide5_0040-0050.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide5_0040-0050.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "After that, we can do some kind of process of the audios, but eventually upload and get some segmentation model. We can try to."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide8_0020-0030.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide8_0020-0030.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Becomes an image problem. Right?"
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide10_0030-0033.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide10_0030-0033.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "So here is a textbook. You guys might need to read. It is called, like, bible in machine learning field. In it is."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide13_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide13_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Okay?"
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide14_0040-0040.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide14_0040-0040.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "And also I will even next week, I will try to give you guys a quick review of some math that is required in this class And I think."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide17_0010-0020.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide17_0010-0020.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Exams or final exams. Are you ready? Complete? No? No? Nobody likes exams? Okay. So let's."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide18_0090-0100.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide18_0090-0100.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "And again, about the details of our class schedule, so we are in the first week. And then next week, we will talk about best."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide20_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide20_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "All like, all the contents in this machine learning course are very important to you because of your future, interviews."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide20_0070-0080.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide20_0070-0080.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Learning, and what is the future of it? Maybe next class, I will I want to give you guys a little bit easy stuff like that, And."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide20_0200-0210.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide20_0200-0210.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Exactly. You got it. In the next few slides, we are the first using AI and then we are talking about the machine learning."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide22_0080-0090.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide22_0080-0090.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Professor, what about abstraction? So abstraction is a fundamental mechanism underlying both human and artificial."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide27_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide27_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "If you want machine learning to do some tasks that have never turned before, it is very challenging for them."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide28_0030-0038.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide28_0030-0038.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Several different types like unsupervised learning, supervised learning, we also have reinforcement learning, etcetera, yeah."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide29_0140-0150.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide29_0140-0150.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Image of a cat. The label is a cat. You have labeled it, so it is a labeled dataset. Right? So for example."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide30_0120-0130.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide30_0120-0130.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "So out of that, in the next decade, like, two thousand and ten, the deep learning is most likely everyday work."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide34_0040-0050.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide34_0040-0050.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "and definitely you can avoide providing some mistakes."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide37_0090-0094.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide37_0090-0094.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Is some kind of advanced solution."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide38_0150-0153.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide38_0150-0153.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "So also try to get some better results. Then models will be allowed to get an application plan."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide42_0040-0049.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide42_0040-0049.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "And give you some exceeding news that you are about that. Right? But I keep giving you some coming out in this field."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide46_0070-0080.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide46_0070-0080.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Recommendation like a home assistant, they are uniquely, and we are uniquely. Everybody is a unique person. Right? We have lots."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide52_0010-0020.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide52_0010-0020.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "And, also, there are lots of related displays. For example, it is directly related to the AI. I think you guys, We."
# filepath = "/content/drive/MyDrive/output/validation_inference_output/clip_slide57_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.80,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.80,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.70,
#     voice_name="/content/drive/MyDrive/Course_Audio/tokens/clip_slide57_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)
# print("--------------------------------------------")

# # Audio(audio_array, rate=SAMPLE_RATE)

## Output inference for all audio in the train, validation, and test datasets

In [None]:
# from tqdm import tqdm 
# def generate_and_save(text_prompt, output_path, voice_name):
#   """
#   Generates audio from a text prompt and writes it to a WAV file (inline playback is optional and disabled by default).

#   Args:
#       text_prompt: Text prompt for speech generation.
#       output_path: Path to save the generated audio file (WAV format).
#       voice_name: Path to the speaker prompt file (`.npz` format), used as the history prompt for the coarse and fine stages.
#   """
#   audio_array = generate_with_settings(text_prompt,
#                                        semantic_temp=0.80,
#                                        semantic_top_k=50,
#                                        semantic_top_p=0.99,
#                                        coarse_temp=0.80,
#                                        coarse_top_k=50,
#                                        coarse_top_p=0.95,
#                                        fine_temp=0.70,
#                                        voice_name=voice_name,
#                                        use_semantic_history_prompt=False,
#                                        use_coarse_history_prompt=True,
#                                        use_fine_history_prompt=True,
#                                        output_full=False)
#   write_wav(output_path, SAMPLE_RATE, audio_array)
#   # Audio(audio_array, rate=SAMPLE_RATE)  # Optional: Play the generated audio

# def load_filepaths_and_text(filename, split="|"):
#   with open(filename, encoding='utf-8', errors='ignore') as f:
#       filepaths_and_text = [line.strip().split(split) for line in f]
#       # base = os.path.dirname(filename)
#       # for j in range(len(filepaths_and_text)):
#       #     filepaths_and_text[j][0] = os.path.join(base, filepaths_and_text[j][0])
#   return filepaths_and_text

# def process_data_file(data_file, output_folder):
#   """
#   Processes a data file (train.txt, valid.txt, or test.txt).

#   Args:
#       data_file: Path to the data file containing audio paths and text prompts.
#       output_folder: Base folder to save generated audio (separate subfolders for train/val/test).
#   """
#   with tqdm(total = len(load_filepaths_and_text(data_file))) as pbar:
#     for wav_path, txt in load_filepaths_and_text(data_file):
#         # Output file name is the second "/"-separated component of wav_path (adjust if the path layout differs)
#         temp = wav_path.split("/")[1]
#         output_path = os.path.join(output_folder, f"{temp}")  # output_folder selects the train/validation/test destination

#       #   print(wav_path)

#       #   print(output_path)
#         # print(txt)

#         # Construct voice encoder path based on audio filename
#         voice_path = os.path.join(data_folder, 'tokens', os.path.basename(wav_path).replace('.wav', '.npz')).replace("\\", "/")
#       #   print(voice_path)

#         # Generate and save audio
#         generate_and_save(txt, output_path, voice_path)
#         pbar.update(1)

# # Define your data folders
# data_folder = "/content/drive/MyDrive/Course_Audio/"
# # output_folder_train = "/content/drive/MyDrive/output/train_inference_output/"
# output_folder_valid = "/content/drive/MyDrive/output/validation_inference_output/"
# # output_folder_test = "/content/drive/MyDrive/output/test_inference_output/"

# # Process the data file for each split (enable the call for the split you want to run)
# # process_data_file(os.path.join(data_folder, "train.txt"), output_folder_train)
# process_data_file(os.path.join(data_folder, "sample_valid.txt"), output_folder_valid)
# # process_data_file(os.path.join(data_folder, "sample_test.txt"), output_folder_test)


In [None]:
# text_prompt = "These are about reason why the labeling is now still very challenging. Also, we have so many different implementing models or."
# filepath = "/content/drive/MyDrive/output/test_clip_slide29_0120-0130.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.7,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.7,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.5,
#     voice_name="/content/drive/MyDrive/Course Audio/tokens/clip_slide29_0120-0130.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)

# Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "And check to make some predictions for the test dataset set and then even we want to evaluate the performance."
# filepath = "/content/drive/MyDrive/output/test_clip_slide30_0160-0170.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.7,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.7,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.5,
#     voice_name="/content/drive/MyDrive/Course Audio/tokens/clip_slide30_0160-0170.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)

# Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "We can make a classifier like logistic logistic stick regression, a classifier on a gradient boosting classifier, which classify"
# filepath = "/content/drive/MyDrive/output/test_clip_slide38_0130-0140.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.7,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.7,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.5,
#     voice_name="/content/drive/MyDrive/Course Audio/tokens/clip_slide38_0130-0140.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)

# Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "And even we can use machine learning to help us exploring something that not exist. For example, the navigation task because our human has."
# filepath = "/content/drive/MyDrive/output/test_clip_slide54_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.7,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.7,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.5,
#     voice_name="/content/drive/MyDrive/Course Audio/tokens/clip_slide54_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)

# Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "But the reasoning reasoning is a way to infer facts from existing data it is a general process of thinking rationally."
# filepath = "/content/drive/MyDrive/output/test_clip_slide26_0000-0010.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.7,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.7,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.5,
#     voice_name="/content/drive/MyDrive/Course Audio/tokens/clip_slide26_0000-0010.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)

# Audio(audio_array, rate=SAMPLE_RATE)

In [None]:
# text_prompt = "Some come some sentences copy from online. You will probably have some trouble with that. I think you guys have already."
# filepath = "/content/drive/MyDrive/output/test_clip_slide90_0090-0100.wav" # change this to your desired output path

# audio_array = generate_with_settings(
#     text_prompt,
#     semantic_temp=0.7,
#     semantic_top_k=50,
#     semantic_top_p=0.99,
#     coarse_temp=0.7,
#     coarse_top_k=50,
#     coarse_top_p=0.95,
#     fine_temp=0.5,
#     voice_name="/content/drive/MyDrive/Course Audio/tokens/clip_slide90_0090-0100.npz",
#     use_semantic_history_prompt=False,
#     use_coarse_history_prompt=True,
#     use_fine_history_prompt=True,
#     output_full=False
# )

# write_wav(filepath, SAMPLE_RATE, audio_array)

# Audio(audio_array, rate=SAMPLE_RATE)