In [3]:
import sys
import torch
import f5_tts

# Environment sanity check: report which interpreter and PyTorch build the
# kernel is running, and whether it lives inside a virtual environment.
print(f"✅ Python: {sys.executable}")
print(f"✅ PyTorch: {torch.__version__}")
# Reaching this line means the `import f5_tts` at the top of the cell succeeded.
print("✅ F5-TTS importado")

# Inside a virtual environment sys.prefix points at the venv while
# sys.base_prefix still points at the base installation. Unlike a '.venv'
# substring test on the interpreter path, this works whatever the venv
# directory happens to be called.
in_venv = sys.prefix != sys.base_prefix
print(f"\n🔍 ¿Usando venv?: {in_venv}")

✅ Python: /mnt/c/Users/noel_/Desktop/TTS_HF/voice-clone-comparison/.venv/bin/python
✅ PyTorch: 2.8.0+cu128
✅ F5-TTS importado

🔍 ¿Usando venv?: True


In [6]:
# Probe a handful of F5-TTS submodules to find usable classes/functions.
# importlib is imported in this cell so it does not depend on earlier kernel
# state: on a fresh kernel a missing import would raise NameError inside the
# try block and every module would be reported as failed without explanation.
import importlib

submodules_v2 = [
    'f5_tts.infer.utils_infer',
    'f5_tts.model.model',
    'f5_tts.model.cfm',
    'f5_tts.infer.infer_process',
]


def probe_module(module_name):
    """Try to import ``module_name`` and list its public callables.

    Args:
        module_name: Dotted module path handed to ``importlib.import_module``.

    Returns:
        A ``(ok, names, error)`` tuple. On success ``ok`` is True, ``names``
        holds every attribute of the module that is callable and does not
        start with an underscore (in ``dir()`` order), and ``error`` is None.
        On failure ``ok`` is False, ``names`` is empty and ``error`` is the
        exception that was raised.
    """
    try:
        mod = importlib.import_module(module_name)
        names = [x for x in dir(mod) if not x.startswith('_') and callable(getattr(mod, x))]
    except Exception as exc:
        # Best effort: an import can fail for many reasons, so any exception is
        # handed back to the caller for reporting instead of aborting the scan.
        return False, [], exc
    return True, names, None


print("🔍 Buscando módulos internos:")
print("-" * 40)

for module_name in submodules_v2:
    ok, funcs, error = probe_module(module_name)
    if not ok:
        # Show why the import failed rather than only that it failed.
        print(f"❌ {module_name} ({type(error).__name__}: {error})")
        continue

    print(f"✅ {module_name}")
    if funcs:
        # Only the first five names are shown to keep the listing short.
        print(f"   └─ Funciones: {', '.join(funcs[:5])}")

🔍 Buscando módulos internos:
----------------------------------------
✅ f5_tts.infer.utils_infer
   └─ Funciones: AudioSegment, CFM, ThreadPoolExecutor, Vocos, chunk_text
❌ f5_tts.model.model
✅ f5_tts.model.cfm
   └─ Funciones: CFM, Callable, MelSpec, default, exists
❌ f5_tts.infer.infer_process


In [8]:
# List every public attribute of f5_tts.infer.utils_infer, grouped into
# functions, classes and everything else.
import inspect

from f5_tts.infer import utils_infer

print("🔍 Todos los elementos de utils_infer:")
print("-" * 40)

# All public (non-underscore) attribute names of the module.
all_items = [x for x in dir(utils_infer) if not x.startswith('_')]

# Buckets, filled in dir() order.
functions = []
classes = []
variables = []

for item_name in all_items:
    item = getattr(utils_infer, item_name)

    if inspect.isfunction(item):
        functions.append(item_name)
    elif inspect.isclass(item):
        # isclass() also recognises classes built by a custom metaclass
        # (e.g. ABCMeta), whose type name is not the literal string 'type'.
        classes.append(item_name)
    else:
        # Modules, constants, builtins, instances, ... shown with their type name.
        variables.append(f"{item_name} ({type(item).__name__})")

print(f"\n📚 FUNCIONES ({len(functions)}):")
for f in functions:
    print(f"   • {f}")

print(f"\n🏗️ CLASES ({len(classes)}):")
for c in classes:
    print(f"   • {c}")

# Only the first few variables are listed; the header still reports the total.
max_variables_shown = 10
print(f"\n🔧 VARIABLES ({len(variables)}):")
for v in variables[:max_variables_shown]:
    print(f"   • {v}")
if len(variables) > max_variables_shown:
    # Make the truncation explicit so the count above does not look wrong.
    print(f"   … y {len(variables) - max_variables_shown} más")

🔍 Todos los elementos de utils_infer:
----------------------------------------

📚 FUNCIONES (17):
   • chunk_text
   • convert_char_to_pinyin
   • files
   • get_tokenizer
   • hf_hub_download
   • infer_batch_process
   • infer_process
   • initialize_asr_pipeline
   • load_checkpoint
   • load_model
   • load_vocoder
   • pipeline
   • preprocess_ref_audio_text
   • remove_silence_edges
   • remove_silence_for_generated_wav
   • save_spectrogram
   • transcribe

🏗️ CLASES (4):
   • AudioSegment
   • CFM
   • ThreadPoolExecutor
   • Vocos

🔧 VARIABLES (29):
   • asr_pipe (NoneType)
   • cfg_strength (float)
   • cross_fade_duration (float)
   • device (str)
   • fix_duration (NoneType)
   • hashlib (module)
   • hop_length (int)
   • matplotlib (module)
   • mel_spec_type (str)
   • n_fft (int)


In [9]:
# Bring the three inference entry points into the notebook namespace.
from f5_tts.infer.utils_infer import (
    infer_process,
    load_model,
    load_vocoder,
)

# Banner (title line followed by a 50-character rule), then the built-in
# help text for infer_process.
print("📖 Documentación de infer_process:", "=" * 50, sep="\n")
help(infer_process)

📖 Documentación de infer_process:
Help on function infer_process in module f5_tts.infer.utils_infer:

infer_process(ref_audio, ref_text, gen_text, model_obj, vocoder, mel_spec_type='vocos', show_info=<built-in function print>, progress=<module 'tqdm' from '/mnt/c/Users/noel_/Desktop/TTS_HF/voice-clone-comparison/.venv/lib/python3.12/site-packages/tqdm/__init__.py'>, target_rms=0.1, cross_fade_duration=0.15, nfe_step=32, cfg_strength=2.0, sway_sampling_coef=-1.0, speed=1.0, fix_duration=None, device='cuda')



In [10]:
# Blank line, title and a 50-character rule, then the built-in help text for
# load_model.
print("\n📖 Documentación de load_model:", "=" * 50, sep="\n")
help(load_model)


📖 Documentación de load_model:
Help on function load_model in module f5_tts.infer.utils_infer:

load_model(model_cls, model_cfg, ckpt_path, mel_spec_type='vocos', vocab_file='', ode_method='euler', use_ema=True, device='cuda')



In [11]:
# Blank line, title and a 50-character rule, then the built-in help text for
# load_vocoder.
print("\n📖 Documentación de load_vocoder:" + "\n" + "=" * 50)
help(load_vocoder)


📖 Documentación de load_vocoder:
Help on function load_vocoder in module f5_tts.infer.utils_infer:

load_vocoder(vocoder_name='vocos', is_local=False, local_path='', device='cuda', hf_cache_dir=None)
    # load vocoder



In [None]:
# NOTE(review): this cell repeats the earlier load_model help cell verbatim and
# produces the same output; consider deleting it from the notebook.
header_lines = ("\n📖 Documentación de load_model:", "=" * 50)
for header_line in header_lines:
    print(header_line)
help(load_model)


📖 Documentación de load_model:
Help on function load_model in module f5_tts.infer.utils_infer:

load_model(model_cls, model_cfg, ckpt_path, mel_spec_type='vocos', vocab_file='', ode_method='euler', use_ema=True, device='cuda')

