In [3]:
import json
import torchaudio
import warnings
from tqdm import tqdm

warnings.filterwarnings("ignore")

In [2]:
def json_loader(file_path):
    data = []
    with open(file_path, 'r', encoding='utf-8') as f:
        for line in f:
            data.append(json.loads(line))
    return data

def audio_checker(file_path):
    try:
        waveform, sample_rate = torchaudio.load(file_path)
        return True
    except Exception as e:
        print(f"Error loading {file_path}: {e}")
        return False

def check_main(data):
    for entry in tqdm(data, total=len(data)):
        conversations = entry.get('conversation', [])
        for turn in conversations:
            message_type = turn.get('message_type', '')
            if message_type == 'audio':
                audio_path = turn.get('content', '')
                if not audio_checker(audio_path):
                    print(f"Invalid audio file: {audio_path}")

In [4]:
train_file = "/mnt/pfs_l2/jieti_team/SFT/hupeng/Kimi-Audio/data/sft/train/sft_train_with_semantic_codes.json"
eval_file = "/mnt/pfs_l2/jieti_team/SFT/hupeng/Kimi-Audio/data/sft/eval/sft_eval_with_semantic_codes.json"

train_json = json_loader(train_file)
eval_json = json_loader(eval_file)

In [22]:
check_main(train_json)

 44%|████▍     | 21965/49518 [03:17<03:40, 124.68it/s]

Error loading /mnt/pfs_l2/jieti_team/SFT/hupeng/data/tal-k12/wavs/wav_batch5/17021228217021183134396510658560.wav: Failed to decode audio.
Invalid audio file: /mnt/pfs_l2/jieti_team/SFT/hupeng/data/tal-k12/wavs/wav_batch5/17021228217021183134396510658560.wav


 46%|████▋     | 22924/49518 [03:24<03:17, 134.39it/s]

Error loading /mnt/pfs_l2/jieti_team/SFT/hupeng/data/tal-k12/wavs/wav_batch6/17020125514461182671889533816832.wav: Failed to decode audio.
Invalid audio file: /mnt/pfs_l2/jieti_team/SFT/hupeng/data/tal-k12/wavs/wav_batch6/17020125514461182671889533816832.wav


 55%|█████▌    | 27312/49518 [03:58<02:48, 131.70it/s]

Error loading /mnt/pfs_l2/jieti_team/SFT/hupeng/data/tal-k12/wavs/wav_batch6/17021841281871183391534544900096.wav: Failed to decode audio.
Invalid audio file: /mnt/pfs_l2/jieti_team/SFT/hupeng/data/tal-k12/wavs/wav_batch6/17021841281871183391534544900096.wav


 58%|█████▊    | 28720/49518 [04:09<02:43, 126.95it/s]

Error loading /mnt/pfs_l2/jieti_team/SFT/hupeng/data/tal-k12/wavs/wav_batch5/17031578393741187475575272439808.wav: Failed to decode audio.
Invalid audio file: /mnt/pfs_l2/jieti_team/SFT/hupeng/data/tal-k12/wavs/wav_batch5/17031578393741187475575272439808.wav


 59%|█████▉    | 29385/49518 [04:14<02:30, 133.90it/s]

Error loading /mnt/pfs_l2/jieti_team/SFT/hupeng/data/tal-k12/wavs/wav_batch7-10/17037737716781190058982598795264.wav: Failed to decode audio.
Invalid audio file: /mnt/pfs_l2/jieti_team/SFT/hupeng/data/tal-k12/wavs/wav_batch7-10/17037737716781190058982598795264.wav


 72%|███████▏  | 35575/49518 [05:02<01:41, 137.62it/s]

Error loading /mnt/pfs_l2/jieti_team/SFT/hupeng/data/tal-k12/wavs/wav_batch1-3/16999376908581173969293471141888.wav: Failed to decode audio.
Invalid audio file: /mnt/pfs_l2/jieti_team/SFT/hupeng/data/tal-k12/wavs/wav_batch1-3/16999376908581173969293471141888.wav


 76%|███████▌  | 37468/49518 [05:16<01:28, 136.24it/s]

Error loading /mnt/pfs_l2/jieti_team/SFT/hupeng/data/tal-k12/wavs/wav_batch6/17021841281871183391534544900096.wav: Failed to decode audio.
Invalid audio file: /mnt/pfs_l2/jieti_team/SFT/hupeng/data/tal-k12/wavs/wav_batch6/17021841281871183391534544900096.wav


 85%|████████▍ | 42090/49518 [05:50<00:53, 137.61it/s]

Error loading /mnt/pfs_l2/jieti_team/SFT/hupeng/data/tal-k12/wavs/wav_batch7-10/17037737716781190058982598795264.wav: Failed to decode audio.
Invalid audio file: /mnt/pfs_l2/jieti_team/SFT/hupeng/data/tal-k12/wavs/wav_batch7-10/17037737716781190058982598795264.wav


 87%|████████▋ | 43273/49518 [05:59<00:43, 142.30it/s]

Error loading /mnt/pfs_l2/jieti_team/SFT/hupeng/data/tal-k12/wavs/wav_batch5/17031578393741187475575272439808.wav: Failed to decode audio.
Invalid audio file: /mnt/pfs_l2/jieti_team/SFT/hupeng/data/tal-k12/wavs/wav_batch5/17031578393741187475575272439808.wav


 88%|████████▊ | 43577/49518 [06:01<00:43, 135.31it/s]

Error loading /mnt/pfs_l2/jieti_team/SFT/hupeng/data/tal-k12/wavs/wav_batch6/17020125514461182671889533816832.wav: Failed to decode audio.
Invalid audio file: /mnt/pfs_l2/jieti_team/SFT/hupeng/data/tal-k12/wavs/wav_batch6/17020125514461182671889533816832.wav


100%|██████████| 49518/49518 [06:46<00:00, 121.82it/s]


In [5]:
check_main(eval_json)

  0%|          | 0/5394 [00:00<?, ?it/s]

100%|██████████| 5394/5394 [00:45<00:00, 118.92it/s]
