In [11]:
import os
from urllib.parse import quote

import pandas as pd
import requests
from tqdm.notebook import tqdm

In [12]:
def download_mirna_files(excel_path, output_dir='downloaded_files', timeout=30):
    """Download one ENCORI ``.xls`` export per unique miRNA listed in a workbook.

    The workbook is read with ``pandas.read_excel`` and the names are taken
    from its ``miRNA`` column. Null and blank cells are skipped, values are
    converted to text and stripped of surrounding whitespace, and duplicates
    are downloaded only once.

    Parameters
    ----------
    excel_path : str or path-like
        Excel file containing a ``miRNA`` column.
    output_dir : str, optional
        Directory the downloaded files are written to; created if missing.
    timeout : float or tuple, optional
        Timeout in seconds passed to ``requests.get`` so that a stalled
        connection cannot block the loop forever.

    Returns
    -------
    None
        Files are written to ``output_dir``. A failed download is reported
        with ``print`` and the loop continues with the next miRNA.

    Raises
    ------
    KeyError
        If the workbook has no ``miRNA`` column.
    """
    # Read the Excel workbook
    df = pd.read_excel(excel_path)

    # Normalise the 'miRNA' column: drop nulls, force text (cells may hold
    # non-string values), trim whitespace, and discard now-empty entries.
    names = df['miRNA'].dropna().astype(str).str.strip()
    miRNAs = names[names != ''].unique()  # unique() avoids duplicate downloads

    # Create the output directory if it doesn't exist
    os.makedirs(output_dir, exist_ok=True)

    # Download files with progress bar
    for miRNA in tqdm(miRNAs, desc='Downloading files'):
        try:
            # Percent-encode the name so characters such as '&', '#' or ' '
            # cannot break the query string.
            url = (
                'https://rnasysu.com/encori/moduleDownload.php'
                '?source=agoClipRNA&type=xls'
                f"&value=hg38;lncRNA;{quote(miRNA, safe='')};1;0;0;1;None;all"
            )

            # Send request; the timeout bounds how long one download may hang
            response = requests.get(url, timeout=timeout)
            response.raise_for_status()  # Check for HTTP errors

            # Save file ('/' in a name would otherwise be read as a directory)
            filename = os.path.join(output_dir, f"{miRNA.replace('/', '_')}.xls")
            with open(filename, 'wb') as f:
                f.write(response.content)

        except (requests.RequestException, OSError) as e:
            # Best effort: report network/HTTP/filesystem failures and move on.
            print(f"Error downloading {miRNA}: {e}")


In [13]:
# Run the download for every miRNA listed in get_id.xlsx (path is relative to
# the notebook's working directory).
download_mirna_files('get_id.xlsx')

Downloading files:   0%|          | 0/11 [00:00<?, ?it/s]