In [16]:
import requests
import boto3
import json
from botocore.exceptions import ClientError
import os

In [17]:
AWS_REGION = "eu-west-2" # London
TARGET_BUCKET = "steve-sagemaker-data-bucket"
API_BASE_URL = "https://api.semanticscholar.org/datasets/v1/release"

SECRET_NAME = 'semanticscholar_api_key'
SECRET_KEY = 'x-api-key'

In [18]:
def get_secret(region_name, secret_name):
    # Source of the function:
    # https://eu-west-2.console.aws.amazon.com/secretsmanager/secret?name=semanticscholar_api_key#secret-details-sample-code-section
    # Create a Secrets Manager client
    session = boto3.session.Session()
    client = session.client(
        service_name='secretsmanager',
        region_name=region_name
    )

    try:
        get_secret_value_response = client.get_secret_value(
            SecretId=secret_name
        )
    except ClientError as e:
        # For a list of exceptions thrown, see
        # https://docs.aws.amazon.com/secretsmanager/latest/apireference/API_GetSecretValue.html
        raise e

    secret = json.loads(get_secret_value_response['SecretString'])
    return secret

S2_API_KEY = get_secret(AWS_REGION, SECRET_NAME)[SECRET_KEY]

In [19]:
def get_release_ids():
    """Fetching the list of dataset release IDs."""
    response = requests.get(API_BASE_URL)
    response.raise_for_status()
    res = response.json()
    print(res)
    return res


def get_latest_metadata(release_id):
    """Fetch the metadata for the latest dataset release."""
    url = f'{API_BASE_URL}/{release_id}'
    response = requests.get(url)
    response.raise_for_status()
    res_json = response.json()
    res = []
    for dataset in res_json['datasets']:
        if dataset['name'] in ['papers', 's2orc']:
            res.append(dataset)
            display(dataset)
    return res
    

def get_releases_and_metadata():
    release_ids = get_release_ids()
    latest_release_id = release_ids[-1]

    get_latest_metadata(latest_release_id)
    return latest_release_id


S2_LATEST_RELEASE_ID = get_releases_and_metadata()

['2022-05-10', '2022-05-17', '2022-05-24', '2022-05-31', '2022-06-07', '2022-06-14', '2022-06-21', '2022-06-28', '2022-07-05', '2022-07-19', '2022-07-28', '2022-08-02', '2022-08-09', '2022-08-16', '2022-08-23', '2022-08-30', '2022-09-06', '2022-09-13', '2022-09-28', '2022-10-05', '2022-10-28', '2022-11-02', '2022-11-11', '2022-11-15', '2022-11-22', '2022-12-02', '2022-12-06', '2022-12-13', '2022-12-20', '2022-12-27', '2023-01-03', '2023-01-10', '2023-01-17', '2023-01-24', '2023-01-31', '2023-02-07', '2023-02-14', '2023-02-21', '2023-02-28', '2023-03-07', '2023-03-14', '2023-03-21', '2023-03-28', '2023-04-06', '2023-04-11', '2023-04-18', '2023-05-09', '2023-05-16', '2023-05-23', '2023-05-30', '2023-06-06', '2023-06-13', '2023-06-20', '2023-07-04', '2023-07-11', '2023-07-25', '2023-08-01', '2023-08-08', '2023-08-15', '2023-08-29', '2023-09-05', '2023-09-12', '2023-09-19', '2023-09-26', '2023-10-10', '2023-10-19', '2023-10-24', '2023-10-31', '2023-11-07', '2023-11-14', '2023-11-21', '2023

{'name': 'papers',
 'description': 'The core attributes of a paper (title, authors, date, etc.).\n200M records in 30 1.5GB files.',
 'README': 'Semantic Scholar Academic Graph Datasets\n\nThe "papers" dataset provides core metadata about papers.\n\nSCHEMA\nSee https://api.semanticscholar.org/api-docs/graph#tag/Paper-Data\n\nThis dataset does not contain information about a paper\'s references or citations.\nInstead, join with citingPaperId/citedPaperId from the "citations" dataset.\n\nLICENSE\nThis collection is licensed under ODC-BY. (https://opendatacommons.org/licenses/by/1.0/)\n\nBy downloading this data you acknowledge that you have read and agreed to all the terms in this license.\n\nATTRIBUTION\nWhen using this data in a product or service, or including data in a redistribution, please cite the following paper:\n\nBibTex format:\n@misc{https://doi.org/10.48550/arxiv.2301.10140,\n  title = {The Semantic Scholar Open Data Platform},\n  author = {Kinney, Rodney and Anastasiades, Ch

{'name': 's2orc',
 'description': 'Full-body paper text parsed from open-access PDFs. Identifies structural elements such as paragraphs, sections, and bibliography entries.\n10M records in 30 4GB files.',
 'README': 'Semantic Scholar Academic Graph Datasets\n\nThe "s2orc" dataset contains parsed full-body text from selected papers.\n\nA subset of this data was previously released (in a different format) as S2ORC https://github.com/allenai/s2orc\n\nThe body text is parsed from PDF documents using Grobid, documented at https://grobid.readthedocs.io.\nIts output is converted from XML into a single string with a set of annotation spans.\n\nSCHEMA\n - externalIds: IDs of this paper in different catalogs\n - content:\n   - source:\n\t   - pdfUrls: URLs to the PDF\n\t   - oaInfo: license/url/status information from Unpaywall\n   - text: Full body text as a single string\n   - annotations: Annotated spans of the full body text\n\n\nLICENSE\nThis collection is licensed under ODC-BY. (https://op

In [20]:
def get_dataset_download_urls(release_id, dataset_name):
    """Fetch the download URL for a specific dataset."""
    url = f'{API_BASE_URL}/{release_id}/dataset/{dataset_name}'
    response = requests.get(url, headers={'x-api-key': S2_API_KEY}
)
    response.raise_for_status()
    print(json.dumps(response.json(), indent=2, default=str))
    return response.json()['files']


s2orc_file_urls = get_dataset_download_urls('2025-06-10', 's2orc')

{
  "name": "s2orc",
  "description": "Full-body paper text parsed from open-access PDFs. Identifies structural elements such as paragraphs, sections, and bibliography entries.\n10M records in 30 4GB files.",
  "README": "Semantic Scholar Academic Graph Datasets\n\nThe \"s2orc\" dataset contains parsed full-body text from selected papers.\n\nA subset of this data was previously released (in a different format) as S2ORC https://github.com/allenai/s2orc\n\nThe body text is parsed from PDF documents using Grobid, documented at https://grobid.readthedocs.io.\nIts output is converted from XML into a single string with a set of annotation spans.\n\nSCHEMA\n - externalIds: IDs of this paper in different catalogs\n - content:\n   - source:\n\t   - pdfUrls: URLs to the PDF\n\t   - oaInfo: license/url/status information from Unpaywall\n   - text: Full body text as a single string\n   - annotations: Annotated spans of the full body text\n\n\nLICENSE\nThis collection is licensed under ODC-BY. (htt

In [None]:
from tqdm import tqdm

def download_and_upload_to_s3(counter, url, dataset_id, target_bucket, aws_region="eu-west-2", force_overwrite=False):
    """
    Downloads a file from a signed S3 URL and uploads it to another S3 bucket.

    Args:
        url (str): The signed S3 URL of the file to download.
        dataset_id (str): The dataset ID to use as the prefix for the target key.
        target_bucket (str): The name of the target S3 bucket.
        aws_region (str): The AWS region of the target S3 bucket.
        force_overwrite (bool): If False, skip downloading and uploading if the file already exists in S3.

    Returns:
        None
    """
    # Extract the filename from the URL
    filename = f"{url.split('/')[-1].split('?')[0]}"
    target_filename = f'{dataset_id}-part{counter}.jsonl.gz'
    target_key = f"00_raw/{dataset_id}/{target_filename}"

    # Step 1: Check if the file already exists in S3
    s3_client = boto3.client("s3", region_name=aws_region)
    if not force_overwrite:
        try:
            s3_client.head_object(Bucket=target_bucket, Key=target_key)
            print(f"File already exists in S3: s3://{target_bucket}/{target_key}. Skipping download and upload.")
            return
        except ClientError as e:
            if e.response['Error']['Code'] != "404":
                print(f"Error checking file in S3: {e}")
                return

    # Step 2: Download the file locally with a progress bar
    local_file = target_filename  # Use the filename as the local file name
    try:
        print(f"Downloading file from {url}...")
        response = requests.get(url, stream=True)
        response.raise_for_status()
        total_size = int(response.headers.get('content-length', 0))  # Get the total file size
    
        with open(local_file, "wb") as file, tqdm(
            total=total_size, unit="B", unit_scale=True, desc="Downloading"
        ) as progress_bar:
            for chunk in response.iter_content(chunk_size=8192):
                file.write(chunk)
                progress_bar.update(len(chunk))  # Update the progress bar
        print(f"File downloaded: {local_file}")
    except Exception as e:
        print(f"Error downloading file: {e}")
        return

    # Step 3: Upload the file to the target S3 bucket
    try:
        print(f"Uploading {local_file} to S3 bucket {target_bucket}...")
        s3_client.upload_file(local_file, target_bucket, target_key)
        print(f"File uploaded to S3: s3://{target_bucket}/{target_key}")
    except Exception as e:
        print(f"Error uploading file to S3: {e}")
    finally:
        # Clean up local file
        if os.path.exists(local_file):
            os.remove(local_file)


def process_files(file_urls, dataset_id, target_bucket, force_overwrite=False, min_index=0, max_index=100000, aws_region="eu-west-2"):
    """
    Processes a list of signed S3 URLs and uploads them to the target S3 bucket.

    Args:
        file_urls (list): List of signed S3 URLs.
        dataset_id (str): The dataset ID to use as the prefix for the target key.
        target_bucket (str): The name of the target S3 bucket.
        aws_region (str): The AWS region of the target S3 bucket.
        force_overwrite (bool): If False, skip downloading and uploading if the file already exists in S3.

    Returns:
        None
    """
    counter = 0
    for url in file_urls:
        if counter >= min_index and counter < max_index:
            download_and_upload_to_s3(counter, url, dataset_id, target_bucket, aws_region, force_overwrite)
        counter += 1
    print('DONE')


dataset_id = "s2orc"
target_bucket = "bsc-final-sagemaker-data-bucket"
process_files(s2orc_file_urls, dataset_id, target_bucket, False, 212, 100000)

Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_aca9cd32-cd1b-4fc5-8aa2-c20bbfdc2947.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=K0y%2FlAuicwr8%2BkV7xfZ4D1dnyG8%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLxiu%2Fza%2FZHbzbenHchy4f0tRX69ti87s5aa3aE0%2BmmIaOM1dIsorFL4s8%2FSCAtZqHlflmaZSeCHYhtaHUQBFTuBr0TXPAIKvHdrclmzLc61KhTxctQaLVm9na0dKiwQhceMAunz5sMZAz6Spc7cqbpPhPVtElTNX%2BvpUeAmRxVZQZCmsxgZpOc6j%2Fm6E0Yui1U3q82WVa

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.4MB/s] 


File downloaded: s2orc-part212.jsonl.gz
Uploading s2orc-part212.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part212.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_acbfe4b9-fb52-4d54-9e8b-38350424f68a.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=2NRB95hHAEJ5QrV7m6xmXR4kcfE%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.7MB/s] 


File downloaded: s2orc-part213.jsonl.gz
Uploading s2orc-part213.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part213.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_ad482ad4-7c9d-44e6-9844-322b52708024.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=NkBTha3Nz71SERL7KeJAQQoA6AA%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 22.1MB/s] 


File downloaded: s2orc-part214.jsonl.gz
Uploading s2orc-part214.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part214.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_b0bbecc6-cdce-4287-8351-fe798048a624.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=ToBOATraHn6IVvntw0g82ASSz1I%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.7MB/s] 


File downloaded: s2orc-part215.jsonl.gz
Uploading s2orc-part215.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part215.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_b0f94273-13b5-4eee-a276-fb407e9fcd37.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=tXWxEYSsckjFYzQ421tm06s1XZs%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.6MB/s] 


File downloaded: s2orc-part216.jsonl.gz
Uploading s2orc-part216.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part216.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_b3270995-b3e5-471b-bfcd-06e3374de6eb.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=D4W8DbdWaOrtIVFt9ZHWmMbGs7s%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.5MB/s] 


File downloaded: s2orc-part217.jsonl.gz
Uploading s2orc-part217.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part217.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_b329e110-5659-4244-9a8d-cf12157ea01b.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=V0J60UxKph1dQTJDPYgILLUNenE%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 22.2MB/s] 


File downloaded: s2orc-part218.jsonl.gz
Uploading s2orc-part218.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part218.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_b4969170-b28e-4ffd-8db9-aeec9a3a84ac.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=T98YqzOoNCZqtF2jBOftFsG%2FYGc%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.5MB/s] 


File downloaded: s2orc-part219.jsonl.gz
Uploading s2orc-part219.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part219.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_b66d23aa-17e1-4d49-a97d-191b184750e7.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=d%2FmfoPI6%2Ba79n9AiHbu3IxFX0h4%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPW

Downloading: 100%|██████████| 1.07G/1.07G [01:01<00:00, 17.4MB/s]  


File downloaded: s2orc-part220.jsonl.gz
Uploading s2orc-part220.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part220.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_b712899e-e740-45ce-8e83-ca923ce8e6c9.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=m%2FgigvONMAR5qN7IobBE0KDCnts%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.5MB/s] 


File downloaded: s2orc-part221.jsonl.gz
Uploading s2orc-part221.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part221.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_b8041485-436e-4f22-9dc0-c65e4c6ba9a6.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=YYYHHrznpVEZm6vb5WZvad0rf4k%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 22.1MB/s] 


File downloaded: s2orc-part222.jsonl.gz
Uploading s2orc-part222.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part222.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_b89c821a-3733-43bb-b9a3-2e7ce7311eac.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=J9lUvXiLHE3g72YLdq8eqfjVnzw%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 22.3MB/s] 


File downloaded: s2orc-part223.jsonl.gz
Uploading s2orc-part223.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part223.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_b8f3aeb4-957c-4094-a761-6a408850f1c4.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=er2a1JDr4p1AieO3kDA%2FFhpE%2B1k%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPW

Downloading: 100%|██████████| 1.07G/1.07G [00:49<00:00, 21.9MB/s] 


File downloaded: s2orc-part224.jsonl.gz
Uploading s2orc-part224.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part224.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_b94930c6-ea5a-4b44-9e26-ec78082cdd1d.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=306FwmIGKTJynV8lUNV4y05gSyk%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:46<00:00, 23.3MB/s] 


File downloaded: s2orc-part225.jsonl.gz
Uploading s2orc-part225.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part225.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_b96c9793-c689-44f8-ac64-7708478dee03.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=Am7j8uBBvjyvjo1BbiZzgKuPqmI%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.4MB/s] 


File downloaded: s2orc-part226.jsonl.gz
Uploading s2orc-part226.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part226.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_bb864696-fd11-4a97-bdcd-faed06d9b688.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=s7t8k9GzspjAHPfet0nCL9xTJ9Y%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 435M/435M [00:20<00:00, 21.5MB/s] 


File downloaded: s2orc-part227.jsonl.gz
Uploading s2orc-part227.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part227.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_bc6a75c1-e656-42bd-9275-ac60d400b8e1.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=peNeWLy%2BggvthaBONP2JWS6TWmI%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:50<00:00, 21.1MB/s] 


File downloaded: s2orc-part228.jsonl.gz
Uploading s2orc-part228.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part228.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_bc792fbb-edb4-4b05-888f-d143ca03d753.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=3xgVJEBQmrOUd42WX0uGSK%2Fjlhc%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.5MB/s] 


File downloaded: s2orc-part229.jsonl.gz
Uploading s2orc-part229.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part229.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_be096cb6-827b-4244-a939-dcfec49e850a.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=uAGBklJMAXP88OlKINlscZJ%2BnqQ%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:50<00:00, 21.3MB/s] 


File downloaded: s2orc-part230.jsonl.gz
Uploading s2orc-part230.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part230.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_bff10ca6-079f-490c-a538-f195f1393f2e.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=%2BeyzYjuDZsvbgRZAkF85%2B5IMZ00%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPW

Downloading: 100%|██████████| 1.07G/1.07G [00:46<00:00, 22.9MB/s] 


File downloaded: s2orc-part231.jsonl.gz
Uploading s2orc-part231.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part231.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_c0598e4e-bcf6-43dc-81bf-2d532f381721.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=DjomSGjWmiASy9cLjhX7P4xqzkc%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 713M/713M [00:40<00:00, 17.4MB/s]  


File downloaded: s2orc-part232.jsonl.gz
Uploading s2orc-part232.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part232.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_c06e62c4-5156-40f5-a25d-e28f5c087a80.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=DXGLNW4SYQpgCs%2BcsrTWvpEQsvQ%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 22.3MB/s] 


File downloaded: s2orc-part233.jsonl.gz
Uploading s2orc-part233.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part233.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_c0b6ca4c-88ee-4625-b1ef-c9197e89c649.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=R0Saajkd5p9qxaziMJzCzynV19s%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:51<00:00, 21.0MB/s] 


File downloaded: s2orc-part234.jsonl.gz
Uploading s2orc-part234.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part234.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_c0bd459e-1fc5-4ea3-97fa-ac7b5c2f54e0.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=wYcin3o1ON7BLJcMJnaQiVZOXzc%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:50<00:00, 21.1MB/s] 


File downloaded: s2orc-part235.jsonl.gz
Uploading s2orc-part235.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part235.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_c15adfe8-22b1-4156-be70-21f4a126ac50.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=I%2Fw34c%2BZI6fwj9euL0DFIVqcXEY%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPW

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.6MB/s] 


File downloaded: s2orc-part236.jsonl.gz
Uploading s2orc-part236.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part236.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_c37311a5-c35d-4ceb-bbe2-9a399ce73122.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=ieBWnQ50Gjpi37LPzds6aGuugxY%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:49<00:00, 21.5MB/s] 


File downloaded: s2orc-part237.jsonl.gz
Uploading s2orc-part237.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part237.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_c391c1d4-a9f7-4947-aa5d-67a67e74daec.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=lQtRJIK8R%2Bzm2sVASzemuMM0u5M%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [01:01<00:00, 17.4MB/s]  


File downloaded: s2orc-part238.jsonl.gz
Uploading s2orc-part238.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part238.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_c450f944-b2d0-4a6f-ae74-f689ff3954d6.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=rsNsDnaDJ%2BqT%2BeOBvzlIC%2B8fNZk%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLW

Downloading: 100%|██████████| 544M/544M [00:27<00:00, 19.8MB/s] 


File downloaded: s2orc-part239.jsonl.gz
Uploading s2orc-part239.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part239.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_c5230f30-0f25-4ef2-8fc2-594070615e63.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=UWo873nPfe8URPX%2Bj5PWxHLuc%2B0%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPW

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 22.3MB/s] 


File downloaded: s2orc-part240.jsonl.gz
Uploading s2orc-part240.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part240.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_c59c1acc-eb1d-49c9-9906-71290fb404f6.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=wbCI4Lxp9yY4vssTf8J5P9ooZGw%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:51<00:00, 20.8MB/s] 


File downloaded: s2orc-part241.jsonl.gz
Uploading s2orc-part241.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part241.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_c74c0dc4-da3e-4c6d-9bea-e495ab25d547.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=jKQY1VW%2FvyAA288awgruDJcUps4%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.6MB/s] 


File downloaded: s2orc-part242.jsonl.gz
Uploading s2orc-part242.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part242.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_c7966968-ce83-46ea-9771-d5d87fee51f4.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=0LY5i87tJ2KR7I5PElhgTXe7QK0%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.7MB/s] 


File downloaded: s2orc-part243.jsonl.gz
Uploading s2orc-part243.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part243.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_c88386bb-fcd2-4cb3-841c-cc9bf2739b5b.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=taDhnqGNr8r%2Fd57f1L%2BjbE0qDzk%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPW

Downloading: 100%|██████████| 317M/317M [00:15<00:00, 20.9MB/s] 


File downloaded: s2orc-part244.jsonl.gz
Uploading s2orc-part244.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part244.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_c8f1132a-99c2-4a96-9eba-cf43829f253c.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=ViP%2FaOlyCM7PvBTRZXBY82NqEj8%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.5MB/s] 


File downloaded: s2orc-part245.jsonl.gz
Uploading s2orc-part245.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part245.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_c9ffc8a8-c19e-4242-abd1-c1ed918de543.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=cAa6DfapYeRWGBzcMMXSAH1MlqY%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.5MB/s] 


File downloaded: s2orc-part246.jsonl.gz
Uploading s2orc-part246.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part246.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_ce2d1448-3d15-4144-8e7c-202117833be6.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=OiW%2Fbvlik6T5WqymYS8fSzMaenQ%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 272M/272M [00:12<00:00, 21.6MB/s] 


File downloaded: s2orc-part247.jsonl.gz
Uploading s2orc-part247.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part247.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_cef37b14-85c0-4974-9521-e29dfdfd36d8.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=A4Jta5mUUsz4LzBXFImlsRuXy9A%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:49<00:00, 21.6MB/s] 


File downloaded: s2orc-part248.jsonl.gz
Uploading s2orc-part248.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part248.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_d1916f1e-d778-491b-a3d6-c8730a7c7336.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=x8dSjBmJ5vVpYczyRnYnzjK7mdA%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:46<00:00, 23.3MB/s] 


File downloaded: s2orc-part249.jsonl.gz
Uploading s2orc-part249.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part249.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_d31fb00d-ebd7-4493-94a6-7dc315f21e5c.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=xKUFJz0S0uvtQhbxleBnW%2F4Xuig%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.7MB/s] 


File downloaded: s2orc-part250.jsonl.gz
Uploading s2orc-part250.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part250.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_d3759dfb-e0a7-4e9c-aa0e-deb0d3c7bd32.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=dbl8AXGJQxwC5A%2BIDHnhH1u0b3E%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:46<00:00, 23.0MB/s] 


File downloaded: s2orc-part251.jsonl.gz
Uploading s2orc-part251.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part251.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_d3852972-f058-46c2-91bd-e280b46d18ba.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=q1NuPbINQblIwuNa5khmdxwmFXQ%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.6MB/s] 


File downloaded: s2orc-part252.jsonl.gz
Uploading s2orc-part252.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part252.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_d40373d5-8de5-49c9-a429-c5172f7e0e84.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=5ykntvZJxv%2BxLoCnZzFz2m%2FklB4%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPW

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 22.2MB/s] 


File downloaded: s2orc-part253.jsonl.gz
Uploading s2orc-part253.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part253.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_d4503dc2-bec4-4417-a989-64f9b1d6e7ce.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=AU0IcjPOE7hDvJRcw1ZbRaCbtwY%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [01:01<00:00, 17.5MB/s]  


File downloaded: s2orc-part254.jsonl.gz
Uploading s2orc-part254.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part254.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_d4571551-6e6a-4439-be2e-c5f5d45911fa.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=gMcq1XSOFPZSOxMAiTrFQ8Ig4Ag%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.5MB/s] 


File downloaded: s2orc-part255.jsonl.gz
Uploading s2orc-part255.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part255.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_d6ea2e71-423c-479e-8dbf-6e328f3bb82a.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=VsMNYFvLnOI%2Fg8o502q990uxDWY%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 22.1MB/s] 


File downloaded: s2orc-part256.jsonl.gz
Uploading s2orc-part256.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part256.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_d807dde8-7a21-433c-8e70-cdfc88f7df95.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=%2FSRnolm4s92UTX23O7S5%2BF5yrp8%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPW

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 22.1MB/s] 


File downloaded: s2orc-part257.jsonl.gz
Uploading s2orc-part257.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part257.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_d856613f-1abd-4dba-b4e8-b72fdf354652.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=VPi7yQO4prTv7bHkeCgfPMT%2FLhE%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 22.3MB/s] 


File downloaded: s2orc-part258.jsonl.gz
Uploading s2orc-part258.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part258.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_d88efc15-83bb-4b1b-8ea1-2a6f197b6ed4.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=Eupuv5qP80vVJoc3UabWFeZgsrc%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.5MB/s] 


File downloaded: s2orc-part259.jsonl.gz
Uploading s2orc-part259.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part259.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_d94e2599-eea0-4487-9fe7-dbdcd56920b9.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=sQE5m63cHXp1REX%2F9yN6bO2k9GA%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 22.1MB/s] 


File downloaded: s2orc-part260.jsonl.gz
Uploading s2orc-part260.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part260.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_da219912-be1a-49ce-a64a-c3917d42070b.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=348ZsjxjjqjreHwXjnVVdsjtuog%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:51<00:00, 20.9MB/s] 


File downloaded: s2orc-part261.jsonl.gz
Uploading s2orc-part261.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part261.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_db00e7a2-e8a2-4008-ac50-443356248505.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=tcucpqy93DfCsxgi0ALglz7vL2c%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [01:01<00:00, 17.4MB/s]  


File downloaded: s2orc-part262.jsonl.gz
Uploading s2orc-part262.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part262.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_db39296e-080b-4416-9013-4d745b84cf23.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=bXacpTpNDqUq4g13Q1Jq7HwYLrk%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.4MB/s] 


File downloaded: s2orc-part263.jsonl.gz
Uploading s2orc-part263.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part263.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_dba76d29-99ae-415c-8886-0973a0c1eb94.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=99XX7JZ44dlziKrP%2B9ax2c14oE8%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 22.2MB/s] 


File downloaded: s2orc-part264.jsonl.gz
Uploading s2orc-part264.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part264.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_dbd1f271-b452-42d0-8016-795d7f1fd1a0.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=n7tpFQhXNjZr4vsyI%2F26v7sZN74%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 22.3MB/s] 


File downloaded: s2orc-part265.jsonl.gz
Uploading s2orc-part265.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part265.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_dcfdb875-9595-472a-8e0f-5e8c0abe4de7.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=hjJSptaxs6KQYFwEKaeLxekW4jQ%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:46<00:00, 22.9MB/s] 


File downloaded: s2orc-part266.jsonl.gz
Uploading s2orc-part266.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part266.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_de589476-51db-4c3e-8a09-6d095c8ba8c0.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=sJ2cHA9SaHPuG5OjkR%2Bel6g9ujI%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.7MB/s] 


File downloaded: s2orc-part267.jsonl.gz
Uploading s2orc-part267.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part267.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_df03b22c-7b0a-43a5-ac90-ca6419bf9f80.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=DS8Q45hDBf%2FC70QyCTD8NG8CTPo%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.8MB/s] 


File downloaded: s2orc-part268.jsonl.gz
Uploading s2orc-part268.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part268.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_e07729a9-718f-47bf-b507-50a842d13817.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=CIn1aln7rq8w71vH8NQqGrOeLAw%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 22.3MB/s] 


File downloaded: s2orc-part269.jsonl.gz
Uploading s2orc-part269.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part269.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_e158c9cf-2b64-4597-adfb-ead1af629937.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=gyOaN6G8crF3n0NM%2B%2Ffz87Vj5Nk%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPW

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 22.3MB/s] 


File downloaded: s2orc-part270.jsonl.gz
Uploading s2orc-part270.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part270.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_e3c183e6-3ec8-46ab-b193-2e16341a279e.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=4HDofdAHUqveC1tQAWbQ8%2FIOlNc%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 22.2MB/s] 


File downloaded: s2orc-part271.jsonl.gz
Uploading s2orc-part271.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part271.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_e5328b4f-810f-41d2-a9cf-99d2eea7221e.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=Rdn4yFBU8T%2FQQ86Z9X6IJ0ZRZJ8%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.7MB/s] 


File downloaded: s2orc-part272.jsonl.gz
Uploading s2orc-part272.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part272.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_e6696be3-4ed2-4e37-8270-ba01975c7d5c.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=4oN5jvoaxR%2BimVxfYaDDUanYg78%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 435M/435M [00:19<00:00, 21.8MB/s] 


File downloaded: s2orc-part273.jsonl.gz
Uploading s2orc-part273.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part273.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_e733957b-7738-496e-bd79-1348b3bb79fa.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=1cUupGVFjz98mCB4UVN4WKhWCMQ%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 22.1MB/s] 


File downloaded: s2orc-part274.jsonl.gz
Uploading s2orc-part274.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part274.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_e7fa95d2-6db7-426c-bf88-fe99ee9bcb61.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=xBitZsLW106kDvjkOnIGs4Vj08U%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 22.1MB/s] 


File downloaded: s2orc-part275.jsonl.gz
Uploading s2orc-part275.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part275.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_e8905c4a-5de4-4145-b69e-8e66a3747ead.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=p4dt8ExYq0Br%2FfyPSLW4zE5fDVQ%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 515M/515M [00:24<00:00, 21.2MB/s] 


File downloaded: s2orc-part276.jsonl.gz
Uploading s2orc-part276.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part276.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_e8d09ac5-9996-449a-9928-d6dc5a3511e7.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=X4sy2F%2Bqbx3ob9l9%2FrfHRfUwQRc%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPW

Downloading: 100%|██████████| 1.07G/1.07G [00:55<00:00, 19.4MB/s] 


File downloaded: s2orc-part277.jsonl.gz
Uploading s2orc-part277.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part277.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_e8e8d76f-375f-4e4a-ad55-484b1a31bd65.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=HRfU%2BeURUXx0SKQsEEe8XezY7Jc%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 22.4MB/s] 


File downloaded: s2orc-part278.jsonl.gz
Uploading s2orc-part278.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part278.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_e9935594-ce6f-48fc-992c-7e1a283c50fc.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=qpdwnWnNPsXJWH0jrh2%2B%2Fx4pD04%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPW

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 22.2MB/s] 


File downloaded: s2orc-part279.jsonl.gz
Uploading s2orc-part279.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part279.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_e9e6d004-4da5-4466-9804-3af652ed3d12.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=sagnZw2dTPYM9OywPli6g1M8Jt0%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.4MB/s] 


File downloaded: s2orc-part280.jsonl.gz
Uploading s2orc-part280.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part280.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_eaec8bc0-b4da-44b6-aef6-72994c61c34a.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=%2BIsksI9WtIJQjwGuSYk7dhR9I8E%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.4MB/s] 


File downloaded: s2orc-part281.jsonl.gz
Uploading s2orc-part281.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part281.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_ebf905a6-5a5d-42cd-8d33-0f599ba1c3f6.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=k2m5d3FGpmx3xL8VkT1JiZUKPcM%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 22.3MB/s] 


File downloaded: s2orc-part282.jsonl.gz
Uploading s2orc-part282.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part282.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_f0e3c54c-8b04-4cf2-8493-4642833abbbf.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=stkJiUnoIhQckmIwud4PIW3gGDE%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.6MB/s] 


File downloaded: s2orc-part283.jsonl.gz
Uploading s2orc-part283.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part283.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_f1952a55-8d1e-4fb9-8a9b-8c32548af611.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=KD1cJ8nJilAW4bc%2FGFxROsxfRhs%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 444M/444M [00:20<00:00, 22.1MB/s] 


File downloaded: s2orc-part284.jsonl.gz
Uploading s2orc-part284.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part284.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_f1ada418-38b1-42b5-bbfc-20ed9d7dd5db.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=zS3mXW9XBTo5YjyIRs%2B2ARszbXk%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.6MB/s] 


File downloaded: s2orc-part285.jsonl.gz
Uploading s2orc-part285.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part285.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_f279cdee-b8e6-4069-9fb2-0ac829929de6.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=D0YkeBLtooy6xNi1zr8GzxGXyjo%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.5MB/s] 


File downloaded: s2orc-part286.jsonl.gz
Uploading s2orc-part286.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part286.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_f2927fc5-0728-4370-8ca8-5d7416776305.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=ZVQqB8yrqAxlqHLL3VfmZndlHJo%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 21.9MB/s] 


File downloaded: s2orc-part287.jsonl.gz
Uploading s2orc-part287.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part287.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_f451bc3c-0abd-4384-842d-afda78135dca.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=iO7OUfILPimiSnBP29aaDSKHc%2B0%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 22.1MB/s] 


File downloaded: s2orc-part288.jsonl.gz
Uploading s2orc-part288.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part288.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_f6589a7e-5df7-45b1-9839-aa039d0ea9a0.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=aSFiYp3OKScjvDJRabbOYfggvao%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 22.3MB/s] 


File downloaded: s2orc-part289.jsonl.gz
Uploading s2orc-part289.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part289.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_f7d8095a-8283-4680-b927-82ec04ede06b.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=9igaROvQJX%2B%2Bbqb5Fkopem%2BocH4%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLW

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.6MB/s] 


File downloaded: s2orc-part290.jsonl.gz
Uploading s2orc-part290.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part290.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_f80b3829-3e97-474c-b9c2-c429c959a9af.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=BSv9bK8noKi%2FbuTULCRJsAXG000%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 21.9MB/s] 


File downloaded: s2orc-part291.jsonl.gz
Uploading s2orc-part291.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part291.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_f98087b9-9090-45ad-a6d3-c924cab2e115.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=OVszBRzWy6IS09sYvWhYXYY6sMY%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [01:32<00:00, 11.6MB/s] 


File downloaded: s2orc-part292.jsonl.gz
Uploading s2orc-part292.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part292.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_f9c45561-6d3b-486c-b0cf-4cfafa2fc2e6.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=TbBAJ%2BSU0em9ZdlZ6OzVI8g%2FKb8%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPW

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.6MB/s] 


File downloaded: s2orc-part293.jsonl.gz
Uploading s2orc-part293.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part293.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_fa2ee3b5-2ee7-4f23-a567-ef8b3b2d07ff.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=lMYXKTIo1zDjxJx8grXqCmaZA%2FA%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:48<00:00, 22.0MB/s] 


File downloaded: s2orc-part294.jsonl.gz
Uploading s2orc-part294.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part294.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_fa3a2594-750b-4644-b414-18b676f37b7b.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=kt9qSNUnOCRKrjA%2Ff3Dvobl26io%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:49<00:00, 21.8MB/s] 


File downloaded: s2orc-part295.jsonl.gz
Uploading s2orc-part295.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part295.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_fac2f35f-12a3-400f-856b-a39135806110.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=llk2Icu8AhV7kVXplcz3Vo%2Fdeow%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.4MB/s] 


File downloaded: s2orc-part296.jsonl.gz
Uploading s2orc-part296.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part296.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_fd65996b-ac48-4b4a-9d1a-ce0760973ba8.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=e14hpYoofHleCxrcyrirLV%2B7I3U%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqX

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.4MB/s] 


File downloaded: s2orc-part297.jsonl.gz
Uploading s2orc-part297.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part297.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_ffc79af0-c1c6-46dc-b96f-4694dad3b219.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=Iu2F6CwxdiQWrDDQmSvgeZgvTLQ%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.8MB/s] 


File downloaded: s2orc-part298.jsonl.gz
Uploading s2orc-part298.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part298.jsonl.gz
Downloading file from https://ai2-s2ag.s3.amazonaws.com/staging/2025-06-10/s2orc/20250613_113338_00044_nz7vq_ffdb9fe5-1dce-420c-b323-d2fc8294c3da.gz?AWSAccessKeyId=ASIA5BJLZJPW7ETHHVSL&Signature=sv2yowq23E5FkDjoUXvVNDr94lw%3D&x-amz-security-token=IQoJb3JpZ2luX2VjEE8aCXVzLXdlc3QtMiJGMEQCIDHM6usw9S1K1eRlU%2FALwGemQM%2FptFnfx16ZCBSgfF06AiAjTCzuJ%2FmwKPV86IqACv%2BXeVUNaKDQDSKO9PckmRQbCyr%2FAwg4EAAaDDg5NjEyOTM4NzUwMSIMTj1B64mMyZF3JXbqKtwDiUNkQ2VvJ93lCCsv3EeHqUFkilhfgPMgHjiLAztoT4dxFBCw5tp5AN6Sf6CQNBgVaSNulhejqEXHvlFxMyrvCs0CgN6YRXioUiSJkC9nTIIX7MAfSL1xAHQ7%2BJI0Dh%2BOJqo7w0SD49flNTDZx11t5otPNxfh1LlgPtv2PkJ449hr8zj2al3VyYF%2BYaKUkwl3dmEO9tv4xxza%2B4tndlGPOrJKexEi73%2FMO1Djx5qoozW8SYDR7gepgjeM77yfCk%2BwcnFfCcUABXFH3IvQvU5vJ7rUQcWAJl6IshoWVh1OFPZLhxS9eofZjR4eAUDeH3IvZEGTKVjGLWPWqXLx

Downloading: 100%|██████████| 1.07G/1.07G [00:47<00:00, 22.6MB/s] 


File downloaded: s2orc-part299.jsonl.gz
Uploading s2orc-part299.jsonl.gz to S3 bucket bsc-final-sagemaker-data-bucket...
File uploaded to S3: s3://bsc-final-sagemaker-data-bucket/00_raw/s2orc/s2orc-part299.jsonl.gz
DONE
