In [1]:
# CELL 1: LIBRARIES & IMPORTS
import pandas as pd
import numpy as np
import json
import re
import os
import yaml
import glob
from pathlib import Path
from datetime import datetime
import synapseclient
from synapseclient.models import (
    Column, ColumnType, Dataset, EntityRef, File, Folder, Project, FacetType, DatasetCollection, JSONSchema, SchemaOrganization
)
import time
from pprint import pprint
from synapseclient.core.utils import make_bogus_data_file

# 1. Set up Synapse Python client
syn = synapseclient.Synapse()
syn.login()
from typing import Dict, List, Any, Set, Union
from synapseclient import Wiki
from collections import defaultdict, Counter
import warnings
warnings.filterwarnings('ignore')


Welcome, ram.ayyala!



In [5]:
# Replace your own project name here
PROJECT_ENT = Project(name="Mock ALS Project").get()
# Replace your own json schema organization name here
ORG_NAME = "ampals.schemas"
VERSION = "0.0.1"
NEW_VERSION = "0.0.2"

SCHEMA_NAME = "OmicFile"

title = "ALS Omic File Schema"
schema_body = {
  "$schema": "https://json-schema.org/draft-07/schema",
  "$id": "https://repo-prod.prod.sagebase.org/repo/v1/schema/type/registered/org.synapse.ampals-omic-file",
  "title": "OmicFile",
  "type": "object",
  "description": "File containing omic data such as sequencing, expression, or proteomics data",
  "additionalProperties": {},
  "properties": {
    "FACSPopulation": {
      "description": "FACS-sorted cell population description",
      "title": "FACS Population",
      "type": "string"
    },
    "GEOSuperSeries": {
      "description": "GEO SuperSeries identifier",
      "title": "GEO SuperSeries",
      "type": "string"
    },
    "alternateName": {
      "description": "An alternate name that can be used for search and discovery improvement.",
      "title": "Alternate Name",
      "type": "string"
    },
    "analysisTypes": {
      "description": "Computational and statistical analysis methods applied to the data",
      "items": {
        "description": "Computational and statistical analysis methods applied to the data",
        "enum": [
          "Normalized Protein Expression (NPX)",
          "GeneSetEnrichmentAnalysis",
          "differential_expression",
          "pathway_enrichment",
          "network_analysis",
          "proteomics_analysis",
          "metabolomics_analysis",
          "longitudinal_analysis",
          "survival_analysis",
          "meta_analysis",
          "correlation_analysis",
          "multivariate_analysis",
          "machine_learning"
        ],
        "title": "AnalysisMethodEnum",
        "type": "string"
      },
      "title": "Analysis Types",
      "type": "array"
    },
    "annotations": {
      "description": "Types of biological databases and annotations referenced in this file",
      "items": {
        "description": "Types of biological databases and annotation references",
        "enum": [
          "KEGG",
          "GO",
          "UniProt",
          "Ensembl",
          "HGNC",
          "RefSeq",
          "MONDO",
          "HPO",
          "SNOMED",
          "ICD",
          "pathway_enrichment",
          "protein_pathway",
          "metabolic_pathway",
          "signaling_pathway"
        ],
        "title": "AnnotationTypeEnum",
        "type": "string"
      },
      "title": "Biological Annotations",
      "type": "array"
    },
    "assay": {
      "description": "What's used to generate data in file, typically referring to the assay. Omit if not applicable.",
      "items": {
        "description": "",
        "enum": [
          "2D AlamarBlue absorbance",
          "2D AlamarBlue fluorescence",
          "3D confocal imaging",
          "3D electron microscopy",
          "3D imaging",
          "3D microtissue viability",
          "actigraphy",
          "AlgometRx Nociometer",
          "auditory brainstem response",
          "ATAC-seq",
          "ATPase activity assay",
          "BrdU proliferation assay",
          "Bru-seq",
          "BruChase-seq",
          "CAPP-seq",
          "CUT&RUN",
          "ChIP-seq",
          "Child Behavior Checklist for Ages 1.5-5",
          "Child Behavior Checklist for Ages 6-18",
          "CODEX",
          "CROP-seq",
          "confocal microscopy",
          "Corsi blocks",
          "current clamp assay",
          "DART-seq",
          "diffusion MRI",
          "distortion product otoacoustic emissions",
          "DNA optical mapping",
          "ELISA",
          "ERR bisulfite sequencing",
          "EdU proliferation assay",
          "FIA-MSMS",
          "FLIPR high-throughput cellular screening",
          "Fluorescence In Situ Hybridization",
          "Focus group",
          "FTIR spectroscopy",
          "HI-C",
          "HPLC",
          "Interview",
          "ISO-seq",
          "MIB/MS",
          "MeRIP-seq",
          "Matrigel-based tumorigenesis assay",
          "MudPIT",
          "NIH Toolbox",
          "NOMe-seq",
          "RNA array",
          "RNA-seq",
          "RPPA",
          "Riccardi and Ablon scales",
          "SNP array",
          "SUSHI",
          "Sanger sequencing",
          "Social Responsiveness Scale",
          "Social Responsiveness Scale, Second Edition",
          "SomaScan",
          "T cell receptor repertoire sequencing",
          "TIDE",
          "TMT quantitation",
          "TriKinetics activity monitoring",
          "Von Frey test",
          "active avoidance learning behavior assay",
          "array",
          "atomic force microscopy",
          "autoradiography",
          "bisulfite sequencing",
          "blood chemistry measurement",
          "blue native PAGE",
          "body size trait measurement",
          "bone histomorphometry",
          "brightfield microscopy",
          "cAMP-Glo Max Assay",
          "CAGE-seq",
          "calcium retention capacity assay",
          "cell competition",
          "cell count",
          "cell painting",
          "cell proliferation",
          "cell viability assay",
          "clinical data",
          "CLIP-seq",
          "cNF-Skindex",
          "cognitive assessment",
          "combination library screen",
          "combination screen",
          "complex II enzyme activity assay",
          "compound screen",
          "contextual conditioning behavior assay",
          "conventional MRI",
          "Children's Dermatology Life Quality Index Questionnaire",
          "differential scanning calorimetry",
          "dynamic light scattering",
          "electrochemiluminescence",
          "electrophoretic light scattering",
          "elevated plus maze test",
          "FACE-Q Appearance-related Distress",
          "FACS",
          "flow cytometry",
          "focus forming assay",
          "functional MRI",
          "gait measurement",
          "gel filtration chromatography",
          "gel permeation chromatography",
          "genotyping",
          "high content screen",
          "high frequency ultrasound",
          "high-performance liquid chromatography/tandem mass spectrometry",
          "immunoassay",
          "immunocytochemistry",
          "immunofluorescence",
          "immunohistochemistry",
          "in silico synthesis",
          "in vitro tumorigenesis",
          "in vivo PDX viability",
          "in vivo bioluminescence",
          "in vivo tumor growth",
          "jumping library",
          "LCM",
          "label free mass spectrometry",
          "laser speckle imaging",
          "light scattering assay",
          "liquid chromatography-electrochemical detection",
          "liquid chromatography/mass spectrometry",
          "liquid chromatography/tandem mass spectrometry",
          "lncRNA-seq",
          "local field potential recording",
          "long term potentiation assay",
          "mRNA counts",
          "m6A array",
          "magnetic resonance angiography",
          "magnetic resonance spectroscopy",
          "Magnetization-Prepared Rapid Gradient Echo MRI",
          "mass spectrometry",
          "massively parallel reporter assay",
          "metabolic screening",
          "methylation array",
          "miRNA array",
          "miRNA-seq",
          "microrheology",
          "Skindex-16",
          "multi-electrode array",
          "nanoparticle tracking analysis",
          "NanoString nCounter Analysis System",
          "n-back task",
          "neuropsychological assessment",
          "next generation targeted sequencing",
          "novelty response behavior assay",
          "open field test",
          "optical tomography",
          "optical coherence tomography",
          "optokinetic reflex assay",
          "oscillatory rheology",
          "oxBS-seq",
          "oxygen consumption assay",
          "pattern electroretinogram",
          "perineurial cell thickness",
          "pharmocokinetic ADME assay",
          "phase-contrast microscopy",
          "photograph",
          "polymerase chain reaction",
          "polysomnography",
          "positron emission tomography",
          "PROMIS Cognitive Function",
          "Olink Proximity Extension Assay",
          "pure tone average",
          "quantitative PCR",
          "Quant-seq",
          "questionnaire",
          "reactive oxygen species assay",
          "reporter gene assay",
          "rheometry",
          "RIP-seq",
          "ribo-seq",
          "rotarod performance test",
          "sandwich ELISA",
          "scCGI-seq",
          "scale",
          "SaferSeqS",
          "single molecule drug screen assay",
          "single-cell RNA-seq",
          "single cell ATAC-seq",
          "snATAC-seq",
          "snRNA-seq",
          "single-nucleus RNA-seq",
          "small molecule library screen",
          "sorbitol dehydrogenase activity level assay",
          "spatial frequency domain imaging",
          "spatial transcriptomics",
          "static histomorphometry",
          "static light scattering",
          "survival",
          "targeted exome sequencing",
          "traction force microscopy",
          "transcranial doppler ultrasonography",
          "twin spot assay",
          "ultra high-performance liquid chromatography/tandem mass spectrometry",
          "western blot",
          "whole exome sequencing",
          "whole genome sequencing",
          "whole-cell patch clamp",
          "word recognition score",
          "STR profile",
          "Extension control 1",
          "Incubation control 1",
          "Amplification control 1",
          "Protein target assay"
        ],
        "title": "Assay",
        "type": "string"
      },
      "title": "Measurement Technique",
      "type": "array"
    },
    "biospecimenType": {
      "description": "Type of biological specimen(s) in the file.",
      "items": {
        "description": "",
        "enum": [
          "blood",
          "plasma",
          "serum",
          "csf",
          "brain_tissue",
          "spinal_cord",
          "muscle",
          "fibroblast",
          "ipsc",
          "motor_neuron",
          "unknown"
        ],
        "title": "BiospecimenTypeEnum",
        "type": "string"
      },
      "title": "Biospecimen Type",
      "type": "array"
    },
    "cellType": {
      "description": "Type of cell or cell line used in the file.",
      "items": {
        "description": "",
        "enum": [
          "motor_neuron",
          "astrocyte",
          "microglia",
          "oligodendrocyte",
          "fibroblast",
          "pbmc",
          "whole_blood",
          "unknown"
        ],
        "title": "CellTypeEnum",
        "type": "string"
      },
      "title": "Cell Type",
      "type": "array"
    },
    "citation": {
      "description": "identifies academic articles that are recommended by the data provider be cited in addition to the file itself.",
      "items": {
        "type": "string"
      },
      "title": "Citation",
      "type": "array"
    },
    "collection": {
      "description": "Associated collection(s)",
      "items": {
        "description": "Original collection, e.g. the consortium that the dataset comes from.",
        "enum": [
          "ALS Knowledge Portal",
          "Answer ALS",
          "CReATe Consortium",
          "Genomic Translation for ALS Care (GTAC)",
          "New York Genome Center ALS Consortium",
          "National Institutes of Health",
          "Project MinE",
          "ALS Compute",
          "amp_als",
          "target_als",
          "all_als",
          "c_path",
          "alsdb",
          "geo",
          "sra",
          "als_compute"
        ],
        "title": "CollectionEnum",
        "type": "string"
      },
      "title": "Collection",
      "type": "array"
    },
    "contributor": {
      "description": "Institution or person responsible for collecting and managing the files and records in the file.",
      "items": {
        "type": "string"
      },
      "title": "Contributor(s)",
      "type": "array"
    },
    "creator": {
      "description": "Properly formatted name of the organization or person that is creator of the file (e.g. \"Sage Bionetworks\" or \"John Doe\"), not an id. Most preferred is the project PI or data lead who's responsible for its conception and initial content creation.",
      "items": {
        "type": "string"
      },
      "title": "Creator",
      "type": "array"
    },
    "dataType": {
      "description": "Omic data types (genomics, transcriptomics, proteomics, etc.)",
      "items": {
        "description": "Types of omic data contained in files",
        "enum": [
          "raw_sequencing",
          "aligned_reads",
          "variant_calls",
          "genome_annotation",
          "gene_expression",
          "transcript_counts",
          "differential_expression",
          "splice_variants",
          "methylation",
          "chromatin_accessibility",
          "histone_modification",
          "protein_abundance",
          "peptide_identification",
          "protein_modification",
          "metabolite_abundance",
          "metabolic_pathways",
          "integrated_omics",
          "network_analysis",
          "raw_data",
          "processed_data",
          "analyzed_results",
          "proteomics",
          "geneExpression",
          "transcriptomics",
          "transcriptomics_nascent",
          "epigenomics",
          "metabolomics",
          "kinomics",
          "isoformExpression",
          "chromatinActivity",
          "AlignedReads",
          "genomicVariants",
          "genomicFeatures",
          "SomaticVariants",
          "GermlineVariants",
          "CopyNumberVariants",
          "StructuralVariants",
          "AnnotatedSomaticVariants",
          "AnnotatedGermlineVariants",
          "raw_counts",
          "RawIntensities",
          "NormalizedIntensities"
        ],
        "title": "OmicDataTypeEnum",
        "type": "string"
      },
      "title": "Data Type",
      "type": "array"
    },
    "description": {
      "description": "Blurb for the file; should be no more than 500 characters.",
      "title": "Description",
      "type": "string"
    },
    "disease": {
      "description": "Disease(s) or condition(s) studied in the file.",
      "items": {
        "description": "",
        "enum": [
          "ALS",
          "FTD",
          "Control",
          "Unknown"
        ],
        "title": "DiseaseEnum",
        "type": "string"
      },
      "title": "Disease",
      "type": "array"
    },
    "fileFormat": {
      "description": "Format of the omic data file (FASTQ, BAM, VCF, etc.)",
      "title": "File Format",
      "type": "string"
    },
    "includedInDataCatalog": {
      "description": "Link(s) to known data catalog(s) the file is included in.",
      "title": "Included In Data Catalog",
      "type": "string"
    },
    "individualCount": {
      "description": "Number of unique individuals included in the file (whether as individual-level or as aggregate data). Omit if not applicable/unknown.",
      "title": "Individual Count",
      "type": "integer"
    },
    "keywords": {
      "items": {
        "type": "string"
      },
      "title": "Keywords",
      "type": "array"
    },
    "libraryLayout": {
      "description": "Single-end or paired-end sequencing layout for files containing sequencing data.",
      "items": {
        "description": "",
        "enum": [
          "single",
          "paired"
        ],
        "title": "LibraryLayoutEnum",
        "type": "string"
      },
      "title": "Library Layout",
      "type": "array"
    },
    "libraryStrategy": {
      "description": "Sequencing library strategy (RNA-seq, WGS, ChIP-seq, etc.)",
      "title": "Library Strategy"
    },
    "license": {
      "description": "Unless information for license is clear, this should default to UNKNOWN.",
      "title": "License"
    },
    "originalSampleName": {
      "description": "Original sample name from data source",
      "title": "Original Sample Name",
      "type": "string"
    },
    "platform": {
      "description": "Sequencing or analysis platform used",
      "title": "Platform",
      "enum": [
        "7T Bruker Biospec",
        "10x Visium Spatial Gene Expression",
        "2D CellTiter-Glo",
        "2D Incucyte",
        "Affymetrix Genome-Wide Human SNP 5.0 Array",
        "Affymetrix Genome-Wide Human SNP 6.0 Array",
        "Affymetrix Human Gene 1.0 ST Array",
        "Affymetrix Human Genome U133 Plus 2.0 Array",
        "Affymetrix U133AB",
        "Agilent 44Karray",
        "BD FACS Calibur",
        "BD FACSymphony",
        "BGISEQ-500",
        "Bionano Irys",
        "Caliper",
        "Cherry Imaging FACE Platform",
        "Cherry Imaging TRACE Platform",
        "Chromium X",
        "EnVision 2103 Multiplate Reader",
        "GE Discovery MR750 3T",
        "GE Optima MR450W 1.5T",
        "GE Signa HDxt 1.5T",
        "GE Signa Genesis 1.5T",
        "GE Signa HDxt 3T",
        "GE Signa Premier 3T",
        "GE Signa Excite 1.5T",
        "Hitachi Echelon 1.5T",
        "Hitachi Oasis 1.2T",
        "IVIS Spectrum In Vivo Imaging System",
        "Illumina 1M",
        "Illumina Genome Analyzer IIx",
        "Illumina HiSeq 2000",
        "Illumina HiSeq 2500",
        "Illumina HiSeq 3000",
        "Illumina HiSeq 4000",
        "Illumina HiSeq X",
        "Illumina Human660W-Quad v1.0 BeadChip",
        "Illumina HumanHap300",
        "Illumina HumanMethylation450",
        "Illumina HumanOmni1-Quadv1.0",
        "Illumina HumanOmniExpress-24 v1.0 BeadChip",
        "Illumina HumanOmniExpress-24 v1.2 BeadChip",
        "Illumina Infinium MethylationEPIC BeadChip v1.0 (850k)",
        "Illumina Infinium MethylationEPIC BeadChip v2.0 (935k)",
        "Illumina MiSeq",
        "Illumina MouseWG-6 v2.0 expression beadchip",
        "Illumina NextSeq 1000",
        "Illumina NextSeq 2000",
        "Illumina NextSeq 500",
        "Illumina NextSeq 550",
        "Illumina NovaSeq 6000",
        "Illumina NovaSeq X",
        "Illumina NovaSeq X Plus",
        "Illumina Omni2pt5M",
        "Illumina Omni5M",
        "Illumina WholeGenome DASL",
        "Illumina h650",
        "Infinium HumanOmniExpressExome",
        "LI-COR Odyssey CLx",
        "LTQ Orbitrap XL",
        "Leica Aperio AT2",
        "Leica MZ16",
        "Leica S9 Stereomicroscope",
        "LifeViz Infinity System",
        "LifeViz Micro System",
        "MGI T-series",
        "Malvern Zetasizer",
        "NanoFCM",
        "NanoString Human nCounter PanCancer IO360 Panel",
        "Nanostring Counter",
        "Nanostring GeoMx",
        "Not Applicable",
        "Olympus DP80",
        "Olympus IX73",
        "Orbitrap Fusion Lumos Tribrid",
        "Other Platform",
        "Oxford Nanopore",
        "PacBio RS II",
        "PacBio Sequel II System",
        "PacBio Sequel IIe System",
        "Pannoramic 250 Flash",
        "Perlegen 300Karray",
        "Philips Achieva 1.5T",
        "Philips Achieva 3T",
        "Philips FEI Tecnai 12",
        "Philips Intera Achieva 3T",
        "Philips Ingenia 1.5T",
        "Philips Ingenia 3T",
        "Philips Panorama 1.0T",
        "Promega GloMax Discover",
        "Q Exative HF",
        "Scale",
        "Siemens Avanto 1.5T",
        "Siemens Avanto Fit 1.5T",
        "Siemens Magnetom Aera 1.5T",
        "Siemens Magnetom Espree 1.5T",
        "Siemens Magnetom Prisma 3T",
        "Siemens Magnetom Skyra 3T",
        "Siemens Magnetom Trio 3T",
        "Siemens Magnetom Verio 3T",
        "Siemens Magnetom Prisma Fit 3T",
        "Spectramax M Series",
        "TOOsonix System ONE-M",
        "Toshiba Vantage Titan 1.5T",
        "Varioskan LUX",
        "Vectra H1 3D Imaging System",
        "Ventana Benchmark XT",
        "Vevo 3100 Imaging System",
        "XF24 Extracellular Flux Analyzer",
        "Zeiss LSM",
        "Zeiss LSM 700",
        "Zeiss LSM 980",
        "Zeno Electronic Walkway",
        "ZetaView"
      ],
      "type": "string"
    },
    "processingLevel": {
      "description": "Level of data processing (raw, processed, analyzed)",
      "title": "Processing Level"
    },
    "publisher": {
      "description": "Name of the organization or person responsible for making the file available.",
      "title": "Publisher",
      "type": "string"
    },
    "sameAs": {
      "description": "Another platform's URI or compact URI for this same resource. See https://www.w3.org/TR/owl-ref/#sameAs-def.",
      "title": "Same As",
      "type": "string"
    },
    "sampleIdColumn": {
      "description": "Name of the column containing sample identifiers",
      "title": "Sample ID Column",
      "type": "string"
    },
    "source": {
      "description": "Host platform from which the file was sourced.",
      "title": "Source",
      "type": "string"
    },
    "species": {
      "description": "Species of the organism(s) from which the data were generated. Omit property if not applicable, such as for data like compounds or other non-biological data.",
      "items": {
        "description": "",
        "enum": [
          "Rattus norvegicus",
          "Gallus gallus",
          "Pan troglodytes",
          "Mus musculus (humanized)",
          "Homo sapiens",
          "Danio rerio",
          "Drosophila melanogaster",
          "Rhesus macaque",
          "Sus scrofa",
          "Oryctolagus cuniculus",
          "Mus musculus"
        ],
        "title": "SpeciesEnum",
        "type": "string"
      },
      "title": "Species",
      "type": "array"
    },
    "subject": {
      "description": "Applicable subject term(s) for file cataloging; use the Library of Congress Subject Headings (LCSH) scheme.",
      "items": {
        "type": "string"
      },
      "title": "Subject",
      "type": "array"
    },
    "title": {
      "title": "Title",
      "type": "string"
    },
    "url": {
      "description": "URL for the original file location at source.",
      "title": "URL",
      "type": "string"
    }
  },
  "required": [
    "title",
    "creator",
    "keywords",
    "source",
    "url"
  ]
}


In [6]:
organization = SchemaOrganization(name=ORG_NAME)
try:
    organization.store()
except Exception as e:
    organization.get()

schemas = list(organization.get_json_schemas())
for schema in schemas:
    print(schema)

schema = JSONSchema(name=SCHEMA_NAME, organization_name=ORG_NAME)
try:
    schema.get()
except Exception as e:
    schema.store(schema_body=schema_body, version=VERSION)

schema.get_body()

JSONSchema(name='OmicDataset', organization_name='ampals.schemas', organization_id='1415', id='9261', created_on='2026-02-10T05:25:09.007Z', created_by='3436666', uri='ampals.schemas-OmicDataset')


/schema/type/create/async: 100%|██████████| 100/100 [00:01<00:00, 89.1it/s]


{'$schema': 'https://json-schema.org/draft-07/schema',
 '$id': 'https://repo-prod.prod.sagebase.org/repo/v1/schema/type/registered/ampals.schemas-OmicFile',
 'type': 'object',
 'properties': {'url': {'type': 'string',
   'title': 'URL',
   'description': 'URL for the original file location at source.'},
  'assay': {'type': 'array',
   'items': {'type': 'string',
    'title': 'Assay',
    'description': '',
    'enum': ['2D AlamarBlue absorbance',
     '2D AlamarBlue fluorescence',
     '3D confocal imaging',
     '3D electron microscopy',
     '3D imaging',
     '3D microtissue viability',
     'actigraphy',
     'AlgometRx Nociometer',
     'auditory brainstem response',
     'ATAC-seq',
     'ATPase activity assay',
     'BrdU proliferation assay',
     'Bru-seq',
     'BruChase-seq',
     'CAPP-seq',
     'CUT&RUN',
     'ChIP-seq',
     'Child Behavior Checklist for Ages 1.5-5',
     'Child Behavior Checklist for Ages 6-18',
     'CODEX',
     'CROP-seq',
     'confocal microscopy'

In [7]:
# Create a test folder for JSON schema experiments
test_folder = Folder(name="test_folder", parent_id=PROJECT_ENT.id).store()

bound_schema = test_folder.bind_schema(
    json_schema_uri=schema.uri, enable_derived_annotations=True
)
json_schema_version_info = bound_schema.json_schema_version_info
syn.logger.info("JSON schema was bound successfully. Please see details below:")
pprint(vars(json_schema_version_info))

JSON schema was bound successfully. Please see details below:
{'created_by': '3436666',
 'created_on': '2026-02-10T05:32:11.885Z',
 'id': 'ampals.schemas-OmicFile-0.0.1',
 'json_sha256_hex': 'e2eda85d5bac2faab6ed71c002727307367719300e8c0731fc9784ccc9fe0a0e',
 'organization_id': '1415',
 'organization_name': 'ampals.schemas',
 'schema_id': '9262',
 'schema_name': 'OmicFile',
 'semantic_version': '0.0.1',
 'version_id': '52794'}


In [8]:
# 5. Retrieve the Bound Schema
schema = test_folder.get_schema()
syn.logger.info("JSON Schema was retrieved successfully. Please see details below:")
pprint(vars(schema))

JSON Schema was retrieved successfully. Please see details below:
{'created_by': '3436666',
 'created_on': '2026-02-10T05:32:56.004Z',
 'enable_derived_annotations': True,
 'json_schema_version_info': JSONSchemaVersionInfo(organization_id='1415',
                                                   organization_name='ampals.schemas',
                                                   schema_id='9262',
                                                   id='ampals.schemas-OmicFile-0.0.1',
                                                   schema_name='OmicFile',
                                                   version_id='52794',
                                                   semantic_version='0.0.1',
                                                   json_sha256_hex='e2eda85d5bac2faab6ed71c002727307367719300e8c0731fc9784ccc9fe0a0e',
                                                   created_on='2026-02-10T05:32:11.885Z',
                                                   created_by=

In [9]:
validation_statistics = test_folder.get_schema_validation_statistics()
syn.logger.info(
    "Validation statistics were retrieved successfully. Please see details below:"
)

Validation statistics were retrieved successfully. Please see details below:


In [10]:
invalid_validation = invalid_results = test_folder.get_invalid_validation()
for child in invalid_validation:
    syn.logger.info("See details of validation results: ")

See details of validation results: 
