In [40]:
# Cell dependencies: numpy plus the Colab helper used to attach Google Drive.
import numpy as np
from google.colab import drive

# Mount Google Drive so later cells can read and write files below this path.
mount_point = "/content/drive"
drive.mount(mount_point)

Drive already mounted at /content/drive; to attempt to forcibly remount, call drive.mount("/content/drive", force_remount=True).


In [41]:
!pip install rdflib




In [42]:
from urllib.parse import quote

import pandas as pd
from rdflib import Graph, Literal, Namespace, URIRef

# Build an RDF graph from the medical-code CSV and save it as a Turtle file.
#
# Every row of the CSV becomes one code node (named after its 'Code' value)
# carrying four literal properties, and every code node is linked from the
# single "hippapart2" root node through the INCLUDES predicate.

# Namespace in which all nodes and predicates of this dataset are minted.
ns = Namespace("http://example.org/hippapart2_codes#")

# Input and output locations on the mounted Google Drive.
directory_path = '/content/drive/My Drive/Hippa part2/data/'
csv_file_name = 'Data.csv'
output_file_path = directory_path + 'hippapart2.ttl'

# CSV column -> predicate used to attach that column's value to the code node.
# The predicates live in `ns` (like INCLUDES) so they are absolute IRIs; bare
# names such as URIRef("RELATED_TO") are relative IRIs whose meaning depends
# on the base IRI of whoever parses the Turtle file.
LITERAL_PREDICATES = {
    'CodeSystem': ns["CODE_IS_A_SUBTYPE_OF"],
    'CodeType': ns["REPRESENTING_A"],
    'HIPPAValueSetName': ns["RELATED_TO"],
    'Description': ns["DESCRIBES"],
}

# Read the CSV with the 'latin-1' encoding. 'Code' is forced to str so that
# numeric-looking codes are not converted to numbers by type inference.
df = pd.read_csv(directory_path + csv_file_name, encoding='latin-1', dtype={'Code': str})

# Fail early, with a clear message, if the file does not have the expected layout.
required_columns = ['Code', *LITERAL_PREDICATES]
missing_columns = [name for name in required_columns if name not in df.columns]
if missing_columns:
    raise KeyError(f"{csv_file_name} is missing required column(s): {missing_columns}")

# Create the RDF graph and the single root node for "hippapart2".
g = Graph()
hippa_part2 = ns['hippapart2']
includes = ns["INCLUDES"]

skipped_rows = 0
for record in df[required_columns].to_dict('records'):
    code = record['Code']
    # A row without a code cannot be turned into a node; skip it.
    if pd.isna(code) or not str(code).strip():
        skipped_rows += 1
        continue

    # Percent-encode the code so spaces or reserved characters cannot yield an invalid IRI.
    subject = ns[quote(str(code).strip(), safe='')]

    for column, predicate in LITERAL_PREDICATES.items():
        value = record[column]
        # Empty CSV cells arrive as NaN; leave the triple out instead of storing "nan".
        if pd.notna(value):
            g.add((subject, predicate, Literal(value)))

    # Connect each code node to the "hippapart2" root node.
    g.add((hippa_part2, includes, subject))

if skipped_rows:
    print("Skipped rows without a Code value:", skipped_rows)

# Serialize the RDF graph to Turtle format. Older rdflib releases return bytes
# here, newer ones return str; normalise to str before writing in text mode.
rdf_data = g.serialize(format='turtle')
if isinstance(rdf_data, bytes):
    rdf_data = rdf_data.decode('utf-8')

# Save the RDF data; report file-system problems without aborting the notebook.
try:
    with open(output_file_path, 'w', encoding='utf-8') as f:
        f.write(rdf_data)
    print("RDF data saved to", output_file_path)
except OSError as e:
    print("Error:", e)


RDF data saved to /content/drive/My Drive/Hippa part2/data/hippapart2.ttl
