# MongoDB Data Verification – Converted OpenFDA Database
This notebook verifies the field conversions and data integrity in the MongoDB collection `full_reports`.

In [None]:
import pymongo
from bson import json_util
from pprint import pprint

# Open a client against the local MongoDB server, then resolve the database
# and the collection that the rest of the notebook inspects.
client = pymongo.MongoClient("mongodb://localhost:27017")
db = client.get_database("openfda_converted")
collection = db.get_collection("full_reports")

## 1. Check total number of inserted reports

In [None]:
# An empty filter matches every document, so this is the exact collection size.
total_reports = collection.count_documents(filter={})
print(f"Total inserted reports: {total_reports}")

## 2. Verify integer fields

In [None]:
# Select reports whose `safetyreportversion` is stored with BSON type "int"
# and show at most five of them in full for a visual spot check.
query = {"safetyreportversion": {"$type": "int"}}
docs = list(collection.find(query, limit=5))
for doc in docs:
    pprint(doc)

## 3. Verify date normalization

In [None]:
# Select reports whose first `drug` entry has a `drugstartdate` stored with
# BSON type "date", then print that value for at most five of them.
query = {"drug.0.drugstartdate": {"$type": "date"}}
docs = list(collection.find(query, limit=5))
for doc in docs:
    # The filter guarantees the first drug entry carries the field.
    first_drug = doc["drug"][0]
    pprint(first_drug["drugstartdate"])

## 4. Check that oversized reports were skipped (logged to file)

In [None]:
# Summarise the log of oversized reports that were skipped.
# NOTE(review): the count assumes one log line per skipped report — confirm
# against the code that writes skipped_reports.log.
try:
    # Explicit encoding keeps the read independent of the platform default;
    # undecodable bytes are replaced rather than aborting the verification.
    with open("skipped_reports.log", "r", encoding="utf-8", errors="replace") as f:
        skipped = f.readlines()
except FileNotFoundError:
    # A missing log is reported explicitly instead of crashing the cell, so
    # the summary below still runs (with zero entries).
    skipped = []
    print("skipped_reports.log not found; no skipped reports to list.")
print(f"Total oversized reports skipped: {len(skipped)}")
print("First few entries:")
print("".join(skipped[:3]))