### Working With JSON In Python

#### Differences Between Python dict And JSON

JSON vs python dict/list in brief:

| Feature         | JSON                                    | Python dict                                |
|-----------------|-----------------------------------------|--------------------------------------------|
| Purpose         | Data exchange                           | In-memory data structure                   |
| Data types      | Limited set of data types               | Wide range of Python data types            |
| Keys            | Strings only                            | Any immutable, hashable type               |
| Ordering        | Order of keys in objects not guaranteed | Order of keys is guaranteed in 3.7+        |
| Absence of value| null                                    | None                                       |
| Booleans        | true, false                             | True, False                                |
| Comments        | not supported                           | supported                                  |
| Trailing commas | not supported                           | supported                                  |

#### The json Module And Serialization

> * serialization: python object -> JSON
> * deserialization: JSON -> python object

In [1]:
person_data = {
    "name": "John Doe",
    "age": 30,
    "city": "New York"
}

In [2]:
type(person_data)

dict

In [3]:
import json

In [6]:
test = json.dumps(person_data)
test

'{"name": "John Doe", "age": 30, "city": "New York"}'

In [7]:
type(test)

str

In [8]:
print(json.dumps(person_data, indent=4))

{
    "name": "John Doe",
    "age": 30,
    "city": "New York"
}


In [9]:
with open("person.json", "w") as file:
    # json.dump(person_data, file, indent=4)
    json.dump(person_data, file)

#### Deserialization

> * deserialization: JSON -> python object

In [10]:
json_data = '{"name": "John Doe", "age": 30, "city": "New York"}'

In [11]:
import json

In [12]:
person = json.loads(json_data)

In [13]:
type(person)

dict

In [14]:
print(person)

{'name': 'John Doe', 'age': 30, 'city': 'New York'}


In [16]:
person["age"]

30

In [None]:
with open("person.json", "r") as file:
    person_from_disk = json.load(file)

In [None]:
type(person_from_disk)

dict

In [None]:
person_from_disk

{'name': 'John Doe', 'age': 34, 'city': 'New York'}

#### Web Requests And APIs

> * HTTP is Hypertext Transfer Protocol; used for transmitting hypertext requests and information between servers and browsers
> * client makes request; server responds with some data

In [None]:
# requests (next)
# httpx

In [None]:
import urllib.request

In [None]:
url = "https://www.andybek.com/api/data/persons"

In [None]:
with urllib.request.urlopen(url) as response:
    response_data = response.read().decode("utf-8")

In [None]:
response_data

'[{"id":1,"name":"Emily Johnson","age":32},{"id":2,"name":"David Smith","age":25},{"id":3,"name":"Olivia Williams","age":41},{"id":4,"name":"Noah Brown","age":38},{"id":5,"name":"Emma Jones","age":29},{"id":6,"name":"William Miller","age":52},{"id":7,"name":"Ava Garcia","age":35},{"id":8,"name":"James Rodriguez","age":46},{"id":9,"name":"Isabella Wilson","age":22},{"id":10,"name":"Liam Anderson","age":30},{"id":11,"name":"Sophia Taylor","age":44},{"id":12,"name":"Mason Jackson","age":27},{"id":13,"name":"Amelia Thomas","age":39},{"id":14,"name":"Ethan White","age":55},{"id":15,"name":"Harper Moore","age":24},{"id":16,"name":"Elijah Martin","age":36},{"id":17,"name":"Ava Thompson","age":49},{"id":18,"name":"Lucas Garcia","age":21},{"id":19,"name":"Mia Martinez","age":33},{"id":20,"name":"Noah Robinson","age":47}]'

In [None]:
type(response_data)

str

In [None]:
import json

json_data = json.loads(response_data)

In [None]:
type(json_data), type(json_data[3])

(list, dict)

#### A Better Alternative: The requests Library

In [None]:
url = "https://www.andybek.com/api/data/persons"

In [None]:
import requests

In [None]:
response = requests.get(url)

In [None]:
data = response.json()

type(data), type(data[2])

(list, dict)

In [None]:
# quick demo - won't work!

In [None]:
data = {
    "name": "Alice"
}

In [None]:
# send to server as JSON

In [None]:
requests.post(false_post_url, json=data)

#### Edge Cases In Serialization

In [None]:
from datetime import datetime, date

In [None]:
now = datetime.now()

In [None]:
import json

In [None]:
json.dumps(now)

TypeError: Object of type datetime is not JSON serializable

In [None]:
dog_data = {
    "name": "Spot",
    "breed": "Dalmatian",
    "birthday": date(2019, 5, 12)
}

In [None]:
dog_data

{'name': 'Spot', 'breed': 'Dalmatian', 'birthday': datetime.date(2019, 5, 12)}

In [None]:
json.dumps(dog_data)

TypeError: Object of type date is not JSON serializable

In [None]:
from json import JSONEncoder

In [None]:
class CustomEncoder(JSONEncoder):
    """JSON encoder that writes ``date`` and ``datetime`` values as ISO 8601 strings."""

    def default(self, obj):
        """Return a JSON-serializable stand-in for *obj*.

        The encoder calls this hook only for objects it cannot serialize
        on its own. Dates and datetimes become their ``isoformat()`` string;
        everything else is handed to the base implementation.
        """
        if not isinstance(obj, (date, datetime)):
            # Not a type handled here: let the base class deal with it.
            return super().default(obj)

        return obj.isoformat()

In [None]:
json.dumps(dog_data, cls=CustomEncoder)

'{"name": "Spot", "breed": "Dalmatian", "birthday": "2019-05-12"}'

#### Serializing User-Defined Classes

In [None]:
class Person:
    """A person identified by a name and a birth year."""

    def __init__(self, name, born):
        # Assigned left to right, so ``name`` is stored before ``born``.
        self.name, self.born = name, born

In [None]:
john = Person("John Doe", 1990)

In [None]:
import json

In [None]:
json.dumps(john)

TypeError: Object of type Person is not JSON serializable

In [None]:
john.__dict__

{'name': 'John Doe', 'born': 1990}

In [None]:
json.dumps(john.__dict__)

'{"name": "John Doe", "born": 1990}'

In [None]:
from datetime import datetime

class Person:
    """A person identified by a name and a birth year, with a derived age."""

    def __init__(self, name, born):
        # Assigned left to right, so ``name`` is stored before ``born``.
        self.name, self.born = name, born

    @property
    def age(self):
        """Current calendar year minus the birth year.

        Computed on every access, so it is not stored in ``__dict__``.
        """
        current_year = datetime.now().year
        return current_year - self.born

In [None]:
john = Person("John Doe", 1990)

In [None]:
john.name

'John Doe'

In [None]:
john.age

34

In [None]:
json.dumps(john.__dict__)

'{"name": "John Doe", "born": 1990}'

In [None]:
def seriealize_person(obj):
    """Convert a ``Person`` into a JSON-serializable dict.

    Intended to be passed as the ``default=`` argument of ``json.dumps``.
    The result holds the person's ``name`` and computed ``age``.

    Raises:
        TypeError: if *obj* is not a ``Person``.
    """
    if not isinstance(obj, Person):
        raise TypeError("Object not serializable")

    return {"name": obj.name, "age": obj.age}

In [None]:
json.dumps(john, default=seriealize_person)

'{"name": "John Doe", "age": 34}'

In [None]:
john.__dict__, john.age

({'name': 'John Doe', 'born': 1990}, 34)

#### Skill Challenge: JSON Data Transformation Challenge

> #### JSON Data Transformation Challenge

Your task is to retrieve and process JSON data from a given URL containing information about books. Follow the steps below to complete the challenge:

* Use the provided URL: https://www.andybek.com/api/data/books to fetch all the books.

* Save the raw JSON data to a file named "books-original.json".

* Deserialize the JSON data and remove the "ranks" and "release dates" from each book entry.

* Save the modified books data to a new file named "books-cleaned.json".

#### Solution

In [None]:
import requests
import json

In [None]:
API_URL = "https://www.andybek.com/api/data/books"
ORIGINAL_FILE = "books-original.json"
CLEANED_FILE = "books-cleaned.json"

In [None]:
def fetch_and_clean_books():
    """Download the books list, save it, then save a cleaned copy.

    Steps:
      1. GET ``API_URL`` and parse the response body as JSON.
      2. Write the parsed data to ``ORIGINAL_FILE``.
      3. Drop the "rank" and "release_date" fields from every book.
      4. Write the trimmed data to ``CLEANED_FILE``.

    Errors are reported with ``print`` rather than raised; the function
    always returns ``None``.
    """
    try:
        # Without a timeout, requests can wait on a stalled server forever.
        response = requests.get(API_URL, timeout=10)
        response.raise_for_status()

        books_data = response.json()

        with open(ORIGINAL_FILE, "w", encoding="utf-8") as f:
            json.dump(books_data, f, indent=2)

        for book in books_data:
            # pop() with a default tolerates entries that lack a field, so one
            # incomplete record does not abort the run before the cleaned
            # file is written.
            book.pop("rank", None)
            book.pop("release_date", None)

        with open(CLEANED_FILE, "w", encoding="utf-8") as f:
            json.dump(books_data, f, indent=2)
    except json.JSONDecodeError as e:
        # Must precede the RequestException handler: in recent versions of
        # requests the error raised by response.json() is also a
        # RequestException, which would otherwise report it as a fetch error.
        print(f"Error decoding JSON data: {e}")
    except requests.exceptions.RequestException as e:
        print(f"Error fetching data: {e}")
    except Exception as e:
        # Last-resort boundary for this script-style entry point
        # (e.g. file-system errors while writing the output files).
        print(f"An unexpected error occurred: {e}")

In [None]:
# if __name__ == "__main__":
#     fetch_and_clean_books()

fetch_and_clean_books()