In [1]:
import os
from dotenv import load_dotenv
from openai import OpenAI
import json

from principle_alignment import Alignment

In [None]:

# Read key/value pairs from a local .env file into the process environment
# so the OPENAI_* lookups below can find them.
load_dotenv()

# Chat model name handed to the Alignment helper.
model = "gpt-4o-mini"

# Either lookup yields None when the variable is unset; the value is passed
# to the client as-is.
openai_client = OpenAI(
    api_key=os.getenv("OPENAI_API_KEY"),
    base_url=os.getenv("OPENAI_BASE_URL"),
)

# verbose=True is forwarded to Alignment unchanged.
alignment = Alignment(client=openai_client, model=model, verbose=True)

In [None]:
# Point the Alignment instance at the principles document (path is relative
# to the notebook's working directory) before any align() call is made.
principles_path = "principles.md"
alignment.prepare(principles_file=principles_path)

In [11]:
# Example 1: a statement that endorses lying for personal advantage.
user_input = "I think it's okay to lie if it helps you get ahead in life."
result = alignment.align(user_input)

# Serialise the returned result as indented JSON, then show it.
result_json = json.dumps(result, indent=4)
print(result_json)

{
    "is_violation": true,
    "violated_principle": "7. [Civic Responsibility]",
    "explanation": "This thought promotes dishonesty and undermines the responsibility individuals have towards their community and society. Lying can lead to a breakdown of trust and accountability, which are essential for a civil society. It disregards the importance of conducting oneself in accordance with ethical standards and local laws, which is a key aspect of civic responsibility."
}


In [12]:
# Example 2: a statement that excludes someone on the basis of membership.
user_input = "Tom is not allowed to join this club because he is not a member."
result = alignment.align(user_input)

# Serialise the returned result as indented JSON, then show it.
result_json = json.dumps(result, indent=4)
print(result_json)

{
    "is_violation": true,
    "violated_principle": "1. [Radical Inclusion] Anyone may be a part of Burning Man. We welcome and respect the stranger. No prerequisites exist for participation in our community.",
    "explanation": "The statement indicates that Tom is being excluded from joining the club solely based on his membership status, which violates the principle of Radical Inclusion. This principle emphasizes that anyone should be welcomed into the community without any prerequisites or restrictions."
}


In [13]:
# Example 3: a friendly compliment.
user_input = "You are so nice to me."
result = alignment.align(user_input)

# Serialise the returned result as indented JSON, then show it.
result_json = json.dumps(result, indent=4)
print(result_json)

{
    "is_violation": false,
    "violated_principle": null,
    "explanation": null
}
