# database and table configs

## These cells create the database and its tables
We need one table for each fallacy.

In [0]:
%sql
-- Create the schema that holds the fallacy tables (no-op if it already exists).
-- NOTE(review): this is the only statement in the notebook qualified with the
-- `workspace` catalog; every other statement uses logical_fallacy_data
-- unqualified, so they rely on `workspace` being the current catalog -- confirm.
CREATE DATABASE IF NOT EXISTS workspace.logical_fallacy_data;

In [0]:
%sql
-- Labelled sentences for the red-herring fallacy: `text` is the sentence and
-- `label` is true when the sentence is a red-herring example.
CREATE TABLE IF NOT EXISTS logical_fallacy_data.red_herring (
  text STRING,
  label BOOLEAN
);

In [0]:
%sql
-- Labelled sentences for the straw-man fallacy: `text` is the sentence and
-- `label` is true when the sentence is a straw-man example.
CREATE TABLE IF NOT EXISTS logical_fallacy_data.straw_man (
  text STRING,
  label BOOLEAN
);

In [0]:
%sql
-- Labelled sentences for the slippery-slope fallacy: `text` is the sentence and
-- `label` is true when the sentence is a slippery-slope example.
CREATE TABLE IF NOT EXISTS logical_fallacy_data.slippery_slope (
  text STRING,
  label BOOLEAN
);

In [0]:
%sql
-- Labelled sentences for the hasty-generalization fallacy: `text` is the
-- sentence and `label` is true when it is a hasty-generalization example.
CREATE TABLE IF NOT EXISTS logical_fallacy_data.hasty_generalization (
  text STRING,
  label BOOLEAN
);

In [0]:
%sql
-- Labelled sentences for the "attacking" fallacy table: `text` is the sentence,
-- `label` flags fallacious rows (presumably true = attack on the person; the
-- populate cell supplies 1/0 values -- confirm).
CREATE TABLE IF NOT EXISTS logical_fallacy_data.attacking (
  text STRING,
  label BOOLEAN
);

In [0]:
%sql
-- Labelled sentences for the appeal-to-ignorance table: `text` is the sentence,
-- `label` flags fallacious rows (presumably true = appeal to ignorance; the
-- populate cell supplies 1/0 values -- confirm).
CREATE TABLE IF NOT EXISTS logical_fallacy_data.ignorance (
  text STRING,
  label BOOLEAN
);

In [0]:
%sql
-- Labelled sentences for the hypocrisy table: `text` is the sentence, `label`
-- flags fallacious rows (presumably true = hypocrisy fallacy; the populate
-- cell supplies 1/0 values -- confirm).
CREATE TABLE IF NOT EXISTS logical_fallacy_data.hypocrisy (
  text STRING,
  label BOOLEAN
);

In [0]:
%sql
-- Labelled sentences for the stacking-the-deck table: `text` is the sentence.
-- NOTE(review): the raw data for this table carries string labels
-- (stacking_deck / healthy_argument / non_argument); confirm how they are
-- mapped onto this BOOLEAN `label` column.
CREATE TABLE IF NOT EXISTS logical_fallacy_data.stacking_deck (
  text STRING,
  label BOOLEAN
);

In [0]:
%sql
-- Table with the same (text, label) layout as the other fallacy tables.
-- NOTE(review): the `attacking` table already appears to hold ad hominem
-- examples -- confirm this table is still needed and where it is populated.
CREATE TABLE IF NOT EXISTS logical_fallacy_data.ad_hominem (
  text STRING,
  label BOOLEAN
);

# Access

In [0]:
%sql
-- Allow the collaborator to reference objects inside the schema; privileges on
-- the individual tables are granted in separate statements.
GRANT USE SCHEMA ON SCHEMA logical_fallacy_data TO `ryabumoto1655@sdsu.edu`;


In [0]:
%sql
-- Give the collaborator full privileges on the fallacy tables listed below.
-- NOTE(review): hypocrisy, stacking_deck and ad_hominem are created in this
-- notebook but are not granted here -- confirm whether that is intentional.
GRANT ALL PRIVILEGES ON TABLE logical_fallacy_data.red_herring TO `ryabumoto1655@sdsu.edu`;
GRANT ALL PRIVILEGES ON TABLE logical_fallacy_data.straw_man TO `ryabumoto1655@sdsu.edu`;
GRANT ALL PRIVILEGES ON TABLE logical_fallacy_data.hasty_generalization TO `ryabumoto1655@sdsu.edu`;
GRANT ALL PRIVILEGES ON TABLE logical_fallacy_data.slippery_slope TO `ryabumoto1655@sdsu.edu`;
GRANT ALL PRIVILEGES ON TABLE logical_fallacy_data.attacking TO `ryabumoto1655@sdsu.edu`;
GRANT ALL PRIVILEGES ON TABLE logical_fallacy_data.ignorance TO `ryabumoto1655@sdsu.edu`;


# Populate Red-Herring Table

In [0]:
# Sentences that commit the red-herring fallacy (stored with label = true).
# One list element per line.
red_herring_examples = [
    "We shouldn’t worry about climate change when there are so many people unemployed.",
    "Why talk about school funding? Let’s focus on the real problem: declining family values.",
    "I know I made a mistake at work, but think of all the good things I’ve done.",
    "Sure, I didn’t clean the kitchen, but you never take the trash out!",
    "You're asking about taxes, but what about crime rates?",
    "Let’s not talk about the budget. Have you seen how poorly dressed the mayor is?",
    "We don’t need to fix the potholes. The real issue is people driving too fast.",
    "Yes, we need healthcare reform, but look at how much athletes get paid!",
    "The suspect was wearing a red jacket, but have you noticed how high the crime rate is in this city?",
    "The victim was known to have a lot of enemies, but let’s focus on the time of day it happened.",
    "I know the evidence points to one person, but what about the history of the neighborhood?",
    "The room was locked from the inside, but I’ve been thinking about the victim’s past relationships.",
    "Sure, the fingerprints match, but the security system was malfunctioning all week.",
    "The car was seen near the scene, but have you ever thought about how this neighborhood is prone to accidents?",
    "We should examine the victim’s phone records, but there’s something odd about the weather that day.",
    "There’s a bloodstain on the floor, but don’t forget that the city has been experiencing a surge in burglaries.",
    "The security footage shows someone wearing a mask, but we should first explore the victim's financial troubles.",
    "They found a weapon in the room, but what if the victim had a history of mental health issues?",
    "The suspect had a motive, but have you heard about the strange rumors circulating in the town?",
    "There’s a trail of footprints leading away from the scene, but let’s not forget the local gang activity.",
    "The eyewitness testimony is shaky, but we need to look at the way the victim’s family reacts.",
    "The victim’s friend has an alibi, but the weather that night was absolutely horrific.",
    "We found a clue in the victim’s office, but let’s focus more on the nearby construction site.",
    "It’s possible the suspect had access to the victim’s house, but let’s talk about the strange behavior of the neighbors.",
    "The fingerprints found at the scene don’t match anyone in the database, but what if the culprit is from out of town?",
    "The weapon used was unusual, but what’s more interesting is the victim's connection to the community center.",
    "We found a phone at the scene, but I think it’s important to discuss the lack of streetlights in that area.",
    "Sure, there’s a suspect in mind, but did you know the power grid went down the night of the crime?",
    "We have a possible lead, but I’m more interested in the fact that the building was undergoing renovations.",
    "The victim had a history of gambling, but have you considered how the location of the incident might have influenced the event?",
    "The alibi of the suspect seems solid, but let’s not forget about the mysterious disappearances in the nearby town.",
    "The car was parked nearby, but I think we should focus on the suspicious construction workers in the area.",
    "There were multiple witnesses, but it’s worth considering the recent local protests happening around that time.",
    "The victim’s financial records are strange, but have you considered how the crime rate has been increasing in this area?",
    "The suspect’s fingerprints are all over the scene, but I’m more curious about the strange noises reported that night.",
]

# Sound, on-topic arguments: these are counter-examples, not fallacies.
healthy_arguments = [
    "I think we need to increase school funding because of declining test scores.",
    "While I understand your point, data shows climate change is a growing concern.",
    "It’s true that taxes are high, but healthcare access is crucial.",
    "Yes, unemployment is an issue, but we must also address climate change.",
    "Cleaning the kitchen is important; let’s both take responsibility.",
    "We need to discuss both crime rates and taxation separately.",
    "The suspect's motive was clear: financial gain. This directly ties into the victim’s recent large withdrawal.",
    "The fingerprints found on the weapon match the suspect, which places them at the crime scene.",
    "Witnesses described hearing a confrontation between the suspect and the victim minutes before the crime.",
    "Security footage shows the suspect entering the building at the same time the crime was committed.",
    "The timeline of events matches up perfectly with the suspect’s movements during the night of the crime.",
    "The victim’s recent behavior suggested they were under a lot of stress, which could explain their actions.",
    "The location of the crime is consistent with the suspect’s known residence, making it geographically relevant.",
    "The medical examiner confirmed the cause of death, which directly supports the suspect’s involvement in the crime.",
    "The victim’s phone records show text messages threatening harm from the suspect just days before the incident.",
    "The car seen near the scene was registered to the suspect, and forensic evidence links it to the crime.",
    "There are no signs of forced entry into the victim’s home, indicating the suspect may have had a key.",
    "The victim had recently filed a police report against the suspect for harassment, which strengthens the case.",
    "There were no power outages reported in the area, so there’s no reason to believe the security system would have failed.",
    "The weapon was found in the suspect’s possession, which directly links them to the crime scene.",
    "The suspect's alibi was verified by multiple independent sources, providing a clear defense against the accusation.",
    "Forensic evidence confirms that the victim was already dead before the fire started, ruling out certain theories.",
    "The suspect was in a public place at the time of the crime, with multiple witnesses who can corroborate their alibi.",
    "The victim’s personal history with the suspect, including recent arguments, is directly relevant to the case.",
    "The injuries on the victim’s body are consistent with the suspect’s known fighting style, further connecting them.",
    "A thorough investigation reveals that the suspect was involved in similar crimes in the past, adding credibility to the claim.",
    "A full toxicology report shows the victim had traces of the suspect’s medication in their system, linking them further.",
    "The time of death corresponds with the suspect’s arrival at their residence, narrowing down the window of opportunity.",
    "The suspect’s motive is based on solid financial records showing they stood to gain from the victim’s death.",
    "Witness testimony, backed by physical evidence, places the suspect at the crime scene shortly before the crime occurred.",
    "The location of the crime was chosen because the suspect knew the victim often worked late, making it a calculated decision.",
]

# Everyday remarks that make no argument at all.
non_arguments = [
    "I love watching documentaries on space exploration.",
    "The weather has been nice lately.",
    "I prefer tea over coffee in the mornings.",
    "My dog just learned a new trick.",
    "you are awesome",
    "but why are we going there",
]

# Everything that is not a red herring: neutral remarks first, then the sound
# arguments.
red_herring_non_examples = [*non_arguments, *healthy_arguments]

# Append every red-herring row in a single write instead of issuing one
# string-built INSERT statement per sentence. This avoids hand-escaping quotes
# inside SQL text and replaces dozens of single-row inserts with one append.
red_herring_rows = [(sentence, True) for sentence in red_herring_examples]
red_herring_rows += [(sentence, False) for sentence in red_herring_non_examples]

# The explicit schema keeps the column types aligned with the table definition
# (text STRING, label BOOLEAN); insertInto resolves columns by position.
red_herring_df = spark.createDataFrame(red_herring_rows, "text STRING, label BOOLEAN")
red_herring_df.write.insertInto("logical_fallacy_data.red_herring", overwrite=False)

In [0]:
%sql
-- Deduplicate red_herring: copy the distinct rows into a scratch table, drop
-- the original, rename the scratch table into its place, then re-issue the
-- grant on the recreated table.
-- The leading DROP ... IF EXISTS clears a scratch table left behind by an
-- earlier failed run so the cell can be re-run, matching the other dedupe cells.
-- NOTE(review): the swap is not atomic. If RENAME fails after the original is
-- dropped, red_herring_new is the only copy of the data -- rename it manually
-- rather than re-running this cell.
DROP TABLE IF EXISTS red_herring_new;
CREATE TABLE red_herring_new AS SELECT DISTINCT *
FROM logical_fallacy_data.red_herring;

DROP TABLE logical_fallacy_data.red_herring;

ALTER TABLE red_herring_new
RENAME TO logical_fallacy_data.red_herring;

GRANT ALL PRIVILEGES ON TABLE logical_fallacy_data.red_herring TO `ryabumoto1655@sdsu.edu`;

# Populate Straw-man Table

In [0]:
# Populate Straw-man

# Straw Man Fallacy examples (stored with label = true)
# NOTE(review): this entry reads like placeholder text, yet it is inserted as a
# positive example -- replace it with real straw-man sentences.
straw_man_examples = [
    "this is not an example"
]

# Healthy counter-arguments (not fallacious)
healthy_arguments = [
    "hey why dont you be more respectful"
]
# Neutral/non-argumentative
non_arguments = [
    "I love watching documentaries on space exploration.",
    "The weather has been nice lately.",
    "I prefer tea over coffee in the mornings.",
    "My dog just learned a new trick.",
    "you are awesome",
    "but why are we going there"
]

straw_man_non_examples = non_arguments + healthy_arguments

# Append all rows in a single write instead of one string-built INSERT per
# sentence; this avoids hand-escaping quotes inside SQL text.
straw_man_rows = [(sentence, True) for sentence in straw_man_examples]
straw_man_rows += [(sentence, False) for sentence in straw_man_non_examples]

# The explicit schema matches the table definition (text STRING, label BOOLEAN);
# insertInto resolves columns by position.
straw_man_df = spark.createDataFrame(straw_man_rows, "text STRING, label BOOLEAN")
straw_man_df.write.insertInto("logical_fallacy_data.straw_man", overwrite=False)

In [0]:
%sql
-- Deduplicate straw_man: copy the distinct rows into a scratch table, drop the
-- original, rename the scratch table into its place, then re-issue the grant
-- on the recreated table.
-- NOTE(review): straw_man_new is unqualified, so it is created in whatever
-- schema is current; confirm the rename into logical_fallacy_data is permitted.
-- NOTE(review): the swap is not atomic. If RENAME fails after the original is
-- dropped, straw_man_new is the only copy of the data, and re-running this
-- cell would drop it first.
DROP TABLE IF EXISTS straw_man_new;
CREATE TABLE straw_man_new AS SELECT DISTINCT *
FROM logical_fallacy_data.straw_man;

DROP TABLE logical_fallacy_data.straw_man;

ALTER TABLE straw_man_new
RENAME TO logical_fallacy_data.straw_man;

GRANT ALL PRIVILEGES ON TABLE logical_fallacy_data.straw_man TO `ryabumoto1655@sdsu.edu`;

# Populate Slippery Slope

In [0]:
# Populate Slippery Slope

# Slippery Slope Fallacy examples (stored with label = true)
# NOTE(review): this entry reads like placeholder text, yet it is inserted as a
# positive example -- replace it with real slippery-slope sentences.
slippery_slope_examples = [
    "this is not an example"
]

# Healthy counter-arguments (not fallacious)
healthy_arguments = [
    "hey why dont you be more respectful"
]
# Neutral/non-argumentative
non_arguments = [
    "I love watching documentaries on space exploration.",
    "The weather has been nice lately.",
    "I prefer tea over coffee in the mornings.",
    "My dog just learned a new trick.",
    "you are awesome",
    "but why are we going there"
]

slippery_slope_non_examples = non_arguments + healthy_arguments

# Append all rows in a single write instead of one string-built INSERT per
# sentence; this avoids hand-escaping quotes inside SQL text.
slippery_slope_rows = [(sentence, True) for sentence in slippery_slope_examples]
slippery_slope_rows += [(sentence, False) for sentence in slippery_slope_non_examples]

# The explicit schema matches the table definition (text STRING, label BOOLEAN);
# insertInto resolves columns by position.
slippery_slope_df = spark.createDataFrame(slippery_slope_rows, "text STRING, label BOOLEAN")
slippery_slope_df.write.insertInto("logical_fallacy_data.slippery_slope", overwrite=False)

In [0]:
%sql
-- Deduplicate slippery_slope: copy the distinct rows into a scratch table, drop
-- the original, rename the scratch table into its place, then re-issue the
-- grant on the recreated table.
-- NOTE(review): slippery_slope_new is unqualified, so it is created in whatever
-- schema is current; confirm the rename into logical_fallacy_data is permitted.
-- NOTE(review): the swap is not atomic. If RENAME fails after the original is
-- dropped, slippery_slope_new is the only copy of the data, and re-running
-- this cell would drop it first.
DROP TABLE IF EXISTS slippery_slope_new;
CREATE TABLE slippery_slope_new AS SELECT DISTINCT *
FROM logical_fallacy_data.slippery_slope;

DROP TABLE logical_fallacy_data.slippery_slope;

ALTER TABLE slippery_slope_new
RENAME TO logical_fallacy_data.slippery_slope;

GRANT ALL PRIVILEGES ON TABLE logical_fallacy_data.slippery_slope TO `ryabumoto1655@sdsu.edu`;

# Populate Hasty Generalizations

In [0]:
# Populate Hasty Generalization

# Hasty Generalization Fallacy examples (stored with label = true)
# NOTE(review): this entry reads like placeholder text, yet it is inserted as a
# positive example -- replace it with real hasty-generalization sentences.
hasty_generalization_examples = [
    "this is not an example"
]

# Healthy counter-arguments (not fallacious)
healthy_arguments = [
    "hey why dont you be more respectful"
]
# Neutral/non-argumentative
non_arguments = [
    "I love watching documentaries on space exploration.",
    "The weather has been nice lately.",
    "I prefer tea over coffee in the mornings.",
    "My dog just learned a new trick.",
    "you are awesome",
    "but why are we going there"
]

hasty_generalization_non_examples = non_arguments + healthy_arguments

# Append all rows in a single write instead of one string-built INSERT per
# sentence; this avoids hand-escaping quotes inside SQL text.
hasty_generalization_rows = [(sentence, True) for sentence in hasty_generalization_examples]
hasty_generalization_rows += [(sentence, False) for sentence in hasty_generalization_non_examples]

# The explicit schema matches the table definition (text STRING, label BOOLEAN);
# insertInto resolves columns by position.
hasty_generalization_df = spark.createDataFrame(
    hasty_generalization_rows, "text STRING, label BOOLEAN"
)
hasty_generalization_df.write.insertInto(
    "logical_fallacy_data.hasty_generalization", overwrite=False
)

In [0]:
%sql
-- Deduplicate hasty_generalization: copy the distinct rows into a scratch
-- table, drop the original, rename the scratch table into its place, then
-- re-issue the grant on the recreated table.
-- NOTE(review): hasty_generalization_new is unqualified, so it is created in
-- whatever schema is current; confirm the rename into logical_fallacy_data is
-- permitted.
-- NOTE(review): the swap is not atomic. If RENAME fails after the original is
-- dropped, hasty_generalization_new is the only copy of the data, and
-- re-running this cell would drop it first.
DROP TABLE IF EXISTS hasty_generalization_new;
CREATE TABLE hasty_generalization_new AS SELECT DISTINCT *
FROM logical_fallacy_data.hasty_generalization;

DROP TABLE logical_fallacy_data.hasty_generalization;

ALTER TABLE hasty_generalization_new
RENAME TO logical_fallacy_data.hasty_generalization;

GRANT ALL PRIVILEGES ON TABLE logical_fallacy_data.hasty_generalization TO `ryabumoto1655@sdsu.edu`;

# Populate Attacking Table

In [0]:
from pyspark.sql import SparkSession

# Start (or reuse) the Spark session. The application name now matches the
# table this cell fills; it previously carried a name copied from another cell.
spark = SparkSession.builder \
    .appName("Insert Attacking Examples") \
    .enableHiveSupport() \
    .getOrCreate()

# Inlined data from the CSV: (text, label) pairs with label given as 1 or 0.
# Presumably 1 marks an attack on the person and 0 anything else -- confirm.
data = [
    ("Don't take his advice on health; he's overweight.", 1),
    ("Her financial advice is grounded in years of experience.", 0),
    ("Evidence should determine truth, not personal attacks.", 0),
    ("If we legalize this, what’s next? Total anarchy?", 0),
    ("Why should we take advice from someone who's been divorced three times?", 1),
    ("Don’t listen to her views on parenting—she doesn’t even have kids.", 1),
    ("He’s just a conspiracy theorist, so ignore him.", 1),
    ("You’re only saying that because you're jealous.", 1),
    ("He failed before, so this idea must fail too.", 0),
    ("Criticizing the person doesn't disprove the argument.", 0),
    ("We should evaluate the proposal based on its merits.", 0),
    ("What would a millennial like you know about hard work?", 1),
    ("She’s rich, so her opinion on poverty doesn’t matter.", 1),
    ("You can't trust John's views on politics—he dropped out of college.", 1),
    ("He opposes the war, but he's just a coward.", 1),
    ("His political views are supported by well-researched data.", 0),
    ("Only a fool would disagree with this plan.", 0),
    ("Since you can’t prove it’s false, it must be true.", 0),
    ("There's no evidence for ghosts, so they don't exist.", 0),
    ("It’s clearly wrong because it feels wrong.", 0),
    ("He’s just saying that because he’s a failed actor.", 1),
    ("That claim must be true—everyone believes it.", 0),
    ("We’ve always done it this way, so it must be right.", 0),
    ("The argument stands regardless of who presents it.", 0),
    ("Judging by appearance isn’t a valid counterargument.", 0),
    ("Let's consider the content of the idea, not the person.", 0),
    ("The government hasn’t denied it, so it must be real.", 0),
    ("Don't believe her argument about the environment; she flies everywhere.", 1),
    ("Her argument aligns with peer-reviewed research.", 0),
    ("Her stance on climate change is based on scientific studies.", 0),
    ("He made a good point about health risks supported by facts.", 0),
    ("Ignore his take on economics; he went bankrupt once.", 1),
    ("Of course he supports taxes—he’s a government employee.", 1),
    ("The data speaks louder than the person presenting it.", 0),
    ("The speaker provided evidence to support her position.", 0),
    ("This happened after that, so it must be the cause.", 0),
    ("You're only supporting that idea because you're lazy.", 1),
    ("We should focus on the issue, not the individual.", 0),
    ("Even if he's flawed, his logic is sound.", 0),
    ("She only supports that candidate because she’s from his hometown.", 1),
    ("You shouldn't listen to Nina; they're just a airhead.", 1),
    ("She only believes that because she's irrational.", 1),
    ("His argument is invalid because he's just a influencer.", 1),
    ("Even flawed people can present good ideas.", 0),
    ("You shouldn't listen to Ella; they're just a gold digger.", 1),
    ("The point should be considered independently of Susan's personal history.", 0),
    ("His argument is invalid because he's just a janitor.", 1),
    ("The point should be considered independently of Dan's personal history.", 0),
    ("She only believes that because she's young.", 1),
    ("You shouldn't listen to Susan; they're just a know-it-all.", 1),
    ("She only believes that because she's insecure.", 1),
    ("His argument is invalid because he's just a bartender.", 1),
    ("She only believes that because she's naive.", 1),
    ("His argument is invalid because he's just a YouTuber.", 1),
    ("His argument is invalid because he's just a comedian.", 1),
    ("The point should be considered independently of Jenny's personal history.", 0),
    ("She only believes that because she's jealous.", 1),
    ("Facts should not depend on the speaker's identity.", 0),
    ("She only believes that because she's old-fashioned.", 1),
    ("Her claim is valid regardless of her occupation.", 0),
    ("His argument is invalid because he's just a blogger.", 1),
    ("She only believes that because she's bitter.", 1),
    ("His argument is invalid because he's just a celebrity.", 1),
    ("Let's discuss the point, not the person making it.", 0),
    ("His argument is invalid because he's just a intern.", 1),
    ("The point should be considered independently of Tom's personal history.", 0),
    ("Reasoning matters more than reputation.", 0),
    ("The issue is more important than the messenger.", 0),
    ("You shouldn't listen to Jenny; they're just a drama queen.", 1),
    ("The point should be considered independently of Alex's personal history.", 0),
    ("You shouldn't listen to Tom; they're just a hypocrite.", 1),
    ("His argument is invalid because he's just a student.", 1),
    ("The point should be considered independently of Ella's personal history.", 0),
    ("Arguments must stand on logic, not personal backgrounds.", 0),
    ("You shouldn't listen to Mark; they're just a loser.", 1),
    ("The point should be considered independently of Rob's personal history.", 0),
    ("Evaluate the argument, not the arguer.", 0),
    ("He supports his point with strong evidence.", 0),
    ("You shouldn't listen to Rachel; they're just a attention seeker.", 1),
    ("You shouldn't listen to Dan; they're just a narcissist.", 1),
    ("She only believes that because she's privileged.", 1),
    ("You shouldn't listen to Alex; they're just a slacker.", 1),
    ("The point should be considered independently of Nina's personal history.", 0),
    ("She only believes that because she's emotional.", 1),
    ("She only believes that because she's rich.", 1),
]

# Create DataFrame. The labels above are integers, but the target column is
# BOOLEAN, so convert them explicitly and pin the schema rather than relying on
# an implicit integer-to-boolean cast at write time.
df = spark.createDataFrame(
    [(text, bool(label)) for text, label in data],
    "text STRING, label BOOLEAN",
)

# Append to the table; insertInto resolves columns by position.
df.write.insertInto("logical_fallacy_data.attacking", overwrite=False)


In [0]:
%sql
-- Deduplicate attacking: copy the distinct rows into a scratch table, drop the
-- original, rename the scratch table into its place, then re-issue the grant
-- on the recreated table.
-- NOTE(review): attacking_new is unqualified, so it is created in whatever
-- schema is current; confirm the rename into logical_fallacy_data is permitted.
-- NOTE(review): the swap is not atomic. If RENAME fails after the original is
-- dropped, attacking_new is the only copy of the data, and re-running this
-- cell would drop it first.
DROP TABLE IF EXISTS attacking_new;
CREATE TABLE attacking_new AS SELECT DISTINCT *
FROM logical_fallacy_data.attacking;

DROP TABLE logical_fallacy_data.attacking;

ALTER TABLE attacking_new
RENAME TO logical_fallacy_data.attacking;

GRANT ALL PRIVILEGES ON TABLE logical_fallacy_data.attacking TO `ryabumoto1655@sdsu.edu`;

# Populate Ignorance Table

In [0]:
from pyspark.sql import SparkSession

# Start (or reuse) the Spark session
spark = SparkSession.builder \
    .appName("Insert Appeal to Ignorance Examples") \
    .enableHiveSupport() \
    .getOrCreate()

# Inlined data from the Appeal to Ignorance CSV: (text, label) pairs with label
# given as 1 or 0. Presumably 1 marks an appeal to ignorance -- confirm.
data = [
    ("That new neighbor looks suspicious, so he probably is.", 0),
    ("If we don't act now, everything will collapse.", 0),
    ("No proof of Bigfoot has been found, so he doesn't exist.", 1),
    ("A theory must be falsifiable to be scientific.", 0),
    ("I had a dream about it, so it must mean something.", 0),
    ("You're just saying that because you're angry.", 0),
    ("Everybody believes it, so it can’t be wrong.", 0),
    ("This conclusion is based on available data, not speculation.", 0),
    ("If we ban cars, what's next? Bikes too?", 0),
    ("Ghost stories are not supported by scientific evidence.", 0),
    ("Unproven does not mean untrue, just unverified.", 0),
    ("No one’s ever returned from the afterlife, so it doesn’t exist.", 1),
    ("Logical reasoning requires evidence, not assumptions.", 0),
    ("You can't prove aliens aren't visiting us, so they must be.", 1),
    ("No one has proven that ghosts don't exist, so they must be real.", 1),
    ("Scientific claims must be supported by empirical data.", 0),
    ("No one has shown that the new policy is bad, so it must be good.", 1),
    ("Our conclusion should be based on what we know, not what we don’t.", 0),
    ("Since there's no evidence against the claim, it has to be true.", 1),
    ("To confirm the hypothesis, we need experimental validation.", 0),
    ("The burden of proof lies with the person making the claim.", 0),
    ("He’s a criminal, so his views on law reform are invalid.", 0),
    ("There’s no proof that vaccines don’t cause long-term harm, so they must be unsafe.", 1),
    ("Assertions require verification to be credible.", 0),
    ("Nobody has shown the new drug doesn’t work, so it must be effective.", 1),
    ("No one has proven climate change isn't a hoax, so it probably is.", 1),
    ("There’s no evidence that eating after 8 p.m. is harmful, so it must be fine.", 1),
    ("We cannot conclude the drug is safe without further testing.", 0),
    ("We haven’t found life on Mars yet, so there definitely isn’t any.", 1),
    ("There's no way to disprove fate, so it must be real.", 1),
    ("You can't prove I cheated, so I must be innocent.", 1),
    ("Skepticism is warranted without observable proof.", 0),
    ("He always lies, so this must be a lie too.", 0),
    ("Until you prove that the suspect is innocent, he must be guilty.", 1),
    ("She’s rich, so she must not understand poverty.", 0),
    ("Absence of evidence is not the same as evidence of absence.", 0),
    ("You haven't shown the machine won't explode, so it’s dangerous.", 1),
    ("My mom said it’s true, so it must be.", 0),
    ("Let’s withhold judgment until we have more evidence.", 0),
    ("Lack of evidence doesn't necessarily prove a claim is false.", 0),
    ("The new study seems promising, but we need evidence to confirm it.", 0),
    ("Dreams are sometimes symbolic, but we need evidence to confirm it.", 0),
    ("Some think the moon landing was fake, but we need evidence to confirm it.", 0),
    ("No one has shown that the earth being flat isn't true, so it must be.", 1),
    ("Astrology might have some patterns, but we need evidence to confirm it.", 0),
    ("No one has shown that miracles happening isn't true, so it must be.", 1),
    ("No one has shown that time travel existing isn't true, so it must be.", 1),
    ("No one has shown that astrology isn't true, so it must be.", 1),
    ("Alien life is a possibility, but we need evidence to confirm it.", 0),
    ("No one has shown that celebrities being clones isn't true, so it must be.", 1),
    ("No one has shown that the new diet being unhealthy isn't true, so it must be.", 1),
    ("No one has shown that the government hiding secrets isn't true, so it must be.", 1),
    ("You can't prove she's a good leader, so it must be false.", 1),
    ("You can't prove this medicine helps, so it must be false.", 1),
    ("You can't prove the test was fair, so it must be false.", 1),
    ("You can't prove aliens built the pyramids, so it must be false.", 1),
    ("No one has shown that the moon landing being fake isn't true, so it must be.", 1),
    ("Pollution statistics vary, but we need evidence to confirm it.", 0),
    ("No one has shown that video games causing violence isn't true, so it must be.", 1),
    ("You can't prove exercise improves mental health, so it must be false.", 1),
    ("Conspiracy theories are widespread, but we need evidence to confirm it.", 0),
    ("You can't prove the vaccine is safe, so it must be false.", 1),
    ("No one has shown that reincarnation being real isn't true, so it must be.", 1),
    ("You can't prove climate change is real, so it must be false.", 1),
    ("No one has shown that dreams predicting the future isn't true, so it must be.", 1),
    ("Many claim reincarnation is real, but we need evidence to confirm it.", 0),
    ("Nobody has shown the new drug doesn’t work, so it must be effective.", 1),
    ("Time travel is a popular sci-fi theme, but we need evidence to confirm it.", 0),
    ("New diets should be researched, but we need evidence to confirm it.", 0),
    ("You can't prove the study is accurate, so it must be false.", 1),
    ("You can't prove recycling reduces pollution, so it must be false.", 1),
    ("No one has shown that COVID being man-made isn't true, so it must be.", 1),
    ("You can't prove they are trustworthy, so it must be false.", 1),
    ("No one has shown that the cure for cancer being hidden isn't true, so it must be.", 1),
    ("Claims about vaccines must be tested, but we need evidence to confirm it.", 0),
    ("You can't prove this law benefits the people, so it must be false.", 1),
    ("No one has shown that aliens controlling governments isn't true, so it must be.", 1),
    ("You can't prove he's telling the truth, so it must be false.", 1),
    ("This medicine has potential, but we need evidence to confirm it.", 0),
    ("You can't prove this theory is valid, so it must be false.", 1),
]

# Create Spark DataFrame. The labels above are integers, but the target column
# is BOOLEAN, so convert them explicitly and pin the schema rather than relying
# on an implicit integer-to-boolean cast at write time.
df = spark.createDataFrame(
    [(text, bool(label)) for text, label in data],
    "text STRING, label BOOLEAN",
)

# Append to the table; insertInto resolves columns by position.
df.write.insertInto("logical_fallacy_data.ignorance", overwrite=False)


In [0]:
%sql
-- Deduplicate ignorance: copy the distinct rows into a scratch table, drop the
-- original, rename the scratch table into its place, then re-issue the grant
-- on the recreated table.
-- NOTE(review): ignorance_new is unqualified, so it is created in whatever
-- schema is current; confirm the rename into logical_fallacy_data is permitted.
-- NOTE(review): the swap is not atomic. If RENAME fails after the original is
-- dropped, ignorance_new is the only copy of the data, and re-running this
-- cell would drop it first.
DROP TABLE IF EXISTS ignorance_new;
CREATE TABLE ignorance_new AS SELECT DISTINCT *
FROM logical_fallacy_data.ignorance;

DROP TABLE logical_fallacy_data.ignorance;

ALTER TABLE ignorance_new
RENAME TO logical_fallacy_data.ignorance;

GRANT ALL PRIVILEGES ON TABLE logical_fallacy_data.ignorance TO `ryabumoto1655@sdsu.edu`;

# Populate Hypocrisy Table

In [0]:
from pyspark.sql import SparkSession

# Start (or reuse) the Spark session
spark = SparkSession.builder \
    .appName("Insert Hypocrisy Fallacy Examples") \
    .enableHiveSupport() \
    .getOrCreate()

# Inlined hypocrisy data: (text, label) pairs with label given as 1 or 0.
# Presumably 1 marks a hypocrisy fallacy -- confirm.
data = [
    ("Eating meat has ethical implications depending on how animals are treated.", 0),
    ("You say I shouldn't cheat on my taxes, but you did it last year too.", 1),
    ("He says pollution is bad, yet he drives a gas-guzzling SUV.", 1),
    ("Aliens must exist because no one has proven they don't.", 0),
    ("You're telling me not to skip workouts, but you skipped last week.", 1),
    ("Investing in renewable energy helps reduce pollution.", 0),
    ("Cheating on taxes is illegal and undermines public services.", 0),
    ("Lying can damage trust and relationships.", 0),
    ("Saving money can lead to better financial stability.", 0),
    ("She lectures us on saving money, but spends a fortune on clothes.", 1),
    ("Don't tell me to study harder—you never studied and still passed.", 1),
    ("How can you criticize my spending when you waste money on gadgets?", 1),
    ("Following rules ensures safety and fairness for all.", 0),
    ("We’ve always done it this way, so it must be right.", 0),
    ("She thinks eating meat is unethical, but wears leather boots.", 1),
    ("You haven’t shown any evidence, so your argument must be false.", 0),
    ("You can't trust his argument about war; he's a soldier.", 0),
    ("Studying regularly improves academic performance.", 0),
    ("If we allow same-sex marriage, what's next? Marrying animals?", 0),
    ("You say we should follow the rules, but you always break them.", 1),
    ("Since there's no proof the policy works, it must be flawed.", 0),
    ("Spending habits should be evaluated based on priorities.", 0),
    ("You argue that lying is wrong, but you've lied before.", 1),
    ("Ghosts are real because I've seen one.", 0),
    ("Skipping workouts might slow down your progress.", 0),
    ("He claims to support equality, but he never promotes women at work.", 1),
    ("Don't listen to her opinion on diets, she’s overweight.", 0),
    ("Promoting equality helps create a fairer workplace.", 0),
    ("She’s a smoker, so ignore her views on health.", 0),
    ("He’s just a teenager, what does he know about politics?", 0),
    ("You tell me not to waste food, but you waste food all the time.", 1),
    ("A balanced diet is important for a healthy lifestyle.", 0),
    ("You tell me not to skip class, but you skipped class all the time.", 1),
    ("Just trust me, it’s common sense.", 0),
    ("You tell me not to ignore emails, but you ignored emails all the time.", 1),
    ("Following traffic laws is important for a healthy lifestyle.", 0),
    ("Good sleep is important for a healthy lifestyle.", 0),
    ("My grandfather smoked his whole life and lived to 100.", 0),
    ("How can she talk about climate change when she flies often?", 0),
    ("You tell me not to watch TV late, but you watch TV late all the time.", 1),
    ("If we don't act now, the world will end tomorrow.", 0),
    ("Time management is important for a healthy lifestyle.", 0),
    ("You tell me not to procrastinate, but you procrastinated all the time.", 1),
    ("Environmental awareness is important for a healthy lifestyle.", 0),
    ("Regular exercise is important for a healthy lifestyle.", 0),
    ("The new policy must be wrong because it's unpopular.", 0),
    ("You tell me not to miss deadlines, but you miss deadlines all the time.", 1),
    ("No one's disproved unicorns exist, so they might be real.", 0),
    ("It's always been done this way, so it's the best method.", 0),
    ("You tell me not to yell at people, but you yelled at people all the time.", 1),
    ("Financial planning is important for a healthy lifestyle.", 0),
    ("Learning continuously is important for a healthy lifestyle.", 0),
    ("Don't take his argument seriously—he's just a janitor.", 0),
    ("Community service is important for a healthy lifestyle.", 0),
    ("Effective communication is important for a healthy lifestyle.", 0),
    ("Without evidence, your argument is invalid.", 0),
    ("You tell me not to drive fast, but you drive fast all the time.", 1),
    ("Hydration is important for a healthy lifestyle.", 0),
    ("You tell me not to use your phone during meetings, but you used your phone during meetings all the time.", 1),
    ("He’s rich, so he must be wrong about poverty.", 0),
    ("You tell me not to use plastic, but you use plastic all the time.", 1),
    ("You tell me not to drink soda, but you drink soda all the time.", 1),
    ("Only idiots would disagree with this law.", 0),
    ("You tell me not to complain about work, but you complain about work all the time.", 1),
    ("Positive thinking is important for a healthy lifestyle.", 0),
]

# Create DataFrame. The labels above are integers, but the target column is
# BOOLEAN, so convert them explicitly and pin the schema rather than relying on
# an implicit integer-to-boolean cast at write time.
df = spark.createDataFrame(
    [(text, bool(label)) for text, label in data],
    "text STRING, label BOOLEAN",
)

# Append to the table; insertInto resolves columns by position.
df.write.insertInto("logical_fallacy_data.hypocrisy", overwrite=False)


In [0]:
%sql
-- Deduplicate hypocrisy: copy the distinct rows into a scratch table, drop the
-- original, rename the scratch table into its place, then re-issue the grant
-- on the recreated table.
-- NOTE(review): hypocrisy_new is unqualified, so it is created in whatever
-- schema is current; confirm the rename into logical_fallacy_data is permitted.
-- NOTE(review): the swap is not atomic. If RENAME fails after the original is
-- dropped, hypocrisy_new is the only copy of the data, and re-running this
-- cell would drop it first.
DROP TABLE IF EXISTS hypocrisy_new;
CREATE TABLE hypocrisy_new AS SELECT DISTINCT *
FROM logical_fallacy_data.hypocrisy;

DROP TABLE logical_fallacy_data.hypocrisy;

ALTER TABLE hypocrisy_new
RENAME TO logical_fallacy_data.hypocrisy;

GRANT ALL PRIVILEGES ON TABLE logical_fallacy_data.hypocrisy TO `ryabumoto1655@sdsu.edu`;

# Populate Stacking-the-Deck Table

In [0]:
from pyspark.sql import SparkSession
import csv
from io import StringIO

# Step 1: Get (or create) a Hive-enabled Spark session for this cell
spark = (
    SparkSession.builder
    .appName("Insert Stacking the Deck Examples")
    .enableHiveSupport()
    .getOrCreate()
)

# Step 2: Raw CSV text: a `text,label` header followed by one example per line (fields containing commas are quoted)
raw_data = """
text,label
"While this method has worked well, other approaches should be weighed too.",healthy_argument
All experts agree on this — the ones who disagree aren’t real experts.,stacking_deck
My dog loves to run around in the backyard.,non_argument
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
"Our product is the perfect, just ask our most loyal customers.",stacking_deck
The critics who liked it say it's great — ignore the negative reviews.,stacking_deck
All experts agree on this — the ones who disagree aren’t real experts.,stacking_deck
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
The critics who liked it say it's great — ignore the negative reviews.,stacking_deck
My dog loves to run around in the backyard.,non_argument
You’ve just heard the good things because the bad stuff isn’t worth discussing.,stacking_deck
It’s important to include perspectives that challenge our assumptions.,healthy_argument
There’s a great movie playing at the cinema nearby.,non_argument
I went shopping last evening and bought a new shirt.,non_argument
You’ve just heard the good things because the bad stuff isn’t worth discussing.,stacking_deck
Let’s just hear from the successful people; the rest probably have nothing valuable to add.,stacking_deck
My dog loves to run around in the backyard.,non_argument
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
All experts agree on this — the ones who disagree aren’t real experts.,stacking_deck
I went shopping last evening and bought a new shirt.,non_argument
Let’s just hear from the successful people; the rest probably have nothing valuable to add.,stacking_deck
I went shopping last evening and bought a new shirt.,non_argument
"Everyone agrees that this is the greatest way to go, so we shouldn’t even consider alternatives.",stacking_deck
I enjoy painting as a interest.,non_argument
I went shopping last evening and bought a new shirt.,non_argument
I'm planning to cook pasta for dinner tonight.,non_argument
Let’s just hear from the successful people; the rest probably have nothing valuable to add.,stacking_deck
"Everyone agrees that this is the top way to go, so we shouldn’t even consider alternatives.",stacking_deck
It’s important to include perspectives that challenge our assumptions.,healthy_argument
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
I'm planning to cook pasta for dinner tonight.,non_argument
Let’s just hear from the successful people; the rest probably have nothing valuable to add.,stacking_deck
All experts agree on this — the ones who disagree aren’t real experts.,stacking_deck
All experts agree on this — the ones who disagree aren’t real experts.,stacking_deck
There’s a great movie playing at the cinema nearby.,non_argument
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
"While this method has worked well, other approaches should be weighed too.",healthy_argument
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
Let’s just hear from the successful people; the rest probably have nothing valuable to add.,stacking_deck
All experts agree on this — the ones who disagree aren’t real experts.,stacking_deck
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
My dog loves to run around in the backyard.,non_argument
"Our product is the greatest, just ask our most loyal customers.",stacking_deck
I went shopping last evening and bought a new shirt.,non_argument
All experts agree on this — the ones who disagree aren’t real experts.,stacking_deck
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
I'm planning to cook pasta for dinner tonight.,non_argument
It’s important to include perspectives that challenge our assumptions.,healthy_argument
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
There’s a great movie playing at the cinema nearby.,non_argument
I went shopping last evening and bought a new shirt.,non_argument
I enjoy painting as a interest.,non_argument
You’ve just heard the good things because the bad stuff isn’t worth discussing.,stacking_deck
It’s important to include perspectives that challenge our assumptions.,healthy_argument
The traffic was terrible this morning.,non_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
It’s important to include perspectives that challenge our assumptions.,healthy_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
It’s important to include perspectives that challenge our assumptions.,healthy_argument
I'm planning to cook pasta for dinner tonight.,non_argument
You’ve just heard the good things because the bad stuff isn’t worth discussing.,stacking_deck
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
It’s important to include perspectives that challenge our assumptions.,healthy_argument
It’s important to include perspectives that challenge our assumptions.,healthy_argument
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
"Our product is the perfect, just ask our most loyal customers.",stacking_deck
The traffic was terrible this morning.,non_argument
"Everyone agrees that this is the best way to go, so we shouldn’t even consider alternatives.",stacking_deck
"While this method has worked well, other approaches should be weighed too.",healthy_argument
It’s important to include perspectives that challenge our assumptions.,healthy_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
You’ve just heard the good things because the bad stuff isn’t worth discussing.,stacking_deck
There’s a great movie playing at the cinema nearby.,non_argument
I went shopping last weekend and bought a new jacket.,non_argument
The traffic was terrible this morning.,non_argument
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
Let’s just hear from the successful people; the rest probably have nothing valuable to add.,stacking_deck
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
The critics who liked it say it's great — ignore the negative reviews.,stacking_deck
You’ve just heard the good things because the bad stuff isn’t worth discussing.,stacking_deck
I enjoy painting as a interest.,non_argument
I went shopping last evening and bought a new shirt.,non_argument
I enjoy painting as a interest.,non_argument
There’s a great movie playing at the cinema nearby.,non_argument
"Our product is the perfect, just ask our most loyal customers.",stacking_deck
"While this method has worked well, other approaches should be weighed too.",healthy_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
I'm planning to cook pasta for dinner tonight.,non_argument
It’s important to include perspectives that challenge our assumptions.,healthy_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
I went shopping last evening and bought a new shirt.,non_argument
I enjoy painting as a interest.,non_argument
I enjoy painting as a hobby.,non_argument
My dog loves to run around in the backyard.,non_argument
I'm planning to cook pasta for dinner tonight.,non_argument
The traffic was terrible this morning.,non_argument
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
Let’s just hear from the successful people; the rest probably have nothing valuable to add.,stacking_deck
There’s a great movie playing at the cinema nearby.,non_argument
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
There’s a great movie playing at the cinema nearby.,non_argument
You’ve just heard the good things because the bad stuff isn’t worth discussing.,stacking_deck
Let’s just hear from the successful people; the rest probably have nothing valuable to add.,stacking_deck
You’ve just heard the good things because the bad stuff isn’t worth discussing.,stacking_deck
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
It’s important to include perspectives that challenge our assumptions.,healthy_argument
"Clearly, just fools would think differently.",stacking_deck
"Clearly, just fools would think differently.",stacking_deck
There’s a great movie playing at the cinema nearby.,non_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
"Our product is the greatest, just ask our most loyal customers.",stacking_deck
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
"Everyone agrees that this is the top way to go, so we shouldn’t even consider alternatives.",stacking_deck
The critics who liked it say it's great — ignore the negative reviews.,stacking_deck
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
All experts agree on this — the ones who disagree aren’t real experts.,stacking_deck
"While this method has worked well, other approaches should be weighed too.",healthy_argument
All experts agree on this — the ones who disagree aren’t real experts.,stacking_deck
There’s a great movie playing at the cinema nearby.,non_argument
It’s important to include perspectives that challenge our assumptions.,healthy_argument
Let’s just hear from the successful people; the rest probably have nothing valuable to add.,stacking_deck
"We should examine evidence from a range of sources, both for and against.",healthy_argument
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
"Everyone agrees that this is the top way to go, so we shouldn’t even consider alternatives.",stacking_deck
You’ve just heard the good things because the bad stuff isn’t worth discussing.,stacking_deck
My dog loves to run around in the backyard.,non_argument
"Clearly, just fools would think differently.",stacking_deck
Let’s just hear from the successful people; the rest probably have nothing valuable to add.,stacking_deck
I enjoy painting as a interest.,non_argument
I enjoy painting as a interest.,non_argument
My dog loves to run around in the backyard.,non_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
The traffic was terrible this morning.,non_argument
"Everyone agrees that this is the perfect way to go, so we shouldn’t even consider alternatives.",stacking_deck
All experts agree on this — the ones who disagree aren’t real experts.,stacking_deck
I went shopping last evening and bought a new shirt.,non_argument
There’s a great movie playing at the cinema nearby.,non_argument
You’ve just heard the good things because the bad stuff isn’t worth discussing.,stacking_deck
I'm planning to cook pasta for dinner tonight.,non_argument
I enjoy painting as a interest.,non_argument
"Clearly, just fools would think differently.",stacking_deck
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
You’ve just heard the good things because the bad stuff isn’t worth discussing.,stacking_deck
I went shopping last evening and bought a new shirt.,non_argument
I enjoy painting as a interest.,non_argument
You’ve just heard the good things because the bad stuff isn’t worth discussing.,stacking_deck
"While this method has worked well, other approaches should be considered too.",healthy_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
I went shopping last evening and bought a new shirt.,non_argument
You’ve just heard the good things because the bad stuff isn’t worth discussing.,stacking_deck
"Our product is the perfect, just ask our most loyal customers.",stacking_deck
The critics who liked it say it's great — ignore the negative reviews.,stacking_deck
"Everyone agrees that this is the greatest way to go, so we shouldn’t even consider alternatives.",stacking_deck
All experts agree on this — the ones who disagree aren’t real experts.,stacking_deck
The traffic was terrible this morning.,non_argument
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
"While this method has worked well, other approaches should be weighed too.",healthy_argument
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
I'm planning to cook pasta for dinner tonight.,non_argument
I'm planning to cook pasta for dinner tonight.,non_argument
All experts agree on this — the ones who disagree aren’t real experts.,stacking_deck
I went shopping last evening and bought a new shirt.,non_argument
You’ve just heard the good things because the bad stuff isn’t worth discussing.,stacking_deck
There’s a great movie playing at the cinema nearby.,non_argument
"Everyone agrees that this is the greatest way to go, so we shouldn’t even consider alternatives.",stacking_deck
There’s a great movie playing at the cinema nearby.,non_argument
Let’s just hear from the successful people; the rest probably have nothing valuable to add.,stacking_deck
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
It’s important to include perspectives that challenge our assumptions.,healthy_argument
My dog loves to run around in the backyard.,non_argument
"Clearly, just fools would think differently.",stacking_deck
The critics who liked it say it's great — ignore the negative reviews.,stacking_deck
My dog loves to run around in the backyard.,non_argument
You’ve just heard the good things because the bad stuff isn’t worth discussing.,stacking_deck
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
Let’s just hear from the successful people; the rest probably have nothing valuable to add.,stacking_deck
My dog loves to run around in the backyard.,non_argument
The critics who liked it say it's great — ignore the negative reviews.,stacking_deck
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
It’s important to include perspectives that challenge our assumptions.,healthy_argument
"Everyone agrees that this is the top way to go, so we shouldn’t even consider alternatives.",stacking_deck
I went shopping last evening and bought a new shirt.,non_argument
Let’s just hear from the successful people; the rest probably have nothing valuable to add.,stacking_deck
"Our product is the perfect, just ask our most loyal customers.",stacking_deck
"Our product is the top, just ask our most loyal customers.",stacking_deck
The critics who liked it say it's great — ignore the negative reviews.,stacking_deck
"Clearly, just fools would think differently.",stacking_deck
"Our product is the top, just ask our most loyal customers.",stacking_deck
I'm planning to cook pasta for dinner tonight.,non_argument
My dog loves to run around in the backyard.,non_argument
"Clearly, just fools would think differently.",stacking_deck
"While this method has worked well, other approaches should be weighed too.",healthy_argument
"Everyone agrees that this is the greatest way to go, so we shouldn’t even consider alternatives.",stacking_deck
There’s a great movie playing at the cinema nearby.,non_argument
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
All experts agree on this — the ones who disagree aren’t real experts.,stacking_deck
I'm planning to cook pasta for dinner tonight.,non_argument
Let’s just hear from the successful people; the rest probably have nothing valuable to add.,stacking_deck
The traffic was terrible this morning.,non_argument
I went shopping last evening and bought a new shirt.,non_argument
The traffic was terrible this morning.,non_argument
I enjoy painting as a interest.,non_argument
The critics who liked it say it's great — ignore the negative reviews.,stacking_deck
There’s a great movie playing at the cinema nearby.,non_argument
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
My dog loves to run around in the backyard.,non_argument
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
The critics who liked it say it's great — ignore the negative reviews.,stacking_deck
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
"Everyone agrees that this is the greatest way to go, so we shouldn’t even consider alternatives.",stacking_deck
"Our product is the perfect, just ask our most loyal customers.",stacking_deck
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
There’s a great movie playing at the cinema nearby.,non_argument
It’s important to include perspectives that challenge our assumptions.,healthy_argument
It’s important to include perspectives that challenge our assumptions.,healthy_argument
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
My dog loves to run around in the backyard.,non_argument
I enjoy painting as a interest.,non_argument
"Clearly, just fools would think differently.",stacking_deck
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
The traffic was terrible this morning.,non_argument
There’s a great movie playing at the cinema nearby.,non_argument
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
You’ve just heard the good things because the bad stuff isn’t worth discussing.,stacking_deck
Let’s just hear from the successful people; the rest probably have nothing valuable to add.,stacking_deck
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
The critics who liked it say it's great — ignore the negative reviews.,stacking_deck
The traffic was terrible this morning.,non_argument
I went shopping last evening and bought a new shirt.,non_argument
There’s a great movie playing at the cinema nearby.,non_argument
"Our product is the top, just ask our most loyal customers.",stacking_deck
It’s important to include perspectives that challenge our assumptions.,healthy_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
There’s a great movie playing at the cinema nearby.,non_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
I went shopping last evening and bought a new shirt.,non_argument
You’ve just heard the good things because the bad stuff isn’t worth discussing.,stacking_deck
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
It’s important to include perspectives that challenge our assumptions.,healthy_argument
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
There’s a great movie playing at the cinema nearby.,non_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
The critics who liked it say it's great — ignore the negative reviews.,stacking_deck
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
It’s important to include perspectives that challenge our assumptions.,healthy_argument
My dog loves to run around in the backyard.,non_argument
I went shopping last evening and bought a new shirt.,non_argument
I enjoy painting as a interest.,non_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
All experts agree on this — the ones who disagree aren’t real experts.,stacking_deck
Let’s just hear from the successful people; the rest probably have nothing valuable to add.,stacking_deck
All experts agree on this — the ones who disagree aren’t real experts.,stacking_deck
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
All experts agree on this — the ones who disagree aren’t real experts.,stacking_deck
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
I enjoy painting as a interest.,non_argument
"Clearly, just fools would think differently.",stacking_deck
It’s important to include perspectives that challenge our assumptions.,healthy_argument
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
The critics who liked it say it's great — ignore the negative reviews.,stacking_deck
The traffic was terrible this morning.,non_argument
My dog loves to run around in the backyard.,non_argument
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
"Our product is the greatest, just ask our most loyal customers.",stacking_deck
You’ve just heard the good things because the bad stuff isn’t worth discussing.,stacking_deck
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
"Our product is the perfect, just ask our most loyal customers.",stacking_deck
It’s important to include perspectives that challenge our assumptions.,healthy_argument
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
All experts agree on this — the ones who disagree aren’t real experts.,stacking_deck
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
I'm planning to cook pasta for dinner tonight.,non_argument
I'm planning to cook pasta for dinner tonight.,non_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
"Everyone agrees that this is the perfect way to go, so we shouldn’t even consider alternatives.",stacking_deck
I went shopping last evening and bought a new shirt.,non_argument
I enjoy painting as a interest.,non_argument
I went shopping last evening and bought a new shirt.,non_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
"Everyone agrees that this is the top way to go, so we shouldn’t even consider alternatives.",stacking_deck
My dog loves to run around in the backyard.,non_argument
I went shopping last evening and bought a new shirt.,non_argument
You’ve just heard the good things because the bad stuff isn’t worth discussing.,stacking_deck
I enjoy painting as a interest.,non_argument
It’s important to include perspectives that challenge our assumptions.,healthy_argument
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
All experts agree on this — the ones who disagree aren’t real experts.,stacking_deck
I went shopping last evening and bought a new shirt.,non_argument
All experts agree on this — the ones who disagree aren’t real experts.,stacking_deck
My dog loves to run around in the backyard.,non_argument
I'm planning to cook pasta for dinner tonight.,non_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
My dog loves to run around in the backyard.,non_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
"While this method has worked well, other approaches should be weighed too.",healthy_argument
All experts agree on this — the ones who disagree aren’t real experts.,stacking_deck
All experts agree on this — the ones who disagree aren’t real experts.,stacking_deck
My dog loves to run around in the backyard.,non_argument
There’s a great movie playing at the cinema nearby.,non_argument
The traffic was terrible this morning.,non_argument
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
I'm planning to cook pasta for dinner tonight.,non_argument
I'm planning to cook pasta for dinner tonight.,non_argument
It’s important to include perspectives that challenge our assumptions.,healthy_argument
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
There’s a great movie playing at the cinema nearby.,non_argument
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
It’s important to include perspectives that challenge our assumptions.,healthy_argument
It’s important to include perspectives that challenge our assumptions.,healthy_argument
Let’s consider both the advantages and the disadvantages before making a decision.,healthy_argument
I'm planning to cook pasta for dinner tonight.,non_argument
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
All experts agree on this — the ones who disagree aren’t real experts.,stacking_deck
All experts agree on this — the ones who disagree aren’t real experts.,stacking_deck
You’ve just heard the good things because the bad stuff isn’t worth discussing.,stacking_deck
I'm planning to cook pasta for dinner tonight.,non_argument
My dog loves to run around in the backyard.,non_argument
The traffic was terrible this morning.,non_argument
I went shopping last evening and bought a new shirt.,non_argument
All experts agree on this — the ones who disagree aren’t real experts.,stacking_deck
"Everyone agrees that this is the greatest way to go, so we shouldn’t even consider alternatives.",stacking_deck
I enjoy painting as a interest.,non_argument
You’ve just heard the good things because the bad stuff isn’t worth discussing.,stacking_deck
The traffic was terrible this morning.,non_argument
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
It’s important to include perspectives that challenge our assumptions.,healthy_argument
"Clearly, just fools would think differently.",stacking_deck
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
I'm planning to cook pasta for dinner tonight.,non_argument
"Clearly, just fools would think differently.",stacking_deck
"Everyone agrees that this is the top way to go, so we shouldn’t even consider alternatives.",stacking_deck
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
It’s important to include perspectives that challenge our assumptions.,healthy_argument
Let’s just hear from the successful people; the rest probably have nothing valuable to add.,stacking_deck
"Our product is the top, just ask our most loyal customers.",stacking_deck
I enjoy painting as a interest.,non_argument
"Clearly, just fools would think differently.",stacking_deck
I'm planning to cook pasta for dinner tonight.,non_argument
"Clearly, just fools would think differently.",stacking_deck
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
There’s a great movie playing at the cinema nearby.,non_argument
All experts agree on this — the ones who disagree aren’t real experts.,stacking_deck
"While this method has worked well, other approaches should be weighed too.",healthy_argument
The critics who liked it say it's great — ignore the negative reviews.,stacking_deck
"Everyone agrees that this is the greatest way to go, so we shouldn’t even consider alternatives.",stacking_deck
I went shopping last evening and bought a new shirt.,non_argument
"Clearly, just fools would think differently.",stacking_deck
It’s important to include perspectives that challenge our assumptions.,healthy_argument
You’ve just heard the good things because the bad stuff isn’t worth discussing.,stacking_deck
"Everyone agrees that this is the perfect way to go, so we shouldn’t even consider alternatives.",stacking_deck
You’ve just heard the good things because the bad stuff isn’t worth discussing.,stacking_deck
I'm planning to cook pasta for dinner tonight.,non_argument
I went shopping last evening and bought a new shirt.,non_argument
"Clearly, only fools would think differently.",stacking_deck
It’s important to include perspectives that challenge our assumptions.,healthy_argument
There’s a great movie playing at the cinema nearby.,non_argument
"Everyone agrees that this is the greatest way to go, so we shouldn’t even consider alternatives.",stacking_deck
The critics who liked it say it's great — ignore the negative reviews.,stacking_deck
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
"Everyone agrees that this is the greatest way to go, so we shouldn’t even consider alternatives.",stacking_deck
"Our product is the top, just ask our most loyal customers.",stacking_deck
I went shopping last evening and bought a new shirt.,non_argument
"While this method has worked well, other approaches should be weighed too.",healthy_argument
My dog loves to run around in the backyard.,non_argument
The critics who liked it say it's great — ignore the negative reviews.,stacking_deck
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
"Clearly, just fools would think differently.",stacking_deck
"While this method has worked well, other approaches should be weighed too.",healthy_argument
You’ve just heard the good things because the bad stuff isn’t worth discussing.,stacking_deck
"Our product is the perfect, just ask our most loyal customers.",stacking_deck
"While this method has worked well, other approaches should be weighed too.",healthy_argument
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
Let’s weigh both the advantages and the disadvantages before making a decision.,healthy_argument
"Clearly, just fools would think differently.",stacking_deck
"We should examine evidence from a range of perspectives, both for and against.",healthy_argument
"Our product is the best, just ask our most loyal customers.",stacking_deck
You’ve only heard the good things because the bad stuff isn’t worth discussing.,stacking_deck
"Everyone agrees that this is the top way to go, so we shouldn’t even consider alternatives.",stacking_deck
The traffic was terrible this morning.,non_argument
There’s a great movie playing at the cinema nearby.,non_argument
The facts all support my argument — just look at these hand-picked studies.,stacking_deck
Let’s just hear from the successful people; the rest probably have nothing valuable to add.,stacking_deck
The critics who liked it say it's great — ignore the negative reviews.,stacking_deck
My dog loves to run around in the backyard.,non_argument
"""

# Step 3: Map label strings to booleans (True = stacking_deck, False = others).
# Booleans are used instead of 1/0 so the DataFrame column type matches the
# BOOLEAN `label` column of logical_fallacy_data.stacking_deck without relying
# on an implicit integer-to-boolean cast at insert time.
label_map = {
    "stacking_deck": True,
    "healthy_argument": False,
    "non_argument": False,
}

# Step 4: Parse the CSV text into a list of (text, label) tuples.
# csv.reader handles the quoted fields that contain commas. Blank lines are
# skipped, a row with the wrong number of fields raises a descriptive error,
# and rows whose label is not in label_map (which includes the "text,label"
# header row) are dropped, as before.
data = []
for row in csv.reader(StringIO(raw_data.strip())):
    if not row:
        continue
    if len(row) != 2:
        raise ValueError(
            f"Expected 2 CSV fields (text,label), got {len(row)}: {row!r}"
        )
    text, label = (field.strip() for field in row)
    if label in label_map:
        data.append((text, label_map[label]))

# Step 5: Create a Spark DataFrame with an explicit schema (this also works
# when `data` is empty, where schema inference would fail).
df = spark.createDataFrame(data, "text STRING, label BOOLEAN")

# Step 6: Append the rows to the existing table (overwrite=False keeps prior rows)
df.write.insertInto("logical_fallacy_data.stacking_deck", overwrite=False)


In [0]:
%sql
-- Remove duplicate rows from logical_fallacy_data.stacking_deck by rebuilding
-- the table from SELECT DISTINCT.
--
-- The staging table is created inside logical_fallacy_data (not the current
-- schema) because ALTER TABLE ... RENAME TO only renames within one schema;
-- with an unqualified staging name the rename could fail after the original
-- table had already been dropped.
DROP TABLE IF EXISTS logical_fallacy_data.stacking_new;
CREATE TABLE logical_fallacy_data.stacking_new AS
SELECT DISTINCT *
FROM logical_fallacy_data.stacking_deck;

-- Drop the original only after the de-duplicated copy exists.
DROP TABLE logical_fallacy_data.stacking_deck;

ALTER TABLE logical_fallacy_data.stacking_new
RENAME TO logical_fallacy_data.stacking_deck;

-- Re-grant access on the rebuilt table
-- (NOTE(review): presumably grants on the dropped table do not carry over; confirm).
GRANT ALL PRIVILEGES ON TABLE logical_fallacy_data.stacking_deck TO `ryabumoto1655@sdsu.edu`;

# populate ad-hominem data

In [0]:
from pyspark.sql import SparkSession

# Start (or reuse) a Spark session with Hive support enabled.
# The application name identifies this cell's job: loading ad hominem data.
spark = (
    SparkSession.builder
    .appName("Insert Synthetic Ad Hominem Data")
    .enableHiveSupport()
    .getOrCreate()
)

# Synthetic ad hominem fallacy examples (the positive class for the
# logical_fallacy_data.ad_hominem table). Each sentence dismisses a claim by
# attacking the speaker rather than addressing the argument.
synthetic_examples = [
    "You don't know anything about politics, you're just a student.", 
    "That's a ridiculous statement, you're too young to understand.",
    "Your argument is invalid because you're just a dumb person.",
    "You don’t have the expertise to be making these kinds of claims.",
    "What do you know about this? You’re just a student with no real experience.",
    "You're too young to understand the complexities of this topic.",
    "You're just an idealist; you don’t know how the world really works.",
    "You can’t possibly know anything about this; you’ve never worked a real job.",
    "You're just upset because things aren't going your way.",
    "You wouldn’t understand; you’re just a part-time worker.",
    "You're too inexperienced to have a valid opinion on this.",
    "You’re just repeating what everyone else says; you don’t think for yourself.",
    "How can you argue with me? You’ve never been in this field.",
    "What do you know about this? You’ve never even had a leadership role.",
    "You can't possibly understand, you're just a teenager with no experience.",
    "You're too emotional to be taken seriously on this matter.",
    "You can’t contribute to this conversation; you're just a beginner.",
    "You don’t have enough life experience to understand what's really going on.",
    "You're just a fan of that person; your opinion is biased.",
    "You can’t speak with authority because you're not qualified.",
    "How could you possibly know? You haven’t even been through a real struggle.",
    "You're too inexperienced to be discussing this seriously.",
    "You don’t know what you’re talking about; you’ve never been in my shoes.",
    "You’re just a blogger; your opinion doesn’t count.",
    "You're too young to see the big picture.",
    "You’re just a dreamer, not a realist.",
    "What do you know? You’ve never held a real job.",
    "You're just saying that because you haven’t lived long enough."
]

# Synthetic healthy (non-fallacious) arguments. These disagree or qualify a
# point while engaging with the reasoning; they are later merged into the
# negative class together with synthetic_non_arguments.
synthetic_healthy_arguments = [
    "I understand your point, but I think the data shows something different.",
    "I see where you're coming from, but let's look at the facts before we make a decision.",
    "While I respect your perspective, I think we need to consider a wider range of views on this.",
    "That's an interesting point, but I believe the evidence suggests otherwise.",
    "I disagree with your conclusion, but let's explore the underlying reasoning together.",
    "I hear you, but from my experience, I believe the situation is more complex.",
    "I understand your concerns, and I think it’s important we weigh the pros and cons carefully.",
    "I appreciate your opinion, but I think it's crucial to also examine the long-term effects.",
    "You raise a valid point, but we also need to account for other factors in this situation.",
    "I think it’s important to keep an open mind, as there may be other perspectives to consider.",
    "I see what you’re saying, but have you thought about the potential downsides?",
    "I get that you’re frustrated, but let’s try to focus on finding a solution.",
    "I agree that this is an issue, but I think we should look at all sides before we act.",
    "I see your concerns, but I think we need to gather more information first.",
    "That’s a good point, but I think we need to look at this in a broader context.",
    "I understand your perspective, but the data we have doesn't fully support that view.",
    "You're right to be concerned, but I think there are other strategies we should also consider.",
    "I respect your opinion, but let’s take a closer look at the facts before making any conclusions.",
    "I agree that this could be an issue, but I think we need to address it in a more systematic way.",
    "I understand your viewpoint, but I think we need to evaluate the situation more thoroughly.",
    "I appreciate your viewpoint, but let’s also consider the other possible outcomes.",
    "I see your point, but we need to factor in other variables that might affect the outcome.",
    "I understand your frustration, but let’s focus on finding a constructive solution.",
    "I see where you're coming from, but I think it's important to keep the bigger picture in mind.",
    "I understand the concern, but I think we need to approach this more methodically.",
    "I respect your perspective, but I think we need to question our assumptions here.",
    "That’s a valid argument, but we also need to look at the data from multiple angles.",
    "I agree with your sentiment, but I think it’s essential to test this hypothesis before making a decision.",
    "I see your point, but I think we should gather more evidence before drawing conclusions.",
    "I agree that there is an issue, but I think we need to identify the root cause first.",
    "You make a good argument, but I think we should consider how this will affect the long term.",
    "I agree with you on some aspects, but we should also factor in other variables.",
    "I see the merit in your argument, but I believe the situation is more nuanced than that.",
    "I understand the concern, but perhaps a different approach might be more effective.",
    "I see your point, but I think it's important to focus on solutions rather than dwelling on the problem.",
    "I respect your opinion, but I think it’s important to consider the broader implications.",
    "I agree that change is necessary, but we need to look at sustainable options.",
    "That’s a good idea, but I think it’s important to balance that with other priorities.",
    "I understand your frustration, but I think we need to take a step back and look at the bigger picture.",
    "I appreciate your thoughts, but I believe we need to focus on actionable steps.",
    "You bring up a valid concern, but let’s also think about the long-term benefits of this decision.",
    "I see the logic behind your argument, but let’s take a more balanced approach.",
    "I agree with you on several points, but I think it’s important to consider other options as well.",
    "That’s a compelling argument, but I think we should explore other alternatives.",
    "I understand your point of view, but I believe we need to look at the evidence before moving forward.",
    "I agree that something needs to change, but I think we need a plan that addresses all the underlying issues.",
    "You have a strong argument, but I think we should be cautious about the potential risks.",
    "I agree that this is a pressing issue, but let's also consider the potential consequences of this action.",
    "I understand your reasoning, but I think it’s important to consider the different perspectives involved.",
    "I respect your opinion, but I believe we need to dig deeper into the facts before making a final decision."
]

# Synthetic neutral statements that make no argument at all. They are later
# merged into the negative class together with synthetic_healthy_arguments.
synthetic_non_arguments = [
    "The weather today is very nice, with clear skies and a mild breeze.",
    "I enjoy listening to music in my free time.",
    "There’s a coffee shop near my house that I go to every weekend.",
    "I recently started reading a new book that seems really interesting.",
    "My favorite season of the year is autumn because of the colors of the leaves.",
    "I think I'll have pasta for dinner tonight.",
    "I like to go for walks in the park to relax.",
    "I noticed that the flowers in my garden are blooming beautifully this spring.",
    "I love watching documentaries on wildlife.",
    "My friend just adopted a dog, and it’s so cute."
]

# Combine neutral statements and healthy arguments into the negative class
synthetic_non_examples = synthetic_non_arguments + synthetic_healthy_arguments

# Construct the final labeled dataset as (text, label) tuples.
# The target column `label` is declared BOOLEAN, so real booleans are written
# (True = ad hominem, False = everything else) instead of 1/0 integers that
# would rely on an implicit cast at insert time.
examples = [(text, True) for text in synthetic_examples]
examples += [(text, False) for text in synthetic_non_examples]

# Create Spark DataFrame
df = spark.createDataFrame(examples, ["text", "label"])

# Append to the existing table (overwrite=False keeps the current rows)
df.write.insertInto("logical_fallacy_data.ad_hominem", overwrite=False)


In [0]:
%sql
-- Deduplicate logical_fallacy_data.ad_hominem by rebuilding it from SELECT DISTINCT.
-- The staging table lives in the same schema as the target, so the final RENAME
-- stays within one schema and does not depend on the session's current schema.
DROP TABLE IF EXISTS logical_fallacy_data.ad_hominem_new;
CREATE TABLE logical_fallacy_data.ad_hominem_new AS SELECT DISTINCT *
FROM logical_fallacy_data.ad_hominem;

-- NOTE: the target table does not exist between this DROP and the RENAME below.
DROP TABLE logical_fallacy_data.ad_hominem;

ALTER TABLE logical_fallacy_data.ad_hominem_new
RENAME TO logical_fallacy_data.ad_hominem;

-- Re-issue the grant on the rebuilt table (presumably the DROP discards the earlier grant).
GRANT ALL PRIVILEGES ON TABLE logical_fallacy_data.ad_hominem TO `ryabumoto1655@sdsu.edu`;