In [13]:
import sqlite3
import pandas as pd

# Build (or extend) the `courses` table in a SQLite file from the generated CSV.
#
# NOTE: the table is created with IF NOT EXISTS and rows are always inserted,
# so re-running this cell against an existing database file appends the CSV
# rows again (with new autoincrement ids).
sqlite_db_path = './source/data/courses_gen.db'
df = pd.read_csv('./source/data/generate_preprocessing_table.csv', encoding='utf-8')

# Table schema; `id` is assigned by SQLite, every other column comes from the CSV.
create_table_query = """
CREATE TABLE IF NOT EXISTS courses (
    id INTEGER PRIMARY KEY AUTOINCREMENT,
    department_major TEXT,
    course_number TEXT,
    section_number INTEGER,
    course_name TEXT,
    lecture_language TEXT,
    course_classification TEXT,
    elective_area TEXT,
    credits_theory_practice TEXT,
    year_semester INTEGER,
    target_course TEXT,
    course_summary TEXT,
    syllabus TEXT,
    main_department TEXT,
    professor_name TEXT,
    day_time TEXT,
    classroom TEXT,
    online_course TEXT,
    credits INTEGER,
    course_description TEXT
);
"""

# (SQL column, CSV header) pairs, in insertion order. Keeping both names side by
# side guarantees the placeholder count and the value order cannot drift apart.
column_map = [
    ('department_major', '개설학과전공'),
    ('course_number', '학수번호'),
    ('section_number', '분반'),
    ('course_name', '교과목명'),
    ('lecture_language', '강의언어'),
    ('course_classification', '이수구분'),
    ('elective_area', '선택영역'),
    ('credits_theory_practice', '학점/이론/실습'),
    ('year_semester', '학년(학기)'),
    ('target_course', '대상과정'),
    ('course_summary', '교과목개요'),
    ('syllabus', '수업계획서'),
    ('main_department', '주관학과'),
    ('professor_name', '교수명'),
    ('day_time', '요일 및 강의시간'),
    ('classroom', '강의실'),
    ('online_course', '사이버강좌'),
    ('credits', '학점'),
    ('course_description', '교과목설명'),
]
sql_columns = [sql_name for sql_name, csv_name in column_map]
csv_columns = [csv_name for sql_name, csv_name in column_map]

# The column names above are hard-coded constants (not user input), so it is
# safe to format them into the statement; the row values stay parameterized.
insert_query = "INSERT INTO courses ({}) VALUES ({})".format(
    ', '.join(sql_columns),
    ', '.join('?' for _name in sql_columns),
)

# Selecting the columns up front raises KeyError for a missing CSV header
# before the database is touched.
course_rows = df[csv_columns].itertuples(index=False, name=None)

# Connect to SQLite database (it will create the file if it doesn't exist)
conn = sqlite3.connect(sqlite_db_path)
try:
    cursor = conn.cursor()

    cursor.execute(create_table_query)
    conn.commit()

    # Insert every CSV row in one batch instead of one execute() per row.
    cursor.executemany(insert_query, course_rows)
    conn.commit()
finally:
    # Always release the file handle, even if the insert fails part-way;
    # uncommitted rows are discarded when the connection closes.
    conn.close()

# Return the path to the created SQLite database
sqlite_db_path


'./source/data/courses_gen.db'

In [1]:
import sqlite3
import pandas as pd
# Load the preprocessed course table that the following cells inspect.
df = pd.read_csv(
    './source/data/preprocessing_table.csv',
    encoding='utf-8',
)


In [9]:
# Distinct course names, in order of first appearance in the table.
df['교과목명'].unique().tolist()

['서.복합매체기법',
 '멀티미디어와회화2',
 '미술교과교재연구및지도법',
 '미술논리및논술',
 '현대산수연구',
 '판화',
 '서.종합실기2',
 '한.종합실기2',
 '서.종합실기4',
 '한.종합실기4']

In [None]:
from langchain.llms import OpenAI
from langchain.chains import LLMChain
from langchain.prompts import PromptTemplate

# Prompt asking for a short description of a single course, filled in by name.
prompt = PromptTemplate(
    template="Provide a brief 3-line description for the course: {course_name}.",
    input_variables=["course_name"],
)

# NOTE(review): "gpt-3.5-turbo" is a chat model; depending on the installed
# langchain version the completion-style `OpenAI` wrapper may reject it and a
# chat model class may be required instead — confirm before running this cell.
llm = OpenAI(model="gpt-3.5-turbo")

# Chain that renders the prompt and sends it to the model.
chain = LLMChain(prompt=prompt, llm=llm)
def generate_description(course_name):
    """Return the description text the chain produces for one course.

    Args:
        course_name: Course title substituted into the prompt's
            ``{course_name}`` placeholder.

    Returns:
        Whatever ``chain.run`` returns for that course name.
    """
    return chain.run(course_name)