Import necessary packages

In [35]:
from langchain_core.prompts import ChatPromptTemplate, FewShotChatMessagePromptTemplate, MessagesPlaceholder, PromptTemplate
from langchain_openai import ChatOpenAI
from langchain_google_vertexai import ChatVertexAI
from langchain_anthropic import ChatAnthropic
from pathlib import Path
from langchain_core.output_parsers import StrOutputParser
from langchain.output_parsers import PydanticToolsParser, PydanticOutputParser
from langchain_core.pydantic_v1 import BaseModel, Field, validator
from langchain_core.messages import AIMessage, BaseMessage, HumanMessage
from typing import Sequence, List
from langgraph.graph import MessageGraph, END
from langchain_community.document_loaders import DirectoryLoader
from langchain_community.vectorstores import FAISS
from langchain_text_splitters import CharacterTextSplitter
from langchain_openai import OpenAIEmbeddings
from langchain_core.runnables import RunnablePassthrough
import json
import nest_asyncio
nest_asyncio.apply()


#function to call a path to the file and read it. 
def context_gen(file_name):
    Folder = "Context_files"
    here = Path(locals().get('__file__', Folder)).resolve()
    parameter = (here / file_name).read_text()
    return parameter

#remove code fences from the output
def remove_code_fences(text):
    lines = text.split("\n")
    lines = [line for line in lines if not line.strip().startswith('```')]
    lines[0] = lines[0].replace(' -', '-', 1)
    print()
    return "\n".join(lines)

#create inputs to the model, telling it what needs to be done. 
#provides system message
system1 = context_gen("system1.txt")

#provides the few shot examples
output_examples = context_gen("outputex.txt")

#provides the input examples
input_examples = context_gen("inputex.txt")

#provides the database schema
schema = context_gen("dataBaseSchema.txt")

refsystem = context_gen("ref_system copy.txt")

system3 = context_gen("system3.txt")

system2 = context_gen("system2.txt")

rag_prompt = context_gen("rag_prompt.txt")


#First input to the model, breaks query down and provides geometry definition

class analyzed_query(BaseModel):
    """Identifying whether a geometric feature is present in the database and stating the name of the feature"""
    answer: str= Field(description="YES or NO")
    features: List= Field(description="Name of the identified geometrical feature (Singular)")

class Response(BaseModel):
    """Listing the answer of whether the feature is present in the database and the name of the feature"""
    Response: List[analyzed_query]
    

chat_openai = ChatOpenAI(model="gpt-3.5-turbo", temperature=0.0)
chat_google = ChatVertexAI(model_name="gemini-1.0-pro", temperature=0.0, convert_system_message_to_ai=True)
chat_claude = ChatAnthropic(model_name = "claude-3-sonnet-20240229", temperature=0.0)
examples = [
    {"input": input_examples, "output": output_examples},
]

example_prompt = ChatPromptTemplate.from_messages([
    ("human", "{input}"),
    ("ai", "{output}"),
]
)

few_shot_prompt = FewShotChatMessagePromptTemplate(
    example_prompt=example_prompt,
    examples=examples,
)


In [33]:
'''change the human variable to test different inputs'''
human = ("select all leading edges")

def generate_yaml(human:str, chat):
    parser = PydanticOutputParser(pydantic_object=analyzed_query)
    prompt = ChatPromptTemplate.from_messages([("system", rag_prompt + "Answer the user query. Print the output in Json format according to the instructions.\n{format_instructions}",), ("human", human),]).partial(format_instructions=parser.get_format_instructions())
    chain = prompt | chat | parser
    feature_extractor = chain.invoke({})
    answer = feature_extractor.answer

    extracted_features = feature_extractor.features
    print(feature_extractor)
    print()
    loader = DirectoryLoader("RAG")
    raw_docs = loader.load()
    textsplitter = CharacterTextSplitter(chunk_size=2000, chunk_overlap=0)
    docs = textsplitter.split_documents(raw_docs)
    db = FAISS.from_documents(docs, OpenAIEmbeddings())
    retriever = db.as_retriever()
    

    prompt_for_rag = ChatPromptTemplate.from_template("""You are an assistant that is an expert at RAG (Retrieval Augmented Generation). You have been tasked with looking for the definition of the word provided to you as input and generate a summary of the available information."
                You will use only the context provided to you.                                 
                Context:{context}
                Query_to_db:{query}""")
    rag_chain = ({"context": retriever, "query": RunnablePassthrough()}) | prompt_for_rag | chat | StrOutputParser()
    #Base prompt chain, generates the first yaml version with minimal context

    base_prompt = ChatPromptTemplate.from_messages([("system", system1), few_shot_prompt, MessagesPlaceholder(variable_name="messages")])
    yaml_generator = base_prompt | chat 
    rag_output = rag_chain.invoke(f"What is the definition of {extracted_features}?")

    print(rag_output)
    print()

    def chain_yes():
        chain = yaml_generator | StrOutputParser()
        yaml = chain.invoke({"messages": [human]}, {"tags": ["chain_yes"]})
        print("RAG not required, generating YAML")
        print()
        print(yaml)
        print()
        return yaml

    def chain_no():
        chain = yaml_generator | StrOutputParser()
        ai = rag_output
        yaml = chain.invoke({"messages":[ai]}, {"tags": ["chain_no"]})
        print("Getting more information using RAG, then generating YAML")
        print()
        print(yaml)
        print()
        return yaml

    def decision_maker(response_obj: analyzed_query):
        for item in response_obj:
            if item == "YES":
                return chain_yes()
            elif item == "NO":
                return chain_no()

    model_output = []
    for answer in feature_extractor:
        model_output.append(decision_maker(answer))
    #This chain ise used for the reflection prompt, which asks the model to critique and improve on the generated YAML text.
    reflection_prompt = ChatPromptTemplate.from_messages([
            ("system", refsystem),
            ("user", rag_output),
            few_shot_prompt,
            MessagesPlaceholder(variable_name="messages")
    ])

    reflect = reflection_prompt | chat | StrOutputParser()
    message = str(f"This is the YAML code you are supposed to provide feedback for: {model_output[0]}." + f"The user query for which the yaml code provided is: \n{human}")
    feedback = reflect.invoke(
        {"messages": [message]}, {"tags": ["feedback"]})
    final_generate = base_prompt | chat | StrOutputParser()
    output_yaml = final_generate.invoke(
        {
            "messages": [
                f"I have some YAML code \n {model_output[0]}"
                + f"\nThis code needs to be regenerated (only if needed) with the following instructions in mind: \n{feedback}. \nThe YAML code generated needs to be for the following query: {human}"
            ]
        },
        {"tags": ["final_generate"]},
        )
    print(output_yaml)
    return

In [36]:
human = "Select all flanges in the model"
generate_yaml(human, chat_google)

answer='NO' features=['flanges']

## Definition of Flanges:

Based on the provided context, here's the definition of flanges:

**Flanges are planar surfaces with a relatively large area compared to neighboring surfaces.** They are typically used in conjunction with other components, such as pipes or beams, to provide a secure connection. 

Here are some key characteristics of flanges:

* **Large area:** Compared to neighboring surfaces, flanges have a significantly larger surface area. This allows them to distribute forces more evenly and provide a stronger connection.
* **Planar:** Flanges are flat surfaces, which makes them easy to machine and assemble.
* **Used for connections:** Flanges are often used to connect pipes, beams, and other components together. They can be bolted, welded, or glued in place.

Here are some additional details about flanges:

* **Identification in the faces table:** Flanges can be identified in the faces table by their large area and planar type.
* **SQL q

Retrying langchain_google_vertexai.chat_models._completion_with_retry.<locals>._completion_with_retry_inner in 4.0 seconds as it raised InvalidArgument: 400 Please ensure that multiturn requests alternate between user and model..
Retrying langchain_google_vertexai.chat_models._completion_with_retry.<locals>._completion_with_retry_inner in 4.0 seconds as it raised InvalidArgument: 400 Please ensure that multiturn requests alternate between user and model..
