Feat: Final changes to prompt

2025-10-22 16:44:01 -03:00
parent f2df55f0f9
commit 42f9d22c77
32 changed files with 1122 additions and 1607 deletions
--- a/agent/Dockerfile
+++ b/agent/Dockerfile
@@ -7,7 +7,7 @@ COPY requirements.txt ${LAMBDA_TASK_ROOT}
 RUN pip install -r requirements.txt

 # Copy function code
-COPY agent.py ${LAMBDA_TASK_ROOT}
+COPY ./ ${LAMBDA_TASK_ROOT}

 # Set the CMD to your handler (could also be done as a parameter override outside of the Dockerfile)
-CMD ["agent.hello" ]
+CMD ["agent.agent_call"]
--- a/agent/agent.py
+++ b/agent/agent.py
@@ -1,37 +1,22 @@
 import json
-from langchain_core.tools import tool
-from langchain.agents.output_parsers import ReActJsonSingleInputOutputParser
-from langchain_core.prompts import ChatPromptTemplate,MessagesPlaceholder, PromptTemplate
-from langchain_core.messages import HumanMessage,AIMessage
-from langchain_core.tools import render_text_description
-from langchain.chains import create_history_aware_retriever
-from langchain.chains.combine_documents import create_stuff_documents_chain
-import langchain.chains
-from langchain.chains import create_history_aware_retriever
-from langchain.chains.combine_documents import create_stuff_documents_chain
-from langchain.agents.format_scratchpad import format_log_to_str
-from langchain.chains import create_retrieval_chain
 from langchain_aws import ChatBedrock
 from langchain_aws.retrievers import AmazonKnowledgeBasesRetriever
-from langchain.chains import ConversationalRetrievalChain
-from typing import Union
-from langchain_core.agents import AgentAction, AgentFinish
-from langchain.agents.output_parsers import ReActSingleInputOutputParser
-from langchain.tools import Tool
 from langgraph.checkpoint.memory import MemorySaver
 from langgraph.prebuilt import create_react_agent
 import os
-
-def find_tool_by_name(tools: list[Tool],tool_name:str):
-    for tool in tools:
-        if tool.name==tool_name:
-            print(tool.name)
-            print("\n\n")
-            return tool
-    raise ValueError(f"Tool with name {tool_name} not found")
-def hello(event,context):
+from langfuse import Langfuse
+from langfuse.langchain import CallbackHandler
+from tools import secrets,dynamo
+import time
+langfuse = Langfuse(
+    public_key=json.loads(secrets.get_secret())['api-langfuse-public'],
+    secret_key=json.loads(secrets.get_secret())['api-langfuse-secret'],
+    host="http://107.20.48.139:3000"
+)
+langfuse_handler = CallbackHandler()
+def agent_call(event,context):
    llm = ChatBedrock(
-    model_id="arn:aws:bedrock:us-east-1:654654422992:application-inference-profile/glvyppv11ds5",
+    model_id="us.anthropic.claude-sonnet-4-20250514-v1:0",
    region_name="us-east-1",
    #aws_access_key_id=os.environ["AWS_ACCESS_KEY_ID"],
    #aws_secret_access_key=os.environ["AWS_SECRET_ACCESS_KEY"],
@@ -45,6 +30,10 @@ def hello(event,context):
    retrieval_config={"vectorSearchConfiguration": {"numberOfResults": 4}},

 )
+    if event['chat_history']==[]:
+        history=dynamo.read_memory(event['username'])
+    else:
+        history=event['chat_history']
    memory = MemorySaver()
    model = llm
    tools = [retriever.as_tool()]
@@ -53,18 +42,47 @@ def hello(event,context):
    Act like a human in Portuguese Brasil.
    You are a assistant for students from diferent school campuses of the Instituto Federal de São Paulo.
    Your objective is to answer diferent questions about editais de bolsas, which can be acessed by the AmazonKnowledgeBaseRetriever tool.
-    The editais change based on the student's campus, if he is a superior or médio student, and if he is already receiving any bolsa or not. Get these informations from the user, only prompting one per message to the user, before ansewering any questions.
+    The editais change based on the student's campus, if he is a superior or médio student, and if he is already receiving any type of "Bolsa PAP", not including "Iniciação Cientifica" or "bolsa de extensão" . Get these informations from the user, only prompting one per message to the user, before ansewering any questions.
+    The criteria for every type of "bolsa" is different, look at the editals to check. Been a student, who doesnt have a bolsa for any campi is not enough for any bolsa, so check for the extra conditions.
    Retrieve the answer from the most recent edital that contemplates this type of student.
    The chat history will be given, without the previous retrieved editais info.
    If there are info or context missing ask the user before proceding with the document retrie
    Also return the title of the source document, with edital number and year, not the file name.val.
-    Document with MTO are from "Campus Matão" and SPO from "Campus São Paulo".
+    Document with MTO are from "Campus Matão", SPO from "Campus São Paulo" and CBT from "Campus Cubatão".
+    If you are prompted after a campus that is not Matão, São Paulo or Cubatão, answer that you can only work with one of these.
    Don't get information from diferent campus under no circunstance.
    You cant evaluate if someone can receive a bolsa, only get the info from docs and send them to the procedure in the document.
+    If the prompt is too generic like or too short, like "sim" or "quero bolsa",  ask for more context before retrieving from the documents.
+    If the user prompt you about wanting to get or to know more about a bolsa pap, ask wich of them (saúde,moradia,transporte,creche didático-pedagócio) they want to know more.
    <\rules>
    <glossary>
    "não registrado" means trabalhador informal.
+    "banco inter" means "banco intermedium", if a user asks about inter, include in the answer this info.
    <\glossary>
+    <chain_of_thought>
+    Use these questions as examples:
+    Quando a minha bolsa vai cair?
+    Resposta: Devido a complexidade da estrtura em volta do pagamento das bolsas, não existe um dia fixo, ele tende a variar dependendo do mês.
+
+    Não tenho conta bancária em meu nome, pode ser no nome do meu responsável?
+    Resposta: Não! A conta deve ser aberta no nome do estudante e pode ser em bancos digitais sem que seja necessário sair de casa, fazendo tudo pela internet!
+    
+    Posso enviar a Documentação solicitada no Edital por e-mail?
+    Resposta: Não! Documentos enviados por e-mail não serão considerados para análise.
+    
+    A comprovação de renda deve ser referente ao qual mês?
+    Resposta: agosto que é o mês mais recente em relação a inscrição.
+
+    Não tenho a Carteira de Trabalho impressa. Serve a digital?
+    Resposta: Sim!
+    
+    Na carteira de trabalho consta o salário. Ela substitui o contracheque?
+    Resposta: Não, pois somente no contracheque encontramos o valor da renda BRUTA.
+    
+    Trabalhador informal e trabalhador autônomo são sinônimos?
+    Resposta: Não! Trabalhadores informais são os que trabalham por conta própria, NÃO tem CNPJ e geralmente não pagam o carnê do INSS, não tendo nenhum direito trabalhista. Diferente deste, o profissional autônomo geralmente é especializado em algum segmento do mercado e atua por conta própria, geralmente sendo MEI – Micro Empreendedores Individuais e tendo CNPJ.
+
+    <\chain_of_thought>
    <general_info>
    Tipos de bolsa:
    Auxílio Alimentação: É um auxílio financeiro que tem por objetivo garantir e disponibilizar condições de que o estudante usufrua de ao menos uma refeição por dia. É pago mensalmente, e caso o aluno não frequente as aulas todos os dias ele poderá ser oferecido de forma parcial, calculado pela quantidade de dias que o aluno frequenta a aula. 
@@ -99,13 +117,16 @@ Answer the following questions as best you can. You have access to the following

 {tools}

-Chat History:"""+str(event["chat_history"])
+Chat History:"""+str(history)

    agent_executor = create_react_agent(model, tools, checkpointer=memory, prompt=prompt)
-    config = {"configurable": {"thread_id": "abc123"}}
+    config = {"configurable": {"thread_id": "abc123"},"callbacks": [langfuse_handler]}
    input_message = event["message"]
-    #input_message=[{"role":"user","content":"aluno superior, nunca recebi auxilio, campus são paulo, Meu pai não é registrado, como faço para ganhar auxilio?"}]
+    dict=input_message[0]
    response=""
    for step in agent_executor.stream({"messages": input_message}, config, stream_mode="values"):
        response={"json":(step["messages"][-1].text())}
+    response['dynamo_reponse']=dynamo.write_memory(event['username'],int(time.time()),dict['role'],dict['content'])
+    #response['chat_history']=history
+    response['chat_history']=[]
    return (response)
--- a/agent/conversational_rag.py
+++ b/agent/conversational_rag.py
@@ -1,74 +0,0 @@
-import boto3
-from langchain_core.prompts import ChatPromptTemplate,MessagesPlaceholder
-from langchain_core.messages import HumanMessage,AIMessage
-from langchain.chains import create_history_aware_retriever
-from langchain.chains.combine_documents import create_stuff_documents_chain
-import langchain.chains
-from langchain.chains import create_retrieval_chain
-from langchain_aws import ChatBedrock
-from langchain_aws.retrievers import AmazonKnowledgeBasesRetriever
-from langchain.chains import ConversationalRetrievalChain
-from dotenv import load_dotenv
-load_dotenv()
-import os
-llm = ChatBedrock(
-    model_id="arn:aws:bedrock:us-east-1:654654422992:application-inference-profile/d9blf0g3fzqz",
-    region_name="us-east-1",
-    aws_access_key_id=os.environ["AWS_ACCESS_KEY_ID"],
-    aws_secret_access_key=os.environ["AWS_SECRET_ACCESS_KEY"],
-    aws_session_token=os.environ["AWS_SESSION_TOKEN"],
-    model_kwargs={"temperature": 0.2, 'max_tokens': 1000,},
-    provider='anthropic'
-)
-# Cria o prompt de busca
-prompt_search_query = ChatPromptTemplate.from_messages([
-    MessagesPlaceholder(variable_name="chat_history"),
-    ("user", "{input}"),
-    ("assistant", "-"),
-    ("user", "Given the above conversation, generate a search query to look up to get information relevant to the conversation")
-])
-
-# Cria o prompt de resposta
-prompt_get_answer = ChatPromptTemplate.from_messages([
-    ("system", "Answer the user's questions based on the below context:\n\n{context}"),
-    MessagesPlaceholder(variable_name="chat_history"),
-    ("user", "{input}")
-])
-
-# Conecta ao Qdrant
-retriever = AmazonKnowledgeBasesRetriever(
-    knowledge_base_id="RBD9TI5HYU",
-    region_name="us-east-1",
-    retrieval_config={"vectorSearchConfiguration": {"numberOfResults": 4}},
-    
-)
-# Cria o retriever com histórico
-retriever_chain = create_history_aware_retriever(llm, retriever, prompt_search_query)
-
-# Cria o documento chain
-document_chain = create_stuff_documents_chain(llm, prompt_get_answer)
-
-# Cria o retrieval chain
-retrieval_chain= create_retrieval_chain(
-    retriever_chain,document_chain
-)
-
-def chat_with_bot(user_input, chat_history):
-    """
-    Função para interagir com o chatbot.
-
-    Args:
-        user_input (str): A entrada do usuário.
-        chat_history (list): O histórico da conversa, incluindo mensagens do usuário e do assistente.
-
-    Returns:
-        str: A resposta do chatbot.
-    """
-    # Chama o chain de recuperação com o histórico e a entrada do usuário
-    response = retrieval_chain.invoke({
-        "chat_history": chat_history,
-        "input": user_input,
-    })
-    # Retorna a resposta do assistente
-    return response['answer']
-print(chat_with_bot("Quanto é o auxilio?",chat_history=[{"role":"user","content":"Hello"}]))
--- a/agent/poetry.lock
+++ b/agent/poetry.lock
--- a/agent/pyproject.toml
+++ b/agent/pyproject.toml
@@ -1,20 +0,0 @@
-[tool.poetry]
-name = "agent"
-version = "0.1.0"
-description = "Agente edital IFSP"
-authors = ["Lucas DNX"]
-readme = "README.md"
-
-[tool.poetry.dependencies]
-python = "^3.12"
-langchain-core = "^0.3.75"
-langchain = "^0.3.27"
-boto3 = "^1.40.19"
-langchain-aws = "^0.2.31"
-dotenv = "^0.9.9"
-langgraph = "^0.6.7"
-
-
-[build-system]
-requires = ["poetry-core"]
-build-backend = "poetry.core.masonry.api"
--- a/agent/requirements.txt
+++ b/agent/requirements.txt
@@ -2,4 +2,5 @@ langchain_core
 langchain
 langchain_aws
 langgraph
-
+langfuse
+boto3
--- a/agent/tools/dynamo.py
+++ b/agent/tools/dynamo.py
@@ -0,0 +1,41 @@
+import boto3
+def write_memory(user,timestamp,role,content):
+    dynamodb = boto3.resource('dynamodb')
+
+    table = dynamodb.Table('br-edu-ifsp-ifsp-ret-memoria-tabela-chatbot-editais-dev') # Replace 'YourTableName' with your actual table name
+
+    item_data = {
+        'UserId': user,  # Replace with your partition key attribute and value
+        'Timestamp': timestamp,      # Replace with your sort key attribute and value (if applicable)
+        'role': role,
+        'content': content
+    }
+
+    try:
+        response = table.put_item(Item=item_data)
+        return response
+    except Exception as e:
+        return "Error adding item:"+str(e)
+def read_memory(userid):
+    dynamodb = boto3.resource('dynamodb')
+    table = dynamodb.Table('br-edu-ifsp-ifsp-ret-memoria-tabela-chatbot-editais-dev')
+
+    # Query parameters
+
+    try:
+        response = table.query(
+            KeyConditionExpression=boto3.dynamodb.conditions.Key('UserId').eq(userid),
+            ScanIndexForward=False,  # Descending order
+            Limit=30  # Get only the latest item
+        )
+        
+        items = response.get('Items', [])
+        if items:
+            latest_items = items
+            return latest_items
+        else:
+            return []
+
+    except Exception as e:
+        print("Error querying DynamoDB:", str(e))
+
--- a/agent/tools/secrets.py
+++ b/agent/tools/secrets.py
@@ -0,0 +1,25 @@
+import boto3
+from botocore.exceptions import ClientError
+def get_secret():
+
+    secret_name = "dev/chatboteditais/apigateway/apikey"
+    region_name = "us-east-1"
+
+    # Create a Secrets Manager client
+    session = boto3.session.Session()
+    client = session.client(
+        service_name='secretsmanager',
+        region_name=region_name
+    )
+
+    try:
+        get_secret_value_response = client.get_secret_value(
+            SecretId=secret_name
+        )
+    except ClientError as e:
+        # For a list of exceptions thrown, see
+        # https://docs.aws.amazon.com/secretsmanager/latest/apireference/API_GetSecretValue.html
+        raise e
+
+    secret = get_secret_value_response['SecretString']
+    return secret