Add Langfuse tracing (EC2 host and agent integration) and API-key authentication for /process

2026-02-26 13:34:45 -03:00
parent 5717cdd254
commit b7c0b92fa3
14 changed files with 487 additions and 41 deletions
--- a/code/app.py
+++ b/code/app.py
@@ -1,4 +1,5 @@
-from fastapi import FastAPI
+from fastapi import FastAPI, Security, HTTPException
 from fastapi.security import APIKeyHeader
 from pydantic import BaseModel
 import uvicorn
 import boto3
@@ -9,11 +10,28 @@ from pathlib import Path
 from urllib.parse import urlparse
 from PyPDF2 import PdfReader
 from datetime import datetime
 from utils.langgraph_agent import RULES, run_agent
 from utils.secrets_manager import SECRETS
 app = FastAPI()
 AWS_REGION = "us-east-2"
 INPUT_BUCKET="automated-pre-authorization"
 OUTPUT_BUCKET = "upflux-doc-analyzer"
 VERSION = "v1"
 # API Key auth
 _api_key_header = APIKeyHeader(name="X-API-Key")
 API_KEY = SECRETS["API-KEY"]
 AWS_ACCESS_KEY =SECRETS["AWS_ACCESS_KEY"]
 AWS_SECRET_KEY = SECRETS["AWS_SECRET_KEY"]
 def verify_api_key(api_key: str = Security(_api_key_header)):
    """Validate the ``X-API-Key`` request header against the configured key.

    Args:
        api_key: Header value resolved by FastAPI through ``_api_key_header``.

    Returns:
        The supplied key when it matches ``API_KEY``.

    Raises:
        HTTPException: With status 403 when the supplied key does not match.
    """
    # Function-scope import keeps this block self-contained.
    import hmac

    # Constant-time comparison so response timing does not reveal how much of
    # the key matched. Bytes are compared because compare_digest rejects str
    # arguments containing non-ASCII characters.
    supplied = api_key.encode("utf-8")
    expected = API_KEY.encode("utf-8")
    if not hmac.compare_digest(supplied, expected):
        raise HTTPException(status_code=403, detail="Invalid API key")
    return api_key
 # --- S3 / Textract helpers ---
@@ -29,7 +47,13 @@ def parse_s3_uri(s3_uri: str) -> tuple[str, str]:
    return bucket, key
-def get_s3_client():
+def get_s3_input_client():
    """S3 client with cross-account credentials for INPUT_BUCKET."""
    return boto3.client("s3",aws_access_key_id=AWS_ACCESS_KEY,aws_secret_access_key=AWS_SECRET_KEY,region_name=AWS_REGION)
 def get_s3_output_client():
    """Build the S3 client for OUTPUT_BUCKET, relying on the ECS task role."""
    service_name = "s3"
    output_client = boto3.client(service_name, region_name=AWS_REGION)
    return output_client
@@ -53,42 +77,66 @@ def extract_text_from_textract_response(response: dict) -> str:
    )
-def extract_text_from_s3_document(bucket: str, key: str) -> str:
+def extract_text_from_s3_document(bucket: str, key: str) -> tuple[str, int]:
-    s3 = get_s3_client()
+    """Returns (extracted_text, page_count)."""
    s3_input = get_s3_input_client()
    s3_output = get_s3_output_client()
    textract = get_textract_client()
    file_ext = Path(key).suffix.lower()
    # Download file bytes using cross-account S3 credentials
    obj = s3_input.get_object(Bucket=bucket, Key=key)
    file_bytes = obj["Body"].read()
    if file_ext in [".png", ".jpg", ".jpeg"]:
        # Pass bytes directly to Textract (avoids Textract needing cross-account S3 access)
        response = textract.detect_document_text(
-            Document={"S3Object": {"Bucket": bucket, "Name": key}}
+            Document={"Bytes": file_bytes}
        )
-        return extract_text_from_textract_response(response)
+        return extract_text_from_textract_response(response), 1
    if file_ext == ".pdf":
-        obj = s3.get_object(Bucket=bucket, Key=key)
+        page_count = get_pdf_page_count(file_bytes)
        pdf_bytes = obj["Body"].read()
        page_count = get_pdf_page_count(pdf_bytes)
        if page_count > 1:
            # Async API requires S3Object — copy to local bucket Textract can access
            temp_key = f"temp_textract/{Path(key).name}"
            s3_output.put_object(Bucket=OUTPUT_BUCKET, Key=temp_key, Body=file_bytes)
            response = textract.start_document_text_detection(
-                DocumentLocation={"S3Object": {"Bucket": bucket, "Name": key}}
+                DocumentLocation={"S3Object": {"Bucket": OUTPUT_BUCKET, "Name": temp_key}}
            )
            job_id = response["JobId"]
-            while True:
+            try:
-                result = textract.get_document_text_detection(JobId=job_id)
+                # Wait for job to complete
-                status = result["JobStatus"]
+                while True:
-                if status == "SUCCEEDED":
+                    result = textract.get_document_text_detection(JobId=job_id)
-                    return extract_text_from_textract_response(result)
+                    status = result["JobStatus"]
-                elif status == "FAILED":
+                    if status == "SUCCEEDED":
-                    return ""
+                        break
-                time.sleep(2)
+                    elif status == "FAILED":
-        else:
+                        return "", page_count
-            response = textract.detect_document_text(
+                    time.sleep(2)
                Document={"S3Object": {"Bucket": bucket, "Name": key}}
            )
            return extract_text_from_textract_response(response)
-    return ""
+                # Collect all blocks across paginated results
                all_blocks = result.get("Blocks", [])
                while "NextToken" in result:
                    result = textract.get_document_text_detection(
                        JobId=job_id, NextToken=result["NextToken"]
                    )
                    all_blocks.extend(result.get("Blocks", []))
                return extract_text_from_textract_response({"Blocks": all_blocks}), page_count
            finally:
                s3_output.delete_object(Bucket=OUTPUT_BUCKET, Key=temp_key)
        else:
            # Single-page PDF — pass bytes directly to sync API
            response = textract.detect_document_text(
                Document={"Bytes": file_bytes}
            )
            return extract_text_from_textract_response(response), page_count
    return "", 0
 # --- Guia processing ---
@@ -110,12 +158,14 @@ def process_guia(guia: dict) -> dict:
        try:
            bucket, key = parse_s3_uri(s3_uri)
-            extracted_text = extract_text_from_s3_document(bucket, key)
+            extracted_text, page_count = extract_text_from_s3_document(bucket, key)
        except Exception as e:
            print(f"  Error extracting text from {nome_arquivo}: {e}")
            extracted_text = ""
            page_count = 0
            anexo["error"] = str(e)
        anexo["textoExtraido"] = extracted_text
        anexo["pageCount"] = page_count
        all_extracted_texts.append(f"--- {nome_arquivo} ---\n{extracted_text}")
    file_content = "\n\n".join(all_extracted_texts)
@@ -146,15 +196,22 @@ def process_guia(guia: dict) -> dict:
        query = json.dumps(query_data, indent=2, ensure_ascii=False)
        try:
-            agent_output = run_agent(query, code, file_content)
+            result = run_agent(query, code, file_content)
            agent_output = result["response"]
            input_tokens = result["input_tokens"]
            output_tokens = result["output_tokens"]
        except Exception as e:
            print(f"  Agent error for servico {codigo_servico_raw}: {e}")
            agent_output = f"ERROR: {str(e)}"
            input_tokens = 0
            output_tokens = 0
        avaliacao_resultados.append({
            "codigoServico": codigo_servico_raw,
            "resultado": "Aprovado" if "aprov" in "".join(c for c in agent_output.lower() if c.isalnum() or c == ' ') else "Reprovado",
-            "agentOutput": agent_output
+            "agentOutput": agent_output,
            "input_tokens": input_tokens,
            "output_tokens": output_tokens,
        })
    guia["avaliacaoAgente"] = avaliacao_resultados
@@ -170,7 +227,7 @@ class ProcessRequest(BaseModel):
 # --- Endpoints ---
-@app.post("/process")
+@app.post("/process", dependencies=[Security(verify_api_key)])
 async def process(request: ProcessRequest):
    results = []
    for idx, guia in enumerate(request.guias):
@@ -183,12 +240,30 @@ async def process(request: ProcessRequest):
                "guia": guia.get("guia", {}).get("codigoGuiaLocal", f"index_{idx}")
            })
-    return {
+    response_body = {
        "status": "success",
        "operadora": request.operadora,
        "guias": results
    }
    # Save result to S3
    try:
        s3 = get_s3_output_client()
        timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
        for guia_result in results:
            numero_guia = guia_result.get("guia", {}).get("codigoGuiaLocal", "unknown")
            key = f"{VERSION}/{numero_guia}_{timestamp}.json"
            s3.put_object(
                Bucket=OUTPUT_BUCKET,
                Key=key,
                Body=json.dumps(guia_result, ensure_ascii=False),
                ContentType="application/json",
            )
    except Exception as e:
        print(f"Error saving to S3: {e}")
    return response_body
@app.get("/health")
 async def health():
--- a/code/requirements.txt
+++ b/code/requirements.txt
@@ -6,3 +6,4 @@ langchain
 PyPDF2
 pydantic
 boto3
 langfuse
--- a/code/utils/langgraph_agent.py
+++ b/code/utils/langgraph_agent.py
@@ -14,9 +14,21 @@ from langgraph.graph.message import add_messages
 from langchain_aws import ChatBedrock
 from langchain_core.messages import HumanMessage, AIMessage, ToolMessage, SystemMessage
 from langchain_core.tools import tool
 import os
 from langfuse import Langfuse
 from langfuse.langchain import CallbackHandler 
 from utils.secrets_manager import SECRETS
 CODE=""
 langfuse = Langfuse(
    secret_key=SECRETS["LANGFUSE-SECRET-KEY"],
    public_key=SECRETS["LANGFUSE-PUBLIC-KEY"],
    host=os.environ.get("LANGFUSE_HOST", ""),
 )
 # Base paths
 SCRIPTS_DIR = Path(__file__).parent
 JSON_OUTPUT_DIR = SCRIPTS_DIR / "json_output"
@@ -564,13 +576,26 @@ Start your answer with either:
    print("-" * 50)
    # Run the agent
-    final_state = agent.invoke(initial_state)
+    langfuse_handler = CallbackHandler()
    config = {"callbacks": [langfuse_handler]}
    final_state = agent.invoke(initial_state, config=config)
    # Get the final response
    final_message = final_state["messages"][-1]
    response = final_message.content if hasattr(final_message, "content") else str(final_message)
    # Count tokens from all AI messages
    input_tokens = 0
    output_tokens = 0
    for msg in final_state["messages"]:
        usage = getattr(msg, "usage_metadata", None)
        if usage:
            input_tokens += usage.get("input_tokens", 0)
            output_tokens += usage.get("output_tokens", 0)
    langfuse.flush()
    print(f"Agent: {response}")
-    return response
+    print(f"Tokens - input: {input_tokens}, output: {output_tokens}")
    return {"response": response, "input_tokens": input_tokens, "output_tokens": output_tokens}
--- a/code/utils/secrets_manager.py
+++ b/code/utils/secrets_manager.py
@@ -0,0 +1,6 @@
 import json
 import boto3
 # The application's secrets are fetched once, at import time: importing this
 # module performs a Secrets Manager call, and nothing here catches a failure,
 # so any error propagates to whichever module imported it.
 _client = boto3.client("secretsmanager", region_name="us-east-2")
 _response = _client.get_secret_value(SecretId="doc-analyzer")
 # SecretString is parsed as JSON; callers index SECRETS by key name.
 SECRETS: dict = json.loads(_response["SecretString"])
--- a/infra/ecs_alb/main.tf
+++ b/infra/ecs_alb/main.tf
@@ -202,13 +202,23 @@ resource "aws_iam_role_policy" "s3_policy" {
  policy = jsonencode({
    Version = "2012-10-17"
-    Statement = [{
+    Statement = [
-      Effect = "Allow"
+      {
-      Action = [
+        Effect = "Allow"
-        "s3:GetObject"
+        Action = [
-      ]
+          "s3:GetObject",
-      Resource = "arn:aws:s3:::upflux-doc-analyzer/*"
+          "s3:PutObject"
-    }]
+        ]
        Resource = "arn:aws:s3:::upflux-doc-analyzer/*"
      },
      {
        Effect = "Allow"
        Action = [
          "s3:DeleteObject"
        ]
        Resource = "arn:aws:s3:::upflux-doc-analyzer/temp_textract/*"
      }
    ]
  })
 }
@@ -229,6 +239,23 @@ resource "aws_iam_role_policy" "textract_policy" {
    }]
  })
 }
 # Lets the ECS task role read the application's secret from Secrets Manager.
 resource "aws_iam_role_policy" "secrets_manager_policy" {
  name = "${var.app_name}-secrets-manager-policy"
  role = aws_iam_role.ecs_task_role.id
  policy = jsonencode({
    Version = "2012-10-17"
    Statement = [{
      Effect = "Allow"
      Action = [
        "secretsmanager:GetSecretValue"
      ]
      # Least privilege: only the "doc-analyzer" secret in us-east-2, which is
      # the secret id and region the application code requests. Secrets
      # Manager appends a six-character random suffix to the secret name in
      # its ARN, hence the "-??????" pattern.
      # NOTE(review): assumes the secret lives in the same account as the
      # task role - confirm before applying.
      Resource = "arn:aws:secretsmanager:us-east-2:${data.aws_caller_identity.current.account_id}:secret:doc-analyzer-??????"
    }]
  })
 }
 # ECS Task Definition
 resource "aws_ecs_task_definition" "app" {
  family                   = var.app_name
@@ -242,6 +269,13 @@ resource "aws_ecs_task_definition" "app" {
    name  = var.app_name
    image = "${data.aws_caller_identity.current.account_id}.dkr.ecr.${var.aws_region}.amazonaws.com/${var.ecr_repository_name}:${var.image_tag}"
    environment = [
      {
        name  = "LANGFUSE_HOST"
        value = var.langfuse_host
      }
    ]
    portMappings = [{
      containerPort = 8000
      hostPort      = 8000
--- a/infra/ecs_alb/terraform.tfvars
+++ b/infra/ecs_alb/terraform.tfvars
@@ -21,3 +21,4 @@ image_tag           = "latest"
 fargate_cpu         = "256"
 fargate_memory      = "512"
 app_count           = 1
 langfuse_host       = "http://10.0.0.12:3000"
--- a/infra/ecs_alb/variables.tf
+++ b/infra/ecs_alb/variables.tf
@@ -54,3 +54,8 @@ variable "app_count" {
  type        = number
  default     = 1
 }
 variable "langfuse_host" {
  description = "Langfuse host URL"
  type        = string
 }
--- a/infra/langfuse-terraform/data.tf
+++ b/infra/langfuse-terraform/data.tf
@@ -0,0 +1,14 @@
 data "aws_ami" "ubuntu" {
  most_recent = true
  owners      = ["099720109477"] # Canonical
  filter {
    name   = "name"
    values = ["ubuntu/images/hvm-ssd/ubuntu-jammy-22.04-amd64-server-*"]
  }
  filter {
    name   = "virtualization-type"
    values = ["hvm"]
  }
 }
--- a/infra/langfuse-terraform/main.tf
+++ b/infra/langfuse-terraform/main.tf
@@ -0,0 +1,57 @@
 # ──────────────────────────────────────────────
 # Security Group
 # ──────────────────────────────────────────────
 # Security group attached to the Langfuse EC2 instance.
 resource "aws_security_group" "langfuse" {
  name        = var.sg_name
  description = "Allow defined ports for Langfuse"
  vpc_id      = var.vpc_id
  # One TCP ingress rule is generated per entry in var.allowed_ports; every
  # rule admits the same single source address.
  dynamic "ingress" {
    for_each = var.allowed_ports
    content {
      from_port   = ingress.value
      to_port     = ingress.value
      protocol    = "tcp"
      # NOTE(review): hard-coded source address. Traffic from any other
      # address, including private addresses inside the VPC, is not admitted
      # by these rules - confirm this is intended and consider a variable.
      cidr_blocks = ["3.14.44.224/32"]
    }
  }
  # Outbound traffic is unrestricted (all protocols, all destinations).
  egress {
    from_port   = 0
    to_port     = 0
    protocol    = "-1"
    cidr_blocks = ["0.0.0.0/0"]
  }
  tags = merge(var.tags, {
    Name = var.sg_name
  })
 }
 # ──────────────────────────────────────────────
 # EC2 Instance
 # ──────────────────────────────────────────────
 # EC2 instance that hosts Langfuse; provisioning happens in the rendered
 # user_data script.
 resource "aws_instance" "langfuse" {
  ami                         = data.aws_ami.ubuntu.id
  instance_type               = var.instance_type
  subnet_id                   = var.subnet_id
  vpc_security_group_ids      = [aws_security_group.langfuse.id]
  associate_public_ip_address = true
  # An empty key_name variable is passed as null, i.e. no key pair is set.
  key_name                    = var.key_name != "" ? var.key_name : null
  # The template receives exactly these three values; any other "$" syntax in
  # the template file is left for the shell.
  user_data = templatefile("${path.module}/user_data.sh.tftpl", {
    langfuse_repo_url = var.langfuse_repo_url
    langfuse_web_port = var.langfuse_web_port
    ebs_device_name   = var.ebs_device_name
  })
  root_block_device {
    volume_size           = var.root_volume_size
    volume_type           = var.root_volume_type
    delete_on_termination = true
  }
  tags = merge(var.tags, {
    Name = var.instance_name
  })
 }
--- a/infra/langfuse-terraform/outputs.tf
+++ b/infra/langfuse-terraform/outputs.tf
@@ -0,0 +1,9 @@
 output "instance_ip" {
  description = "Public IP of the Langfuse EC2 instance"
  value       = aws_instance.langfuse.public_ip
 }
 output "url" {
  description = "Langfuse web UI URL"
  value       = "http://${aws_instance.langfuse.public_ip}:${var.langfuse_web_port}"
 }
--- a/infra/langfuse-terraform/providers.tf
+++ b/infra/langfuse-terraform/providers.tf
@@ -0,0 +1,14 @@
 terraform {
  required_version = ">= 1.0"
  required_providers {
    aws = {
      source  = "hashicorp/aws"
      version = "~> 6.0"
    }
  }
 }
 provider "aws" {
  region = var.aws_region
 }
--- a/infra/langfuse-terraform/terraform.tfvars
+++ b/infra/langfuse-terraform/terraform.tfvars
@@ -0,0 +1,36 @@
 # ──────────────────────────────────────────────
 # General
 # ──────────────────────────────────────────────
 aws_region   = "us-east-2"
 project_name = "langfuse"
 environment  = "dev"
 tags = {
  project    = "doc-processor"
  env        = "dev"
  costCenter = "AI"
  owner      = "ai-team"
 }
 # ──────────────────────────────────────────────
 # Network
 # ──────────────────────────────────────────────
 vpc_id    = "vpc-0270f02aee3bf1b8d"
 subnet_id = "subnet-088bc49c54ec8f028" # public-us-east-1a-subnet
 # ──────────────────────────────────────────────
 # EC2
 # ──────────────────────────────────────────────
 instance_type    = "t3.xlarge"
 instance_name    = "LangfuseEC2"
 sg_name          = "langfuse-sg"
 allowed_ports    = [22, 80, 443, 3000]
 root_volume_size = 100
 root_volume_type = "gp2"
 ebs_device_name  = "/dev/sdf"
 # ──────────────────────────────────────────────
 # Langfuse
 # ──────────────────────────────────────────────
 langfuse_repo_url = "https://github.com/langfuse/langfuse.git"
 langfuse_web_port = 3000
--- a/infra/langfuse-terraform/user_data.sh.tftpl
+++ b/infra/langfuse-terraform/user_data.sh.tftpl
@@ -0,0 +1,66 @@
 #!/bin/bash
 # First-boot provisioning for the Langfuse host: installs Docker, clones the
 # Langfuse repository, writes its .env file, starts the compose stack and,
 # when the device is present, mounts the additional data volume.
 set -e
 # Install Docker
 sudo apt-get update -y
 sudo apt-get install -y ca-certificates curl gnupg git
 sudo install -m 0755 -d /etc/apt/keyrings
 curl -fsSL https://download.docker.com/linux/ubuntu/gpg | sudo gpg --dearmor -o /etc/apt/keyrings/docker.gpg
 sudo chmod a+r /etc/apt/keyrings/docker.gpg
 echo \
  "deb [arch=$(dpkg --print-architecture) signed-by=/etc/apt/keyrings/docker.gpg] https://download.docker.com/linux/ubuntu \
  $(. /etc/os-release && echo "$VERSION_CODENAME") stable" | \
  sudo tee /etc/apt/sources.list.d/docker.list > /dev/null
 sudo apt-get update -y
 sudo apt-get install -y docker-ce docker-ce-cli containerd.io docker-compose-plugin
 # Non-root Docker access is granted through the docker group only. The socket
 # is deliberately NOT made world-writable: write access to it is equivalent
 # to root on the host.
 sudo groupadd docker || true
 sudo usermod -aG docker ubuntu
 sudo systemctl enable docker
 sudo systemctl restart docker
 # Clone and configure Langfuse
 cd /opt
 git clone "${langfuse_repo_url}"
 cd langfuse
 NEXTAUTH_SECRET=$(openssl rand -hex 32)
 # IMDSv2: request a session token first so the metadata lookup also works
 # when the instance only accepts token-based metadata requests.
 IMDS_TOKEN=$(curl -s -X PUT "http://169.254.169.254/latest/api/token" -H "X-aws-ec2-metadata-token-ttl-seconds: 300")
 PUBLIC_IP=$(curl -s -H "X-aws-ec2-metadata-token: $IMDS_TOKEN" http://169.254.169.254/latest/meta-data/public-ipv4)
 SALT=$(openssl rand -hex 16)
 ENCRYPTION_KEY=$(openssl rand -hex 32)
 # NOTE(review): the database, ClickHouse, Redis and MinIO credentials written
 # below are fixed literals committed to the repository, unlike the generated
 # NEXTAUTH_SECRET / SALT / ENCRYPTION_KEY - consider generating them as well.
 cat > .env <<EOF
 NEXTAUTH_SECRET=$NEXTAUTH_SECRET
 NEXTAUTH_URL=http://$PUBLIC_IP:${langfuse_web_port}
 DATABASE_URL=postgresql://postgres:postgres@postgres:5432/postgres
 CLICKHOUSE_URL=http://clickhouse:8123
 CLICKHOUSE_USER=clickhouse
 CLICKHOUSE_PASSWORD=clickhouse
 TELEMETRY_ENABLED=false
 SALT=$SALT
 ENCRYPTION_KEY=$ENCRYPTION_KEY
 REDIS_AUTH=myredissecret
 LANGFUSE_S3_EVENT_UPLOAD_ACCESS_KEY_ID=minio
 LANGFUSE_S3_EVENT_UPLOAD_SECRET_ACCESS_KEY=miniosecret
 LANGFUSE_S3_MEDIA_UPLOAD_ACCESS_KEY_ID=minio
 LANGFUSE_S3_MEDIA_UPLOAD_SECRET_ACCESS_KEY=miniosecret
 LANGFUSE_S3_BATCH_EXPORT_ACCESS_KEY_ID=minio
 LANGFUSE_S3_BATCH_EXPORT_SECRET_ACCESS_KEY=miniosecret
 MINIO_ROOT_USER=minio
 MINIO_ROOT_PASSWORD=miniosecret
 EOF
 sudo docker compose -f docker-compose.yml up -d
 # Mount additional EBS volume
 DEVICE="${ebs_device_name}"
 MOUNT_DIR="/mnt/langfuse-data"
 if [ -b "$DEVICE" ]; then
  # Create a filesystem only when blkid finds none, so a volume that already
  # holds data is never reformatted.
  if ! sudo blkid "$DEVICE" > /dev/null 2>&1; then
   sudo mkfs -t ext4 "$DEVICE"
  fi
  sudo mkdir -p "$MOUNT_DIR"
  sudo mount "$DEVICE" "$MOUNT_DIR"
  echo "$DEVICE $MOUNT_DIR ext4 defaults,nofail 0 2" | sudo tee -a /etc/fstab
 else
  echo "Volume $DEVICE not found."
 fi
--- a/infra/langfuse-terraform/variables.tf
+++ b/infra/langfuse-terraform/variables.tf
@@ -0,0 +1,103 @@
 # ──────────────────────────────────────────────
 # General
 # ──────────────────────────────────────────────
 variable "aws_region" {
  description = "AWS region"
  type        = string
  default     = "us-east-1"
 }
 variable "project_name" {
  description = "Project name used for resource naming"
  type        = string
 }
 variable "environment" {
  description = "Environment (dev, staging, prod)"
  type        = string
 }
 variable "tags" {
  description = "Tags applied to all resources"
  type        = map(string)
  default     = {}
 }
 # ──────────────────────────────────────────────
 # Network
 # ──────────────────────────────────────────────
 variable "vpc_id" {
  description = "VPC ID where resources will be created"
  type        = string
 }
 variable "subnet_id" {
  description = "Subnet ID for the EC2 instance (must be public for associate_public_ip)"
  type        = string
 }
 # ──────────────────────────────────────────────
 # EC2
 # ──────────────────────────────────────────────
 variable "instance_type" {
  description = "EC2 instance type (langfuse requires at least t3.xlarge)"
  type        = string
  default     = "t3.xlarge"
 }
 variable "instance_name" {
  description = "Name tag for the EC2 instance"
  type        = string
  default     = "LangfuseEC2"
 }
 variable "key_name" {
  description = "EC2 key pair name for SSH access (optional)"
  type        = string
  default     = ""
 }
 variable "sg_name" {
  description = "Security group name"
  type        = string
  default     = "langfuse-sg"
 }
 variable "allowed_ports" {
  description = "List of TCP ports to allow inbound"
  type        = list(number)
  default     = [22, 80, 443, 3000]
 }
 variable "root_volume_size" {
  description = "Root EBS volume size in GB"
  type        = number
  default     = 100
 }
 variable "root_volume_type" {
  description = "Root EBS volume type"
  type        = string
  default     = "gp2"
 }
 variable "ebs_device_name" {
  description = "Device name for the additional EBS volume"
  type        = string
  default     = "/dev/sdf"
 }
 # ──────────────────────────────────────────────
 # Langfuse
 # ──────────────────────────────────────────────
 variable "langfuse_repo_url" {
  description = "Langfuse git repository URL"
  type        = string
  default     = "https://github.com/langfuse/langfuse.git"
 }
 variable "langfuse_web_port" {
  description = "Langfuse web UI port"
  type        = number
  default     = 3000
 }