Flask Integration

Automatic request tracing for Flask applications.

Quick Start

app.py (Python)
import tracium
from flask import Flask, request
from openai import OpenAI

# Initialize Tracium FIRST — before the Flask app is created — so request
# instrumentation is in place when routes are registered.
tracium.trace()

app = Flask(__name__)
openai_client = OpenAI()


@app.route("/chat", methods=["POST"])
def chat():
    """POST /chat: send the JSON "message" field to the model and return its reply.

    No tracing code is needed in the route body: Tracium instruments the
    request automatically.
    """
    # This request is automatically traced
    message = request.json["message"]
    response = openai_client.chat.completions.create(
        model="gpt-4",
        messages=[{"role": "user", "content": message}],
    )
    return {"response": response.choices[0].message.content}


if __name__ == "__main__":
    app.run(debug=True)

What Gets Captured

  • Request path - URL and HTTP method
  • Endpoint name - Flask endpoint/function name
  • Response status - HTTP status code
  • Latency - Request duration
  • Child spans - LLM calls, database queries, etc.

Manual Traces

import tracium
from flask import Flask, request
from openai import OpenAI

tracium.trace()

app = Flask(__name__)
openai_client = OpenAI()
tracium_client = tracium.get_client()


@app.route("/analyze", methods=["POST"])
def analyze():
    """POST /analyze: preprocess the JSON "text" field, then query the model.

    Demonstrates a manual Tracium agent trace with a child "tool" span
    recorded around the preprocessing step; the LLM call happens inside the
    same trace so it is attached as a child span.
    """
    text = request.json["text"]
    with tracium_client.agent_trace(
        agent_name="flask-analyzer",
        tags=["flask", "analyze"],
    ) as trace:
        with trace.span(span_type="tool", name="preprocess") as span:
            span.record_input({"text": text})
            # NOTE(review): `preprocess` is assumed to be an application-defined
            # helper — it is not defined in this example.
            processed = preprocess(text)
            span.record_output({"processed": processed})
        response = openai_client.chat.completions.create(
            model="gpt-4",
            messages=[{"role": "user", "content": processed}],
        )
        return {"result": response.choices[0].message.content}

Blueprints

import tracium
from flask import Flask, Blueprint
from openai import OpenAI

tracium.trace()

# Blueprint routes are traced automatically
api = Blueprint("api", __name__, url_prefix="/api")
openai_client = OpenAI()


@api.route("/chat", methods=["POST"])
def chat():
    """POST /api/chat: blueprint route, traced the same as an app route."""
    from flask import request

    message = request.json["message"]
    response = openai_client.chat.completions.create(
        model="gpt-4",
        messages=[{"role": "user", "content": message}],
    )
    return {"response": response.choices[0].message.content}


app = Flask(__name__)
app.register_blueprint(api)

Error Handling

import tracium
from flask import Flask, jsonify
from openai import OpenAI, RateLimitError

tracium.trace()

app = Flask(__name__)
openai_client = OpenAI()


@app.errorhandler(500)
def handle_error(error):
    """Return a JSON error body for unhandled server errors."""
    # Errors are captured in the trace
    return jsonify({"error": str(error)}), 500


@app.route("/chat", methods=["POST"])
def chat():
    """POST /chat: query the model, mapping rate-limit failures to HTTP 429."""
    try:
        from flask import request

        response = openai_client.chat.completions.create(
            model="gpt-4",
            messages=[{"role": "user", "content": request.json["message"]}],
        )
        return {"response": response.choices[0].message.content}
    except RateLimitError:
        # Exception is recorded in trace
        return jsonify({"error": "Rate limited"}), 429

With Gunicorn

# Run with gunicorn
gunicorn -w 4 app:app