Mistral AI Code Sandbox with Approval Gates for SMB Data Teams

Let business analysts run analytical Python scripts generated by an LLM, with mandatory human approval before execution and full audit trails.

mistral code-execution human-in-the-loop nextjs e2b approval-workflow budget-control data-analysis

The problem

Small businesses want to let non-engineers use natural language to run data analyses, but fear untrusted code execution, runaway costs, and compliance risks. No off-the-shelf tool offers human-in-the-loop gating with fine-grained spend controls.

Built from

Intro

This tutorial walks you through building a human-in-the-loop code sandbox for small-to-medium business data teams. You’ll build a Next.js application where a business analyst types a natural-language data question, Mistral AI generates Python code, a reviewer must explicitly approve the code before it runs, and the approved code executes inside an isolated E2B sandbox. Budget caps, session continuity, and full audit trails are baked in from the start.

By the end, you’ll have a working approval-gated AI code analysis tool that non-engineers can use safely, with spend controls, cost telemetry, and Langfuse observability.

Prerequisites

Node.js 22+ and pnpm 10+
A Mistral AI API key — get one at console.mistral.ai
An E2B API key — sign up at e2b.dev
A Supabase project (free tier works) — create one at supabase.com
A Langfuse account (optional for observability) — set up at langfuse.com
Familiarity with TypeScript, Next.js App Router, and basic tRPC concepts

Step 1: Bootstrap the Next.js project and install dependencies

Start with a fresh Next.js project using the App Router and TypeScript:

Example artifact

A complete, working implementation of this recipe — downloadable as a zip or browsable file by file. Generated by our build pipeline; tested with full coverage before publishing.

Download example (zip) · Browse files

189 kB·165 tests·96.2% coverage·vitest passing

SHA-256: 2a41f0a3f55372ae0067050969f09ca7516745ee2bce96d5cec6e98aec8cef70

Book a conversation · All solutions

Comments

Loading comments…

import { createClient, type SupabaseClient } from "@supabase/supabase-js";
import { getConfig } from "../lib/config";

/** Module-level cache so every caller shares one Supabase client. */
let client: SupabaseClient | null = null;

/**
 * Returns the shared Supabase client, building it on first use from the
 * configured URL and secret key with session persistence turned off.
 */
export function getSupabase(): SupabaseClient {
  if (client === null) {
    const { supabaseUrl, supabaseSecretKey } = getConfig();
    client = createClient(supabaseUrl, supabaseSecretKey, {
      auth: { persistSession: false },
    });
  }
  return client;
}

/** Column shared by every table: a UUID primary key generated by the database. */
const uuidPrimaryKey = "id UUID PRIMARY KEY DEFAULT gen_random_uuid()";

/** Renders one idempotent CREATE TABLE statement from a table name and its column definitions. */
const createTableSql = (table: string, columns: readonly string[]): string =>
  `CREATE TABLE IF NOT EXISTS ${table} ( ${columns.join(", ")} );`;

/** The five tables created by migrateSchema, in creation order (sessions first, since others reference it). */
const schemaStatements: readonly string[] = [
  createTableSql("sessions", [
    uuidPrimaryKey,
    "user_id TEXT NOT NULL",
    "status TEXT NOT NULL DEFAULT 'active'",
    "metadata JSONB DEFAULT '{}'",
    "created_at TIMESTAMPTZ DEFAULT NOW()",
    "last_activity_at TIMESTAMPTZ DEFAULT NOW()",
  ]),
  createTableSql("messages", [
    uuidPrimaryKey,
    "session_id UUID REFERENCES sessions(id)",
    "role TEXT NOT NULL",
    "content TEXT NOT NULL",
    "created_at TIMESTAMPTZ DEFAULT NOW()",
  ]),
  createTableSql("approval_requests", [
    uuidPrimaryKey,
    "code TEXT NOT NULL",
    "user_id TEXT NOT NULL",
    "team_id TEXT NOT NULL",
    "session_id UUID REFERENCES sessions(id)",
    "budget_estimate FLOAT NOT NULL",
    "approval_status TEXT DEFAULT 'pending'",
    "reviewer_id TEXT",
    "rejection_reason TEXT",
    "created_at TIMESTAMPTZ DEFAULT NOW()",
  ]),
  createTableSql("cost_spans", [
    uuidPrimaryKey,
    "provider TEXT NOT NULL",
    "model TEXT NOT NULL",
    "input_tokens INT NOT NULL",
    "output_tokens INT NOT NULL",
    "cost_usd FLOAT NOT NULL",
    "tenant TEXT NOT NULL",
    "feature TEXT NOT NULL",
    "timestamp TIMESTAMPTZ DEFAULT NOW()",
  ]),
  createTableSql("audit_logs", [
    uuidPrimaryKey,
    "action TEXT NOT NULL",
    "actor_id TEXT NOT NULL",
    "details JSONB DEFAULT '{}'",
    "created_at TIMESTAMPTZ DEFAULT NOW()",
  ]),
];

/**
 * Creates the application tables if they do not exist by sending the whole
 * script through the `exec_sql` RPC.
 *
 * @param supabase Client used to issue the RPC.
 * @throws Error prefixed with "migrateSchema failed" when the RPC reports an error.
 */
export async function migrateSchema(supabase: SupabaseClient): Promise<void> {
  // Statements are space-separated and padded with one space on each side.
  const script = ` ${schemaStatements.join(" ")} `;
  const outcome = await supabase.rpc("exec_sql", { query: script });
  if (outcome.error) {
    throw new Error(`migrateSchema failed: ${outcome.error.message}`);
  }
}

/**
 * Appends one row to the `audit_logs` table, stamped with the current time.
 *
 * @param supabase Client used for the insert.
 * @param action Name of the audited action.
 * @param actorId Identifier of whoever performed the action.
 * @param details Free-form payload stored in the `details` column.
 * @throws Error prefixed with "audit log insert failed" when the insert reports an error.
 */
export async function insertAuditLog(
  supabase: SupabaseClient,
  action: string,
  actorId: string,
  details: Record<string, unknown>,
): Promise<void> {
  const row = {
    action,
    actor_id: actorId,
    details,
    created_at: new Date().toISOString(),
  };
  const outcome = await supabase.from("audit_logs").insert(row);
  if (outcome.error) {
    throw new Error(`audit log insert failed: ${outcome.error.message}`);
  }
}

import { Mistral } from "@mistralai/mistralai";
import { MistralError } from "@mistralai/mistralai/models/errors";
import type { ContentChunk } from "@mistralai/mistralai/models/components";
import pRetry from "p-retry";
import { getConfig } from "../lib/config";
import * as logger from "../lib/logger";

/** Instruction given to the model ahead of the analyst's query. */
const systemPrompt = "You are a Python data analysis code generator. Given a natural language query, generate Python code using pandas, matplotlib, and numpy to answer it. Return ONLY the Python code inside a markdown code block. Do NOT include explanatory text.";

/** Matches the first fenced code block (optionally tagged `python`) and captures its body. */
const fencedCodePattern = /```(?:python)?\s*\n?([\s\S]*?)```/;

/** Module-level cache so the SDK client is constructed only once. */
let client: Mistral | null = null;

/**
 * Returns the shared Mistral SDK client, creating it on first use with the
 * configured API key (an empty string when none is configured).
 */
export function createMistralClient(): Mistral {
  if (client) return client;
  const config = getConfig();
  client = new Mistral({ apiKey: config.mistralApiKey || "" });
  return client;
}

/**
 * Flattens a completion's message content to plain text.
 * Strings pass through, chunk arrays contribute the `text` of every chunk that
 * has one, and missing content yields an empty string.
 */
function extractTextContent(content: string | ContentChunk[] | null | undefined): string {
  if (!content) return "";
  if (typeof content === "string") return content;
  return content
    .map((chunk) => ("text" in chunk ? (chunk as { text: string }).text : ""))
    .join("");
}

/**
 * Asks the configured Mistral model to write Python code for a natural-language query.
 *
 * The request is retried up to three times via p-retry. The returned `code` is
 * the body of the first fenced code block in the reply, or the whole trimmed
 * reply when no fence is present.
 *
 * @param query The analyst's natural-language question.
 * @returns The extracted code, the model name reported by the API, and token usage.
 * @throws MistralError re-wrapped with a "Mistral API error:" prefix when the SDK
 *   raised one; any other error is logged and rethrown unchanged.
 */
export async function generateCode(
  query: string,
): Promise<{ code: string; model: string; usage: { promptTokens: number; completionTokens: number } }> {
  const config = getConfig();
  const c = createMistralClient();

  const run = async () => {
    const result = await c.chat.complete({
      model: config.mistralModel,
      messages: [
        // Fix: the instructions go in the system role; they were previously
        // sent as a second user turn.
        { role: "system" as const, content: systemPrompt },
        { role: "user" as const, content: query },
      ],
    });

    const rawContent = result.choices[0]?.message?.content;
    const content = extractTextContent(rawContent);
    const model = result.model;
    const promptTokens = result.usage.promptTokens ?? 0;
    const completionTokens = result.usage.completionTokens ?? 0;

    const codeMatch = content.match(fencedCodePattern);
    const code = codeMatch?.[1]?.trim() ?? content.trim();

    return { code, model, usage: { promptTokens, completionTokens } };
  };

  try {
    return await pRetry(run, { retries: 3 });
  } catch (err) {
    if (err instanceof MistralError) {
      const statusCode = err.statusCode;
      const body = err.body;
      logger.error("Mistral API error", { statusCode, body });
      throw new MistralError(`Mistral API error: ${err.message}`, {
        response: err.rawResponse,
        request: new Request(err.rawResponse.url),
        body: err.body,
      });
    }
    logger.error("Mistral code generation failed", { error: String(err) });
    throw err;
  }
}

import { BudgetController } from "@reaatech/agent-budget-engine";
import { BudgetScope } from "@reaatech/agent-budget-types";
import { SpendStore } from "../lib/adapters/spend-store";
import * as logger from "../lib/logger";

/** Module-level cache holding the single budget controller instance. */
let controller: BudgetController | null = null;

/**
 * Returns the shared budget controller. On first call it is created with a
 * SpendStore-backed tracker and wired to log "hard-stop" and
 * "threshold-breach" events as warnings.
 */
export function createBudgetController(): BudgetController {
  if (controller !== null) {
    return controller;
  }

  const created = new BudgetController({ spendTracker: new SpendStore() });
  // Cache before attaching listeners, as the original did.
  controller = created;

  created.on("hard-stop", ({ scopeType, scopeKey }) => {
    logger.warn("Budget hard stop triggered", { scopeType, scopeKey });
  });
  created.on("threshold-breach", ({ threshold }) => {
    logger.warn("Budget threshold breached", { threshold });
  });

  return created;
}

/**
 * Registers a user-scoped budget on the shared controller.
 *
 * @param userId Scope key for the budget.
 * @param limitUsd Budget limit passed as `limit`.
 * @param softCapPct Value passed as the policy's `softCap` (default 0.8).
 */
export function defineUserBudget(
  userId: string,
  limitUsd: number,
  softCapPct: number = 0.8,
): void {
  const policy = {
    softCap: softCapPct,
    hardCap: 1.0,
    autoDowngrade: [],
    disableTools: [],
  };
  createBudgetController().defineBudget({
    scopeType: BudgetScope.User,
    scopeKey: userId,
    limit: limitUsd,
    policy,
  });
}

/**
 * Runs a pre-flight budget check for a user and returns the controller's verdict.
 *
 * @param userId Scope key to check.
 * @param estimatedCost Estimated cost of the upcoming request.
 * @param modelId Model the request intends to use.
 * @returns `allowed` plus any suggested model and disabled tools reported by the controller.
 */
export function checkBudget(
  userId: string,
  estimatedCost: number,
  modelId: string,
): { allowed: boolean; suggestedModel?: string; disabledTools?: string[] } {
  const { allowed, suggestedModel, disabledTools } = createBudgetController().check({
    scopeType: BudgetScope.User,
    scopeKey: userId,
    estimatedCost,
    modelId,
    tools: [],
  });
  return { allowed, suggestedModel, disabledTools };
}

/**
 * Records actual spend for a user against the shared controller, tagged with
 * provider "mistral" and the current time.
 */
export function recordSpend(
  userId: string,
  requestId: string,
  cost: number,
  inputTokens: number,
  outputTokens: number,
  modelId: string,
): void {
  const entry = {
    requestId,
    scopeType: BudgetScope.User,
    scopeKey: userId,
    cost,
    inputTokens,
    outputTokens,
    modelId,
    provider: "mistral",
    timestamp: new Date(),
  };
  createBudgetController().record(entry);
}

/**
 * Reads the current budget state for a user.
 *
 * @returns The controller's spent/remaining/state values, or zeros with state
 *   "unknown" when the controller has no state for this user.
 */
export function getBudgetState(
  userId: string,
): { spent: number; remaining: number; state: string } {
  const snapshot = createBudgetController().getState(BudgetScope.User, userId);
  return snapshot
    ? { spent: snapshot.spent, remaining: snapshot.remaining, state: snapshot.state }
    : { spent: 0, remaining: 0, state: "unknown" };
}

import {
  generateId,
  now,
  calculateCostFromTokens,
  getWindowStart,
  getWindowEnd,
  type CostSpan,
} from "@reaatech/llm-cost-telemetry";
import type { SupabaseClient } from "@supabase/supabase-js";

/**
 * Builds a cost span for one LLM call.
 *
 * When `costUsd` is not positive, the cost is derived with
 * `calculateCostFromTokens(inputTokens + outputTokens, 30)`.
 *
 * @param userId Currently unused: the span carries only `teamId` (as `tenant`).
 * @param teamId Stored as the span's `tenant`.
 * @param provider Provider name; asserted to the span's provider union without a runtime check.
 * @param model Model identifier.
 * @param inputTokens Prompt token count.
 * @param outputTokens Completion token count.
 * @param costUsd Known cost in USD, or a non-positive value to have it computed.
 * @param feature Feature label for attribution.
 */
export function createCostSpan(
  userId: string,
  teamId: string,
  provider: string,
  model: string,
  inputTokens: number,
  outputTokens: number,
  costUsd: number,
  feature: string,
): CostSpan {
  const ts = now();
  return {
    id: generateId(),
    provider: provider as "openai" | "anthropic" | "google",
    model,
    inputTokens,
    outputTokens,
    costUsd: costUsd > 0 ? costUsd : calculateCostFromTokens(inputTokens + outputTokens, 30),
    tenant: teamId,
    feature,
    timestamp: ts,
  };
}

/**
 * Persists a cost span as one row in the `cost_spans` table.
 * A span without a timestamp is stamped with the current time.
 *
 * @throws Error prefixed with "cost span insert failed" when the insert reports an error.
 */
export async function bufferCostSpan(
  supabase: SupabaseClient,
  span: CostSpan,
): Promise<void> {
  const { error } = await supabase.from("cost_spans").insert({
    id: span.id,
    provider: span.provider,
    model: span.model,
    input_tokens: span.inputTokens,
    output_tokens: span.outputTokens,
    cost_usd: span.costUsd,
    tenant: span.tenant,
    feature: span.feature,
    timestamp: (span.timestamp ?? new Date()).toISOString(),
  });
  if (error) throw new Error(`cost span insert failed: ${error.message}`);
}

/**
 * Sums `cost_usd` over all `cost_spans` rows whose `tenant` equals `tenant`
 * and whose timestamp falls inside the current daily or monthly window.
 *
 * @param caller Name used as the error-message prefix, so each public wrapper
 *   keeps its own "<name> failed: …" message.
 */
async function sumTenantSpend(
  supabase: SupabaseClient,
  tenant: string,
  window: "daily" | "monthly",
  caller: string,
): Promise<number> {
  const windowArg = window === "daily" ? "day" : "month";

  // Derive both bounds from one instant so they cannot land in different
  // windows when the call straddles a day/month boundary. Each helper gets its
  // own copy in case it mutates its argument.
  const reference = new Date();
  const start = getWindowStart(new Date(reference.getTime()), windowArg);
  const end = getWindowEnd(new Date(reference.getTime()), windowArg);

  const { data, error } = await supabase
    .from("cost_spans")
    .select("cost_usd")
    .eq("tenant", tenant)
    .gte("timestamp", start.toISOString())
    .lte("timestamp", end.toISOString());
  if (error) throw new Error(`${caller} failed: ${error.message}`);

  // Treat a null result set as "no rows" rather than crashing in reduce.
  const rows = (data ?? []) as { cost_usd: number }[];
  return rows.reduce((sum, row) => sum + row.cost_usd, 0);
}

/**
 * Total spend attributed to `userId` in the current daily or monthly window.
 *
 * NOTE(review): this filters the `tenant` column by `userId`, but
 * `createCostSpan` stores `teamId` as `tenant` and `bufferCostSpan` writes no
 * user id column. As written this only matches rows whose tenant equals the
 * user id — confirm whether a per-user column is intended.
 *
 * @throws Error prefixed with "getUserSpend failed" when the query reports an error.
 */
export async function getUserSpend(
  supabase: SupabaseClient,
  userId: string,
  window: "daily" | "monthly",
): Promise<number> {
  return sumTenantSpend(supabase, userId, window, "getUserSpend");
}

/**
 * Total spend for the tenant `teamId` in the current daily or monthly window.
 *
 * @throws Error prefixed with "getTeamSpend failed" when the query reports an error.
 */
export async function getTeamSpend(
  supabase: SupabaseClient,
  teamId: string,
  window: "daily" | "monthly",
): Promise<number> {
  return sumTenantSpend(supabase, teamId, window, "getTeamSpend");
}

import {
  createHandoffConfig,
  TypedEventEmitter,
  withRetry,
  pickDefined,
  type HandoffPayload,
  type HandoffConfig,
} from "@reaatech/agent-handoff";
import type { ExecutionOutput } from "../types";

/** Handoff configuration with the routing confidence threshold set to 0.7. */
export const defaultConfig: HandoffConfig = createHandoffConfig({
  routing: { minConfidenceThreshold: 0.7 },
});

/** Events carried by the bus returned from createEventBus. */
type HandoffEvents = {
  "handoff:start": { sessionId: string };
  "handoff:complete": { sessionId: string; duration: number };
  "handoff:error": { sessionId: string; error: Error };
};

/** Compressed-context stub: only `summary` is populated, every list is empty and every counter is zero. */
function summaryOnlyContext(summary: string): HandoffPayload["compressedContext"] {
  return {
    summary,
    keyFacts: [],
    intents: [],
    entities: [],
    openItems: [],
    compressionMethod: "sliding_window",
    originalTokenCount: 0,
    compressedTokenCount: 0,
    compressionRatio: 0,
  };
}

/** Handoff reason used by both payload builders; only the message differs. */
function pipelineReason(message: string): HandoffPayload["handoffReason"] {
  return {
    type: "confidence_too_low",
    currentConfidence: 0,
    threshold: 0.6,
    message,
  };
}

/** Conversation state with nothing resolved, asked, or stored. */
function blankConversationState(): HandoffPayload["conversationState"] {
  return { resolvedEntities: {}, openQuestions: [], contextVariables: {} };
}

/**
 * Builds the handoff payload that carries generated code toward execution.
 * The code is placed both in the context summary and in `customData.code`.
 *
 * @param sessionId Used as both the session id and the conversation id.
 * @param code Generated source code.
 * @param userId Recorded in the payload's user metadata.
 */
export function buildCodeGenerationPayload(
  sessionId: string,
  code: string,
  userId: string,
): HandoffPayload {
  return {
    handoffId: `handoff-${String(Date.now())}`,
    sessionId,
    conversationId: sessionId,
    sessionHistory: [],
    compressedContext: summaryOnlyContext(code),
    handoffReason: pipelineReason("Code generation to execution"),
    userMetadata: pickDefined({ userId, sessionId }) as { userId: string; sessionId?: string },
    conversationState: blankConversationState(),
    createdAt: new Date(),
    customData: pickDefined({ code }),
  };
}

/**
 * Builds the handoff payload that reports an execution result.
 * The result is JSON-serialised into the context summary and attached as
 * `customData.result`; the user id is left as an empty string.
 *
 * @param sessionId Used as both the session id and the conversation id.
 * @param result Output of the sandbox execution.
 */
export function buildExecutionResultPayload(
  sessionId: string,
  result: ExecutionOutput,
): HandoffPayload {
  return {
    handoffId: `handoff-${String(Date.now())}`,
    sessionId,
    conversationId: sessionId,
    sessionHistory: [],
    compressedContext: summaryOnlyContext(JSON.stringify(result)),
    handoffReason: pipelineReason("Code execution complete"),
    userMetadata: { userId: "" },
    conversationState: blankConversationState(),
    createdAt: new Date(),
    customData: pickDefined({ result }),
  };
}

/** Creates a fresh typed emitter for the handoff start/complete/error events. */
export function createEventBus(): TypedEventEmitter<{
  "handoff:start": { sessionId: string };
  "handoff:complete": { sessionId: string; duration: number };
  "handoff:error": { sessionId: string; error: Error };
}> {
  return new TypedEventEmitter<HandoffEvents>();
}

/**
 * Runs `fn` through `withRetry` using this module's defaults: up to 3 retries,
 * exponential backoff between 100 ms and 5000 ms, retrying only when the
 * thrown value is an `Error` instance.
 */
export async function retryWithDefaults<T>(fn: () => Promise<T>): Promise<T> {
  const retryOnErrorInstances = (err: unknown): boolean => err instanceof Error;
  return withRetry(fn, {
    maxRetries: 3,
    backoff: "exponential",
    baseDelayMs: 100,
    maxDelayMs: 5000,
    shouldRetry: retryOnErrorInstances,
  });
}

import { type NextRequest, NextResponse } from "next/server";
import { ApprovalStore, approveRequest, rejectRequest } from "../../../src/services/firewall-service";
import { getSupabase, insertAuditLog } from "../../../src/services/supabase-service";

/** Reason recorded when a rejection arrives without one. */
const DEFAULT_REJECTION_REASON = "No reason given";

/** A validated approval decision; `reason` is always resolved to a string. */
interface ApprovalDecision {
  requestId: string;
  approved: boolean;
  reviewerId: string;
  reason: string;
}

/**
 * Validates the untrusted request body.
 *
 * `approved` must be a real boolean: a truthiness check would treat the string
 * "false" as an approval. `requestId` and `reviewerId` must be non-empty
 * strings. `reason` may be omitted or null, in which case the default is used.
 *
 * @returns The decision, or `null` when the body is malformed.
 */
function parseDecision(raw: unknown): ApprovalDecision | null {
  if (typeof raw !== "object" || raw === null) return null;
  const { requestId, approved, reviewerId, reason } = raw as Record<string, unknown>;

  if (typeof requestId !== "string" || requestId.length === 0) return null;
  if (typeof reviewerId !== "string" || reviewerId.length === 0) return null;
  if (typeof approved !== "boolean") return null;
  if (reason != null && typeof reason !== "string") return null;

  return {
    requestId,
    approved,
    reviewerId,
    reason: typeof reason === "string" ? reason : DEFAULT_REJECTION_REASON,
  };
}

/**
 * Records a reviewer's approve/reject decision for a pending approval request.
 *
 * Steps, in order: persist the decision through the approval store, emit a
 * Langfuse trace, then write an audit-log row.
 *
 * Responses: 200 `{ ok: true }` on success; 400 when the body is not valid
 * JSON or fails validation; 500 with the error message when any step throws.
 *
 * NOTE(review): `reviewerId` is taken from the request body and nothing in
 * this handler authenticates it — confirm that identity is enforced upstream.
 */
export async function POST(req: NextRequest) {
  let raw: unknown;
  try {
    raw = await req.json();
  } catch {
    return NextResponse.json({ error: "Request body must be valid JSON" }, { status: 400 });
  }

  const decision = parseDecision(raw);
  if (decision === null) {
    return NextResponse.json(
      { error: "Body must include string requestId, string reviewerId, and boolean approved" },
      { status: 400 },
    );
  }

  try {
    const { requestId, reviewerId, approved, reason } = decision;
    const supabase = getSupabase();
    const store = new ApprovalStore(supabase);
    // Loaded on demand, as before, so the tracing module is only pulled in when a decision is made.
    const { traceApproval } = await import("../../../src/services/langfuse-service");

    if (approved) {
      await approveRequest(store, requestId, reviewerId);
      traceApproval(`approve-${requestId}`, requestId, {
        requestId,
        approved: true,
        reviewerId,
        decidedAt: new Date(),
      });
      await insertAuditLog(supabase, "approve", reviewerId, { requestId });
    } else {
      await rejectRequest(store, requestId, reviewerId, reason);
      traceApproval(`reject-${requestId}`, requestId, {
        requestId,
        approved: false,
        reviewerId,
        reason,
        decidedAt: new Date(),
      });
      await insertAuditLog(supabase, "reject", reviewerId, { requestId, reason });
    }

    return NextResponse.json({ ok: true });
  } catch (err) {
    const message = err instanceof Error ? err.message : "Unknown error";
    return NextResponse.json({ error: message }, { status: 500 });
  }
}

Mistral AI Code Sandbox with Approval Gates for SMB Data Teams

The problem

Built from

Intro

Prerequisites

Step 1: Bootstrap the Next.js project and install dependencies

Example artifact

Comments

Intro

Prerequisites

Step 1: Bootstrap the Next.js project and install dependencies

Step 2: Configure environment variables

Step 3: Define shared types

Step 4: Create the Supabase client and schema migration

Step 5: Build the approval store and firewall

Step 6: Wire up the Mistral AI code generator

Step 7: Create the code interpreter sandbox

Step 8: Add budget enforcement with agent-budget-engine

Step 9: Add session continuity

Step 10: Add cost telemetry and Langfuse observability

Step 11: Create the agent handoff service

Step 12: Set up the tRPC router and context

Step 13: Create the Next.js API route handlers

Step 14: Build the frontend UI

Step 15: Run the tests

Next steps