Skip to content

Instantly share code, notes, and snippets.

@connyay
Created July 2, 2025 14:02
Show Gist options
  • Select an option

  • Save connyay/f649e4cb53c643ed23d0be1bf7ac8e23 to your computer and use it in GitHub Desktop.

Select an option

Save connyay/f649e4cb53c643ed23d0be1bf7ac8e23 to your computer and use it in GitHub Desktop.
bifrost
// Package http provides an HTTP service using FastHTTP that exposes endpoints
// for text completions, chat completions, and embeddings using various AI model providers (OpenAI, Anthropic, Bedrock, Mistral, Ollama, etc.).
//
// The HTTP service provides four main endpoints:
// - /v1/text/completions: For text completion requests
// - /v1/chat/completions: For chat completion requests
// - /v1/embeddings: For text embedding requests
// - /v1/mcp/tool/execute: For MCP tool execution requests
//
// Configuration is handled through a JSON config file and environment variables:
// - Use -config flag to specify the config file location
// - Use -port flag to specify the server port (default: 8080)
// - Use -pool-size flag to specify the initial connection pool size (default: 300)
//
// Example usage:
//
// go run main.go -config config.example.json -port 8080 -pool-size 300
// after setting the environment variables present in config.example.json in the environment.
//
// Integration Support:
// Bifrost supports multiple AI provider integrations through dedicated HTTP endpoints.
// Each integration exposes API-compatible endpoints that accept the provider's native request format,
// automatically convert it to Bifrost's unified format, process it, and return the expected response format.
//
// Integration endpoints follow the pattern: /{provider}/{provider_api_path}
// Examples:
// - OpenAI: POST /openai/v1/chat/completions (accepts OpenAI ChatCompletion requests)
// - GenAI: POST /genai/v1beta/models/{model} (accepts Google GenAI requests)
// - Anthropic: POST /anthropic/v1/messages (accepts Anthropic Messages requests)
//
// This allows clients to use their existing integration code without modification while benefiting
// from Bifrost's unified model routing, fallbacks, and monitoring capabilities.
//
// NOTE: Streaming is not supported yet so all the flags related to streaming are ignored. (in both bifrost and its integrations)
package main
import (
	"encoding/json"
	"errors"
	"flag"
	"fmt"
	"log"
	"os"
	"strings"

	"github.com/fasthttp/router"
	bifrost "github.com/maximhq/bifrost/core"
	schemas "github.com/maximhq/bifrost/core/schemas"
	"github.com/maximhq/bifrost/plugins/maxim"
	"github.com/maximhq/bifrost/transports/bifrost-http/integrations"
	"github.com/maximhq/bifrost/transports/bifrost-http/integrations/anthropic"
	"github.com/maximhq/bifrost/transports/bifrost-http/integrations/genai"
	"github.com/maximhq/bifrost/transports/bifrost-http/integrations/litellm"
	"github.com/maximhq/bifrost/transports/bifrost-http/integrations/openai"
	"github.com/maximhq/bifrost/transports/bifrost-http/lib"
	"github.com/maximhq/bifrost/transports/bifrost-http/tracking"
	"github.com/prometheus/client_golang/prometheus"
	"github.com/prometheus/client_golang/prometheus/collectors"
	"github.com/prometheus/client_golang/prometheus/promhttp"
	"github.com/valyala/fasthttp"
	"github.com/valyala/fasthttp/fasthttpadaptor"
)
// Command line flags, populated in init(). These are read once at startup
// and not mutated afterwards.
var (
	initialPoolSize    int      // Initial size of the Bifrost connection pool (-pool-size)
	dropExcessRequests bool     // Whether to drop requests that exceed pool capacity (-drop-excess-requests)
	port               string   // Port the HTTP server listens on (-port)
	configPath         string   // Path to the JSON config file (-config, required)
	pluginsToLoad      []string // Plugin names parsed from the comma separated -plugins flag
	prometheusLabels   []string // Extra Prometheus label names parsed from -prometheus-labels (optional)
)
// init initializes command line flags and validates required configuration.
// It sets up the following flags:
// - pool-size: Initial connection pool size (default: 300)
// - port: Server port (default: 8080)
// - config: Path to config file (required)
// - drop-excess-requests: Whether to drop excess requests
// - plugins: Comma separated list of plugins to load
// - prometheus-labels: Comma separated list of extra Prometheus label names
func init() {
	pluginString := ""
	var prometheusLabelsString string
	flag.IntVar(&initialPoolSize, "pool-size", 300, "Initial pool size for Bifrost")
	flag.StringVar(&port, "port", "8080", "Port to run the server on")
	flag.StringVar(&configPath, "config", "", "Path to the config file")
	flag.BoolVar(&dropExcessRequests, "drop-excess-requests", false, "Drop excess requests")
	flag.StringVar(&pluginString, "plugins", "", "Comma separated list of plugins to load")
	flag.StringVar(&prometheusLabelsString, "prometheus-labels", "", "Labels to add to Prometheus metrics")
	flag.Parse()
	if configPath == "" {
		log.Fatalf("config path is required")
	}
	// Normalize both comma separated lists identically. Previously the plugin
	// list was a raw strings.Split: an empty -plugins flag produced [""] and
	// entries with surrounding whitespace (e.g. "maxim, other") never matched
	// the plugin switch in main because only case, not whitespace, was folded.
	pluginsToLoad = splitAndNormalizeList(pluginString)
	prometheusLabels = splitAndNormalizeList(prometheusLabelsString)
}

// splitAndNormalizeList splits a comma separated list, trims whitespace
// around each entry, lowercases it, and drops empty entries. An empty input
// yields an empty (non-nil) slice.
func splitAndNormalizeList(list string) []string {
	raw := strings.Split(list, ",")
	out := make([]string, 0, len(raw))
	for _, item := range raw {
		if trimmed := strings.TrimSpace(item); trimmed != "" {
			out = append(out, strings.ToLower(trimmed))
		}
	}
	return out
}
// CompletionRequest represents a request for either text or chat completion.
// It includes all necessary fields for both types of completions: the
// /v1/chat/completions handler reads Messages, while /v1/text/completions
// reads Text; the remaining fields are shared.
type CompletionRequest struct {
	Provider  schemas.ModelProvider    `json:"provider"`  // The AI model provider to use (required)
	Messages  []schemas.BifrostMessage `json:"messages"`  // Chat messages (required for chat completion)
	Text      string                   `json:"text"`      // Text input (required for text completion)
	Model     string                   `json:"model"`     // Model to use
	Params    *schemas.ModelParameters `json:"params"`    // Additional model parameters (optional)
	Fallbacks []schemas.Fallback       `json:"fallbacks"` // Fallback providers and models (optional)
}
// EmbeddingRequest represents a request for text embeddings, accepted by the
// /v1/embeddings endpoint.
type EmbeddingRequest struct {
	Provider       schemas.ModelProvider    `json:"provider"`        // The AI model provider to use (required)
	Input          any                      `json:"input"`           // Text input: a JSON string or array of strings
	Model          string                   `json:"model"`           // Model to use
	Params         *schemas.ModelParameters `json:"params"`          // Additional model parameters (optional)
	Fallbacks      []schemas.Fallback       `json:"fallbacks"`       // Fallback providers and models (optional)
	Dimensions     *int                     `json:"dimensions"`      // Number of dimensions for embedding output (optional)
	EncodingFormat *string                  `json:"encoding_format"` // Format of embedding output (e.g., "float", "base64") (optional)
	User           *string                  `json:"user"`            // User identification (optional)
}
// registerCollectorSafely attempts to register a Prometheus collector,
// handling the case where it may already be registered.
// It logs any registration error except prometheus.AlreadyRegisteredError,
// which is expected when the same collector is registered twice.
func registerCollectorSafely(collector prometheus.Collector) {
	err := prometheus.Register(collector)
	if err == nil {
		return
	}
	// errors.As (rather than a direct type assertion) also tolerates an
	// AlreadyRegisteredError that arrives wrapped in another error.
	var alreadyRegistered prometheus.AlreadyRegisteredError
	if !errors.As(err, &alreadyRegistered) {
		log.Printf("Failed to register collector: %v", err)
	}
}
// main is the entry point of the application.
// It:
// 1. Initializes Prometheus collectors for monitoring
// 2. Reads and parses configuration from the specified config file
// 3. Initializes the Bifrost client with the configuration
// 4. Sets up HTTP routes for text and chat completions
// 5. Starts the HTTP server on the specified port
//
// The server exposes the following endpoints:
// - POST /v1/text/completions: For text completion requests
// - POST /v1/chat/completions: For chat completion requests
// - POST /v1/embeddings: For embedding requests
// - GET /metrics: For Prometheus metrics
func main() {
	// Register Prometheus collectors for Go runtime and process statistics,
	// then initialize request metrics with any custom labels from the flags.
	registerCollectorSafely(collectors.NewGoCollector())
	registerCollectorSafely(collectors.NewProcessCollector(collectors.ProcessCollectorOpts{}))
	tracking.InitPrometheusMetrics(prometheusLabels)
	log.Println("Prometheus Go/Process collectors registered.")
	// Load configuration and provider/MCP keys. Key-loading failures are
	// logged as warnings rather than aborting startup.
	config := lib.ReadConfig(configPath)
	account := &lib.BaseAccount{Config: config.ProviderConfig}
	if err := account.ReadKeys(); err != nil {
		log.Printf("warning: failed to read environment variables: %v", err)
	}
	if err := config.ReadMCPKeys(); err != nil {
		log.Printf("warning: failed to read MCP environment variables: %v", err)
	}
	// Build the plugin list from the -plugins flag. A plugin that cannot be
	// initialized is skipped with a warning instead of failing startup.
	loadedPlugins := []schemas.Plugin{}
	for _, plugin := range pluginsToLoad {
		switch strings.ToLower(plugin) {
		case "maxim":
			if os.Getenv("MAXIM_LOG_REPO_ID") == "" {
				log.Println("warning: maxim log repo id is required to initialize maxim plugin")
				continue
			}
			if os.Getenv("MAXIM_API_KEY") == "" {
				log.Println("warning: maxim api key is required in environment variable MAXIM_API_KEY to initialize maxim plugin")
				continue
			}
			maximPlugin, err := maxim.NewMaximLoggerPlugin(os.Getenv("MAXIM_API_KEY"), os.Getenv("MAXIM_LOG_REPO_ID"))
			if err != nil {
				log.Printf("warning: failed to initialize maxim plugin: %v", err)
				continue
			}
			loadedPlugins = append(loadedPlugins, maximPlugin)
		}
	}
	// The Prometheus plugin is always appended so upstream provider metrics
	// are recorded regardless of the -plugins flag.
	promPlugin := tracking.NewPrometheusPlugin()
	loadedPlugins = append(loadedPlugins, promPlugin)
	client, err := bifrost.Init(schemas.BifrostConfig{
		Account:            account,
		InitialPoolSize:    initialPoolSize,
		DropExcessRequests: dropExcessRequests,
		Plugins:            loadedPlugins,
		MCPConfig:          config.MCPConfig,
	})
	if err != nil {
		log.Fatalf("failed to initialize bifrost: %v", err)
	}
	// Provider-compatible integration routers; each registers its own
	// native-format endpoints (e.g. /openai/v1/chat/completions) below.
	r := router.New()
	extensions := []integrations.ExtensionRouter{
		genai.NewGenAIRouter(client),
		openai.NewOpenAIRouter(client),
		anthropic.NewAnthropicRouter(client),
		litellm.NewLiteLLMRouter(client),
	}
	// Core unified-API endpoints.
	r.POST("/v1/text/completions", func(ctx *fasthttp.RequestCtx) {
		handleCompletion(ctx, client, false)
	})
	r.POST("/v1/chat/completions", func(ctx *fasthttp.RequestCtx) {
		handleCompletion(ctx, client, true)
	})
	r.POST("/v1/embeddings", func(ctx *fasthttp.RequestCtx) {
		handleEmbedding(ctx, client)
	})
	r.POST("/v1/mcp/tool/execute", func(ctx *fasthttp.RequestCtx) {
		handleMCPToolExecution(ctx, client)
	})
	for _, extension := range extensions {
		extension.RegisterRoutes(r)
	}
	// Add Prometheus /metrics endpoint
	r.GET("/metrics", fasthttpadaptor.NewFastHTTPHandler(promhttp.Handler()))
	r.NotFound = func(ctx *fasthttp.RequestCtx) {
		ctx.SetStatusCode(fasthttp.StatusNotFound)
		ctx.SetContentType("text/plain")
		ctx.SetBodyString("Route not found: " + string(ctx.Path()))
	}
	server := &fasthttp.Server{
		// A custom handler that excludes middleware from /metrics
		// so scrapes are not counted in the request metrics themselves.
		Handler: func(ctx *fasthttp.RequestCtx) {
			if string(ctx.Path()) == "/metrics" {
				r.Handler(ctx)
				return
			}
			tracking.PrometheusMiddleware(r.Handler)(ctx)
		},
	}
	log.Println("Started Bifrost HTTP server on port", port)
	if err := server.ListenAndServe(fmt.Sprintf(":%s", port)); err != nil {
		log.Fatalf("failed to start server: %v", err)
	}
	// NOTE(review): log.Fatalf above exits the process, so Cleanup only runs
	// when ListenAndServe returns nil; consider a graceful-shutdown path if
	// cleanup on failure matters.
	client.Cleanup()
}
// handleCompletion serves both the text and chat completion endpoints.
//
// Parameters:
// - ctx: The FastHTTP request context
// - client: The Bifrost client instance
// - isChat: true for chat completion, false for text completion
//
// It decodes the body into a CompletionRequest, validates the fields the
// chosen mode requires (Messages for chat, Text for text), forwards the
// request to the Bifrost client, and writes the JSON response or a
// BifrostError back to the caller.
func handleCompletion(ctx *fasthttp.RequestCtx, client *bifrost.Bifrost, isChat bool) {
	var payload CompletionRequest
	if err := json.Unmarshal(ctx.PostBody(), &payload); err != nil {
		ctx.SetStatusCode(fasthttp.StatusBadRequest)
		ctx.SetBodyString(fmt.Sprintf("invalid request format: %v", err))
		return
	}
	if payload.Provider == "" {
		ctx.SetStatusCode(fasthttp.StatusBadRequest)
		ctx.SetBodyString("Provider is required")
		return
	}
	// Validate mode-specific fields and pick the input representation.
	var input schemas.RequestInput
	switch {
	case isChat && len(payload.Messages) == 0:
		ctx.SetStatusCode(fasthttp.StatusBadRequest)
		ctx.SetBodyString("Messages array is required")
		return
	case isChat:
		input = schemas.RequestInput{ChatCompletionInput: &payload.Messages}
	case payload.Text == "":
		ctx.SetStatusCode(fasthttp.StatusBadRequest)
		ctx.SetBodyString("Text is required")
		return
	default:
		input = schemas.RequestInput{TextCompletionInput: &payload.Text}
	}
	bifrostReq := &schemas.BifrostRequest{
		Provider:  payload.Provider,
		Model:     payload.Model,
		Params:    payload.Params,
		Fallbacks: payload.Fallbacks,
		Input:     input,
	}
	bifrostCtx := lib.ConvertToBifrostContext(ctx)
	if bifrostCtx == nil {
		ctx.SetStatusCode(fasthttp.StatusInternalServerError)
		ctx.SetBodyString("Failed to convert context")
		return
	}
	var (
		resp       *schemas.BifrostResponse
		bifrostErr *schemas.BifrostError
	)
	if isChat {
		resp, bifrostErr = client.ChatCompletionRequest(*bifrostCtx, bifrostReq)
	} else {
		resp, bifrostErr = client.TextCompletionRequest(*bifrostCtx, bifrostReq)
	}
	if bifrostErr != nil {
		handleBifrostError(ctx, bifrostErr)
		return
	}
	ctx.SetStatusCode(fasthttp.StatusOK)
	ctx.SetContentType("application/json")
	if encodeErr := json.NewEncoder(ctx).Encode(resp); encodeErr != nil {
		ctx.SetStatusCode(fasthttp.StatusInternalServerError)
		ctx.SetBodyString(fmt.Sprintf("failed to encode response: %v", encodeErr))
	}
}
// handleMCPToolExecution processes MCP tool execution requests.
// It parses the request body into a schemas.ToolCall, forwards it to the
// Bifrost client, and writes the JSON-encoded result back to the caller.
func handleMCPToolExecution(ctx *fasthttp.RequestCtx, client *bifrost.Bifrost) {
	var req schemas.ToolCall
	if err := json.Unmarshal(ctx.PostBody(), &req); err != nil {
		ctx.SetStatusCode(fasthttp.StatusBadRequest)
		ctx.SetBodyString(fmt.Sprintf("invalid request format: %v", err))
		return
	}
	bifrostCtx := lib.ConvertToBifrostContext(ctx)
	// Guard against a nil context before dereferencing it below — the other
	// handlers already do this check; without it a nil result would panic.
	if bifrostCtx == nil {
		ctx.SetStatusCode(fasthttp.StatusInternalServerError)
		ctx.SetBodyString("Failed to convert context")
		return
	}
	resp, bifrostErr := client.ExecuteMCPTool(*bifrostCtx, req)
	if bifrostErr != nil {
		handleBifrostError(ctx, bifrostErr)
		return
	}
	ctx.SetStatusCode(fasthttp.StatusOK)
	ctx.SetContentType("application/json")
	if encodeErr := json.NewEncoder(ctx).Encode(resp); encodeErr != nil {
		ctx.SetStatusCode(fasthttp.StatusInternalServerError)
		ctx.SetBodyString(fmt.Sprintf("failed to encode response: %v", encodeErr))
	}
}
// handleBifrostError writes a BifrostError to the response as JSON, using
// the error's own status code when present and 500 Internal Server Error
// otherwise.
func handleBifrostError(ctx *fasthttp.RequestCtx, bifrostErr *schemas.BifrostError) {
	status := fasthttp.StatusInternalServerError
	if bifrostErr.StatusCode != nil {
		status = *bifrostErr.StatusCode
	}
	ctx.SetStatusCode(status)
	ctx.SetContentType("application/json")
	encodeErr := json.NewEncoder(ctx).Encode(bifrostErr)
	if encodeErr != nil {
		ctx.SetStatusCode(fasthttp.StatusInternalServerError)
		ctx.SetBodyString(fmt.Sprintf("failed to encode error response: %v", encodeErr))
	}
}
// handleEmbedding processes embedding requests.
// It handles request parsing, validation, and response formatting.
//
// Parameters:
// - ctx: The FastHTTP request context
// - client: The Bifrost client instance
//
// The function:
// 1. Parses the request body into an EmbeddingRequest
// 2. Validates required fields and normalizes Input into a list of texts
// 3. Creates a BifrostRequest with the appropriate input type
// 4. Calls the embedding method on the client
// 5. Handles any errors and formats the response
func handleEmbedding(ctx *fasthttp.RequestCtx, client *bifrost.Bifrost) {
	var req EmbeddingRequest
	if err := json.Unmarshal(ctx.PostBody(), &req); err != nil {
		ctx.SetStatusCode(fasthttp.StatusBadRequest)
		ctx.SetBodyString(fmt.Sprintf("invalid request format: %v", err))
		return
	}
	if req.Provider == "" {
		ctx.SetStatusCode(fasthttp.StatusBadRequest)
		ctx.SetBodyString("Provider is required")
		return
	}
	var input schemas.EmbeddingInput
	switch v := req.Input.(type) {
	case string:
		input.Texts = []string{v}
	case []string:
		// Only reachable when the request is constructed in-process; JSON
		// decoding never produces []string (see the []any case below).
		input.Texts = v
	case []any:
		// BUG FIX: encoding/json decodes a JSON array into []any, never
		// []string, so array-valued "input" was previously always rejected.
		// Convert element by element, rejecting non-string members.
		texts := make([]string, 0, len(v))
		for _, item := range v {
			s, ok := item.(string)
			if !ok {
				ctx.SetStatusCode(fasthttp.StatusBadRequest)
				ctx.SetBodyString("Input must be a string or []string")
				return
			}
			texts = append(texts, s)
		}
		input.Texts = texts
	default:
		ctx.SetStatusCode(fasthttp.StatusBadRequest)
		ctx.SetBodyString("Input must be a string or []string")
		return
	}
	bifrostReq := &schemas.BifrostRequest{
		Provider:  req.Provider,
		Model:     req.Model,
		Params:    req.Params,
		Fallbacks: req.Fallbacks,
		Input: schemas.RequestInput{
			EmbeddingInput: &input,
		},
	}
	// If any of the embedding-specific fields are set, ensure we have a
	// Params object to carry them.
	if req.Dimensions != nil || req.EncodingFormat != nil || req.User != nil {
		if bifrostReq.Params == nil {
			bifrostReq.Params = &schemas.ModelParameters{}
		}
		bifrostReq.Params.Dimensions = req.Dimensions
		bifrostReq.Params.EncodingFormat = req.EncodingFormat
		bifrostReq.Params.User = req.User
	}
	bifrostCtx := lib.ConvertToBifrostContext(ctx)
	if bifrostCtx == nil {
		ctx.SetStatusCode(fasthttp.StatusInternalServerError)
		ctx.SetBodyString("Failed to convert context")
		return
	}
	resp, err := client.EmbeddingRequest(*bifrostCtx, bifrostReq)
	if err != nil {
		// NOTE(review): unlike the other handlers this ignores err.StatusCode
		// and maps IsBifrostError to 500/400; consider routing through
		// handleBifrostError for consistency — kept as-is to preserve the
		// existing status-code contract.
		if err.IsBifrostError {
			ctx.SetStatusCode(fasthttp.StatusInternalServerError)
		} else {
			ctx.SetStatusCode(fasthttp.StatusBadRequest)
		}
		ctx.SetContentType("application/json")
		if encodeErr := json.NewEncoder(ctx).Encode(err); encodeErr != nil {
			ctx.SetStatusCode(fasthttp.StatusInternalServerError)
			ctx.SetBodyString(fmt.Sprintf("failed to encode error response: %v", encodeErr))
		}
		return
	}
	ctx.SetStatusCode(fasthttp.StatusOK)
	ctx.SetContentType("application/json")
	if encodeErr := json.NewEncoder(ctx).Encode(resp); encodeErr != nil {
		ctx.SetStatusCode(fasthttp.StatusInternalServerError)
		ctx.SetBodyString(fmt.Sprintf("failed to encode response: %v", encodeErr))
	}
}
// Package tracking provides Prometheus metrics collection and monitoring functionality
// for the Bifrost HTTP service. It includes middleware for HTTP request tracking
// and a plugin for tracking upstream provider metrics.
package tracking
import (
"context"
"fmt"
"log"
"time"
schemas "github.com/maximhq/bifrost/core/schemas"
"github.com/prometheus/client_golang/prometheus"
)
// contextKey is an unexported key type for values this package stores in the
// request context, preventing collisions with keys from other packages.
type contextKey string

// PrometheusContextKey is a custom type for prometheus context keys to prevent collisions.
// Custom label values are read from the context under PrometheusContextKey(label).
type PrometheusContextKey string

// startTimeKey marks when PreHook first saw the request; methodKey records
// the request kind ("chat" or "text") used as the metrics' method label.
const startTimeKey contextKey = "startTime"
const methodKey contextKey = "method"
// PrometheusPlugin implements the schemas.Plugin interface for Prometheus metrics.
// It tracks metrics for upstream provider requests, including:
// - Total number of requests
// - Request latency
type PrometheusPlugin struct {
	// UpstreamRequestsTotal counts upstream provider requests per label set.
	UpstreamRequestsTotal *prometheus.CounterVec
	// UpstreamLatency observes per-request upstream latency in seconds.
	UpstreamLatency *prometheus.HistogramVec
}
// NewPrometheusPlugin creates a new PrometheusPlugin wired to the
// package-level upstream request and latency collectors.
func NewPrometheusPlugin() *PrometheusPlugin {
	plugin := &PrometheusPlugin{}
	plugin.UpstreamRequestsTotal = bifrostUpstreamRequestsTotal
	plugin.UpstreamLatency = bifrostUpstreamLatencySeconds
	return plugin
}
// GetName returns the name of the plugin as reported to Bifrost.
func (p *PrometheusPlugin) GetName() string {
	const pluginName = "bifrost-http-prometheus"
	return pluginName
}
// PreHook stores the request start time in the context so PostHook can
// compute latency, and tags the context with the request kind ("chat" or
// "text") for the metrics' method label. It never short-circuits.
func (p *PrometheusPlugin) PreHook(ctx *context.Context, req *schemas.BifrostRequest) (*schemas.BifrostRequest, *schemas.PluginShortCircuit, error) {
	*ctx = context.WithValue(*ctx, startTimeKey, time.Now())
	switch {
	case req.Input.ChatCompletionInput != nil:
		*ctx = context.WithValue(*ctx, methodKey, "chat")
	case req.Input.TextCompletionInput != nil:
		*ctx = context.WithValue(*ctx, methodKey, "text")
		// Needs a bifrost/core version bump before enabling:
		// case req.Input.EmbeddingInput != nil:
		//	*ctx = context.WithValue(*ctx, methodKey, "embed")
	}
	return req, nil, nil
}
// PostHook calculates duration and records upstream metrics for successful
// requests (result != nil): the latency histogram and the total request
// counter, labelled by target (provider/model), method, and any configured
// custom labels. Missing context values are logged and skipped.
func (p *PrometheusPlugin) PostHook(ctx *context.Context, result *schemas.BifrostResponse, bifrostErr *schemas.BifrostError) (*schemas.BifrostResponse, *schemas.BifrostError, error) {
	if result == nil {
		return result, bifrostErr, nil
	}
	begin, haveStart := (*ctx).Value(startTimeKey).(time.Time)
	if !haveStart {
		log.Println("Warning: startTime not found in context for Prometheus PostHook")
		return result, bifrostErr, nil
	}
	method, haveMethod := (*ctx).Value(methodKey).(string)
	if !haveMethod {
		log.Println("Warning: method not found in context for Prometheus PostHook")
		return result, bifrostErr, nil
	}
	// Gather label values: the fixed target/method pair plus any custom
	// labels carried in the context under PrometheusContextKey keys.
	labelValues := map[string]string{
		"target": fmt.Sprintf("%s/%s", result.ExtraFields.Provider, result.Model),
		"method": method,
	}
	for _, key := range customLabels {
		if str, ok := (*ctx).Value(PrometheusContextKey(key)).(string); ok {
			labelValues[key] = str
		}
	}
	// Order the values to match the collectors' declared label order.
	ordered := getPrometheusLabelValues(append([]string{"target", "method"}, customLabels...), labelValues)
	elapsed := time.Since(begin).Seconds()
	p.UpstreamLatency.WithLabelValues(ordered...).Observe(elapsed)
	p.UpstreamRequestsTotal.WithLabelValues(ordered...).Inc()
	return result, bifrostErr, nil
}
// Cleanup implements the schemas.Plugin interface. The collectors referenced
// by this plugin are package-level and shared, so there is nothing to
// release here; it always returns nil.
func (p *PrometheusPlugin) Cleanup() error {
	return nil
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment