diff --git a/core/cli/run.go b/core/cli/run.go index 9b46b570133e..ba8a677ee3f7 100644 --- a/core/cli/run.go +++ b/core/cli/run.go @@ -77,6 +77,8 @@ type RunCMD struct { DisableGalleryEndpoint bool `env:"LOCALAI_DISABLE_GALLERY_ENDPOINT,DISABLE_GALLERY_ENDPOINT" help:"Disable the gallery endpoints" group:"api"` MachineTag string `env:"LOCALAI_MACHINE_TAG,MACHINE_TAG" help:"Add Machine-Tag header to each response which is useful to track the machine in the P2P network" group:"api"` LoadToMemory []string `env:"LOCALAI_LOAD_TO_MEMORY,LOAD_TO_MEMORY" help:"A list of models to load into memory at startup" group:"models"` + EnableTracing bool `env:"LOCALAI_ENABLE_TRACING,ENABLE_TRACING" help:"Enable API tracing" group:"api"` + TracingMaxItems int `env:"LOCALAI_TRACING_MAX_ITEMS" default:"1024" help:"Maximum number of traces to keep" group:"api"` AgentJobRetentionDays int `env:"LOCALAI_AGENT_JOB_RETENTION_DAYS,AGENT_JOB_RETENTION_DAYS" default:"30" help:"Number of days to keep agent job history (default: 30)" group:"api"` Version bool @@ -149,6 +151,11 @@ func (r *RunCMD) Run(ctx *cliContext.Context) error { opts = append(opts, config.DisableRuntimeSettings) } + if r.EnableTracing { + opts = append(opts, config.EnableTracing) + } + opts = append(opts, config.WithTracingMaxItems(r.TracingMaxItems)) + token := "" if r.Peer2Peer || r.Peer2PeerToken != "" { xlog.Info("P2P mode enabled") diff --git a/core/config/application_config.go b/core/config/application_config.go index 07b8b7682ceb..4d393c7d5dc2 100644 --- a/core/config/application_config.go +++ b/core/config/application_config.go @@ -19,6 +19,8 @@ type ApplicationConfig struct { UploadLimitMB, Threads, ContextSize int F16 bool Debug bool + EnableTracing bool + TracingMaxItems int GeneratedContentDir string UploadDir string @@ -89,6 +91,7 @@ func NewApplicationConfig(o ...AppOption) *ApplicationConfig { Context: context.Background(), UploadLimitMB:
15, Debug: true, + TracingMaxItems: 1024, AgentJobRetentionDays: 30, // Default: 30 days PathWithoutAuth: []string{ "/static/", @@ -158,6 +161,10 @@ var EnableWatchDog = func(o *ApplicationConfig) { o.WatchDog = true } +var EnableTracing = func(o *ApplicationConfig) { + o.EnableTracing = true +} + var EnableWatchDogIdleCheck = func(o *ApplicationConfig) { o.WatchDog = true o.WatchDogIdle = true @@ -386,6 +393,12 @@ func WithDebug(debug bool) AppOption { } } +func WithTracingMaxItems(items int) AppOption { + return func(o *ApplicationConfig) { + o.TracingMaxItems = items + } +} + func WithGeneratedContentDir(generatedContentDir string) AppOption { return func(o *ApplicationConfig) { o.GeneratedContentDir = generatedContentDir @@ -509,6 +522,8 @@ func (o *ApplicationConfig) ToRuntimeSettings() RuntimeSettings { contextSize := o.ContextSize f16 := o.F16 debug := o.Debug + tracingMaxItems := o.TracingMaxItems + enableTracing := o.EnableTracing cors := o.CORS csrf := o.CSRF corsAllowOrigins := o.CORSAllowOrigins @@ -556,6 +571,8 @@ func (o *ApplicationConfig) ToRuntimeSettings() RuntimeSettings { ContextSize: &contextSize, F16: &f16, Debug: &debug, + TracingMaxItems: &tracingMaxItems, + EnableTracing: &enableTracing, CORS: &cors, CSRF: &csrf, CORSAllowOrigins: &corsAllowOrigins, @@ -656,6 +673,12 @@ func (o *ApplicationConfig) ApplyRuntimeSettings(settings *RuntimeSettings) (req if settings.Debug != nil { o.Debug = *settings.Debug } + if settings.EnableTracing != nil { + o.EnableTracing = *settings.EnableTracing + } + if settings.TracingMaxItems != nil { + o.TracingMaxItems = *settings.TracingMaxItems + } if settings.CORS != nil { o.CORS = *settings.CORS } diff --git a/core/config/runtime_settings.go b/core/config/runtime_settings.go index c02d4fcd7c20..01c6f383d703 100644 --- a/core/config/runtime_settings.go +++ b/core/config/runtime_settings.go @@ -27,10 +27,12 @@ type RuntimeSettings struct { MemoryReclaimerThreshold *float64 
`json:"memory_reclaimer_threshold,omitempty"` // Threshold 0.0-1.0 (e.g., 0.95 = 95%) // Performance settings - Threads *int `json:"threads,omitempty"` - ContextSize *int `json:"context_size,omitempty"` - F16 *bool `json:"f16,omitempty"` - Debug *bool `json:"debug,omitempty"` + Threads *int `json:"threads,omitempty"` + ContextSize *int `json:"context_size,omitempty"` + F16 *bool `json:"f16,omitempty"` + Debug *bool `json:"debug,omitempty"` + EnableTracing *bool `json:"enable_tracing,omitempty"` + TracingMaxItems *int `json:"tracing_max_items,omitempty"` // Security/CORS settings CORS *bool `json:"cors,omitempty"` diff --git a/core/http/middleware/trace.go b/core/http/middleware/trace.go new file mode 100644 index 000000000000..aa63ba349f37 --- /dev/null +++ b/core/http/middleware/trace.go @@ -0,0 +1,156 @@ +package middleware + +import ( + "bytes" + "github.com/emirpasic/gods/v2/queues/circularbuffer" + "io" + "net/http" + "sort" + "sync" + "time" + + "github.com/labstack/echo/v4" + "github.com/mudler/LocalAI/core/application" + "github.com/mudler/xlog" +) + +type APIExchangeRequest struct { + Method string `json:"method"` + Path string `json:"path"` + Headers *http.Header `json:"headers"` + Body *[]byte `json:"body"` +} + +type APIExchangeResponse struct { + Status int `json:"status"` + Headers *http.Header `json:"headers"` + Body *[]byte `json:"body"` +} + +type APIExchange struct { + Timestamp time.Time `json:"timestamp"` + Request APIExchangeRequest `json:"request"` + Response APIExchangeResponse `json:"response"` +} + +var traceBuffer *circularbuffer.Queue[APIExchange] +var mu sync.Mutex +var logChan = make(chan APIExchange, 100) + +type bodyWriter struct { + http.ResponseWriter + body *bytes.Buffer +} + +func (w *bodyWriter) Write(b []byte) (int, error) { + w.body.Write(b) + return w.ResponseWriter.Write(b) +} + +func (w *bodyWriter) Flush() { + if flusher, ok := w.ResponseWriter.(http.Flusher); ok { + flusher.Flush() + } +} + +// TraceMiddleware intercepts 
and logs JSON API requests and responses +func TraceMiddleware(app *application.Application) echo.MiddlewareFunc { + if app.ApplicationConfig().EnableTracing && traceBuffer == nil { + traceBuffer = circularbuffer.New[APIExchange](app.ApplicationConfig().TracingMaxItems) + + go func() { + for exchange := range logChan { + mu.Lock() + traceBuffer.Enqueue(exchange) + mu.Unlock() + } + }() + } + + return func(next echo.HandlerFunc) echo.HandlerFunc { + return func(c echo.Context) error { + if !app.ApplicationConfig().EnableTracing { + return next(c) + } + + if c.Request().Header.Get("Content-Type") != "application/json" { + return next(c) + } + + body, err := io.ReadAll(c.Request().Body) + if err != nil { + xlog.Error("Failed to read request body") + return err + } + + // Restore the body for downstream handlers + c.Request().Body = io.NopCloser(bytes.NewBuffer(body)) + + startTime := time.Now() + + // Wrap response writer to capture body + resBody := new(bytes.Buffer) + mw := &bodyWriter{ + ResponseWriter: c.Response().Writer, + body: resBody, + } + c.Response().Writer = mw + + err = next(c) + if err != nil { + c.Response().Writer = mw.ResponseWriter // Restore original writer if error + return err + } + + // Create exchange log + requestHeaders := c.Request().Header.Clone() + requestBody := make([]byte, len(body)) + copy(requestBody, body) + responseHeaders := c.Response().Header().Clone() + responseBody := make([]byte, resBody.Len()) + copy(responseBody, resBody.Bytes()) + exchange := APIExchange{ + Timestamp: startTime, + Request: APIExchangeRequest{ + Method: c.Request().Method, + Path: c.Path(), + Headers: &requestHeaders, + Body: &requestBody, + }, + Response: APIExchangeResponse{ + Status: c.Response().Status, + Headers: &responseHeaders, + Body: &responseBody, + }, + } + + select { + case logChan <- exchange: + default: + xlog.Warn("Trace channel full, dropping trace") + } + + return nil + } + } +} + +// GetTraces returns a copy of the logged API exchanges for 
display +func GetTraces() []APIExchange { + mu.Lock() + defer mu.Unlock() + // Guard: traceBuffer is only initialized when tracing is enabled; + // without this check a call with tracing disabled panics on nil. + if traceBuffer == nil { + return nil + } + traces := traceBuffer.Values() + sort.Slice(traces, func(i, j int) bool { + return traces[i].Timestamp.Before(traces[j].Timestamp) + }) + + return traces +} + +// ClearTraces clears the in-memory logs +func ClearTraces() { + mu.Lock() + defer mu.Unlock() + if traceBuffer != nil { + traceBuffer.Clear() + } +} diff --git a/core/http/routes/openai.go b/core/http/routes/openai.go index 921582a6b54b..93fed71dbb59 100644 --- a/core/http/routes/openai.go +++ b/core/http/routes/openai.go @@ -14,16 +14,18 @@ func RegisterOpenAIRoutes(app *echo.Echo, re *middleware.RequestExtractor, application *application.Application) { // openAI compatible API endpoint + traceMiddleware := middleware.TraceMiddleware(application) // realtime // TODO: Modify/disable the API key middleware for this endpoint to allow ephemeral keys created by sessions app.GET("/v1/realtime", openai.Realtime(application)) - app.POST("/v1/realtime/sessions", openai.RealtimeTranscriptionSession(application)) - app.POST("/v1/realtime/transcription_session", openai.RealtimeTranscriptionSession(application)) + app.POST("/v1/realtime/sessions", openai.RealtimeTranscriptionSession(application), traceMiddleware) + app.POST("/v1/realtime/transcription_session", openai.RealtimeTranscriptionSession(application), traceMiddleware) // chat chatHandler := openai.ChatEndpoint(application.ModelConfigLoader(), application.ModelLoader(), application.TemplatesEvaluator(), application.ApplicationConfig()) chatMiddleware := []echo.MiddlewareFunc{ + traceMiddleware, re.BuildFilteredFirstAvailableDefaultModel(config.BuildUsecaseFilterFn(config.FLAG_CHAT)), re.SetModelAndConfig(func() schema.LocalAIRequest { return new(schema.OpenAIRequest) }), func(next echo.HandlerFunc) echo.HandlerFunc { @@ -41,6 +43,7 @@ func RegisterOpenAIRoutes(app *echo.Echo, // edit editHandler := openai.EditEndpoint(application.ModelConfigLoader(), application.ModelLoader(), application.TemplatesEvaluator(),
application.ApplicationConfig()) editMiddleware := []echo.MiddlewareFunc{ + traceMiddleware, re.BuildFilteredFirstAvailableDefaultModel(config.BuildUsecaseFilterFn(config.FLAG_EDIT)), re.BuildConstantDefaultModelNameMiddleware("gpt-4o"), re.SetModelAndConfig(func() schema.LocalAIRequest { return new(schema.OpenAIRequest) }), @@ -59,6 +62,7 @@ func RegisterOpenAIRoutes(app *echo.Echo, // completion completionHandler := openai.CompletionEndpoint(application.ModelConfigLoader(), application.ModelLoader(), application.TemplatesEvaluator(), application.ApplicationConfig()) completionMiddleware := []echo.MiddlewareFunc{ + traceMiddleware, re.BuildFilteredFirstAvailableDefaultModel(config.BuildUsecaseFilterFn(config.FLAG_COMPLETION)), re.BuildConstantDefaultModelNameMiddleware("gpt-4o"), re.SetModelAndConfig(func() schema.LocalAIRequest { return new(schema.OpenAIRequest) }), @@ -78,6 +82,7 @@ func RegisterOpenAIRoutes(app *echo.Echo, // MCPcompletion mcpCompletionHandler := openai.MCPCompletionEndpoint(application.ModelConfigLoader(), application.ModelLoader(), application.TemplatesEvaluator(), application.ApplicationConfig()) mcpCompletionMiddleware := []echo.MiddlewareFunc{ + traceMiddleware, re.BuildFilteredFirstAvailableDefaultModel(config.BuildUsecaseFilterFn(config.FLAG_CHAT)), re.SetModelAndConfig(func() schema.LocalAIRequest { return new(schema.OpenAIRequest) }), func(next echo.HandlerFunc) echo.HandlerFunc { @@ -95,6 +100,7 @@ func RegisterOpenAIRoutes(app *echo.Echo, // embeddings embeddingHandler := openai.EmbeddingsEndpoint(application.ModelConfigLoader(), application.ModelLoader(), application.ApplicationConfig()) embeddingMiddleware := []echo.MiddlewareFunc{ + traceMiddleware, re.BuildFilteredFirstAvailableDefaultModel(config.BuildUsecaseFilterFn(config.FLAG_EMBEDDINGS)), re.BuildConstantDefaultModelNameMiddleware("gpt-4o"), re.SetModelAndConfig(func() schema.LocalAIRequest { return new(schema.OpenAIRequest) }), @@ -113,6 +119,7 @@ func 
RegisterOpenAIRoutes(app *echo.Echo, audioHandler := openai.TranscriptEndpoint(application.ModelConfigLoader(), application.ModelLoader(), application.ApplicationConfig()) audioMiddleware := []echo.MiddlewareFunc{ + traceMiddleware, re.BuildFilteredFirstAvailableDefaultModel(config.BuildUsecaseFilterFn(config.FLAG_TRANSCRIPT)), re.SetModelAndConfig(func() schema.LocalAIRequest { return new(schema.OpenAIRequest) }), func(next echo.HandlerFunc) echo.HandlerFunc { @@ -130,6 +137,7 @@ func RegisterOpenAIRoutes(app *echo.Echo, audioSpeechHandler := localai.TTSEndpoint(application.ModelConfigLoader(), application.ModelLoader(), application.ApplicationConfig()) audioSpeechMiddleware := []echo.MiddlewareFunc{ + traceMiddleware, re.BuildFilteredFirstAvailableDefaultModel(config.BuildUsecaseFilterFn(config.FLAG_TTS)), re.SetModelAndConfig(func() schema.LocalAIRequest { return new(schema.TTSRequest) }), } @@ -140,6 +148,7 @@ func RegisterOpenAIRoutes(app *echo.Echo, // images imageHandler := openai.ImageEndpoint(application.ModelConfigLoader(), application.ModelLoader(), application.ApplicationConfig()) imageMiddleware := []echo.MiddlewareFunc{ + traceMiddleware, // Default: use the first available image generation model re.BuildFilteredFirstAvailableDefaultModel(config.BuildUsecaseFilterFn(config.FLAG_IMAGE)), re.SetModelAndConfig(func() schema.LocalAIRequest { return new(schema.OpenAIRequest) }), @@ -164,6 +173,7 @@ func RegisterOpenAIRoutes(app *echo.Echo, // videos (OpenAI-compatible endpoints mapped to LocalAI video handler) videoHandler := openai.VideoEndpoint(application.ModelConfigLoader(), application.ModelLoader(), application.ApplicationConfig()) videoMiddleware := []echo.MiddlewareFunc{ + traceMiddleware, re.BuildFilteredFirstAvailableDefaultModel(config.BuildUsecaseFilterFn(config.FLAG_VIDEO)), re.SetModelAndConfig(func() schema.LocalAIRequest { return new(schema.OpenAIRequest) }), func(next echo.HandlerFunc) echo.HandlerFunc { diff --git a/core/http/routes/ui.go 
b/core/http/routes/ui.go index 4b852875fa77..da6f5d1ee7f5 100644 --- a/core/http/routes/ui.go +++ b/core/http/routes/ui.go @@ -317,4 +317,15 @@ func RegisterUIRoutes(app *echo.Echo, // Render index return c.Render(200, "views/tts", summary) }) + + // Traces UI (the JSON API for traces lives in RegisterUIAPIRoutes, + // which also enforces the EnableTracing check — do not register it here too) + app.GET("/traces", func(c echo.Context) error { + summary := map[string]interface{}{ + "Title": "LocalAI - Traces", + "BaseURL": middleware.BaseURL(c), + "Version": internal.PrintableVersion(), + } + return c.Render(200, "views/traces", summary) + }) + } diff --git a/core/http/routes/ui_api.go b/core/http/routes/ui_api.go index 36194d5c06c4..84af2e32fe57 100644 --- a/core/http/routes/ui_api.go +++ b/core/http/routes/ui_api.go @@ -16,6 +16,7 @@ import ( "github.com/mudler/LocalAI/core/config" "github.com/mudler/LocalAI/core/gallery" "github.com/mudler/LocalAI/core/http/endpoints/localai" + "github.com/mudler/LocalAI/core/http/middleware" "github.com/mudler/LocalAI/core/p2p" "github.com/mudler/LocalAI/core/services" "github.com/mudler/LocalAI/pkg/model" @@ -947,4 +948,24 @@ func RegisterUIAPIRoutes(app *echo.Echo, cl *config.ModelConfigLoader, ml *model app.GET("/api/settings", localai.GetSettingsEndpoint(applicationInstance)) app.POST("/api/settings", localai.UpdateSettingsEndpoint(applicationInstance)) } + + // Traces API + app.GET("/api/traces", func(c echo.Context) error { + if !appConfig.EnableTracing { + return c.JSON(503, map[string]any{ + "error": "Tracing disabled", + }) + } + traces := middleware.GetTraces() + return c.JSON(200, map[string]interface{}{ + "traces": traces, + }) + }) + + app.POST("/api/traces/clear", func(c echo.Context) error { + middleware.ClearTraces() + return c.JSON(200, map[string]interface{}{ + "message": "Traces cleared", + }) + }) } diff --git
a/core/http/views/partials/navbar.html b/core/http/views/partials/navbar.html index 2afdfa36e13f..cbc092c41a04 100644 --- a/core/http/views/partials/navbar.html +++ b/core/http/views/partials/navbar.html @@ -37,6 +37,9 @@ Agent Jobs + + Traces + API @@ -94,6 +97,9 @@ Agent Jobs + + Traces + API diff --git a/core/http/views/settings.html b/core/http/views/settings.html index c960862a07c5..b06c85a6d965 100644 --- a/core/http/views/settings.html +++ b/core/http/views/settings.html @@ -10,7 +10,7 @@
Time before an idle backend is stopped (e.g., 15m, 1h)
- Automatically stop backends that are busy for too long (stuck processes)Time before a busy backend is stopped (e.g., 5m, 30m)
- Check IntervalHow often the watchdog checks backends and memory usage (e.g., 2s, 30s)
-When memory usage exceeds this, backends will be evicted (50-100%)
Maximum number of models to keep loaded at once (0 = unlimited, 1 = single backend mode). Least recently used models are evicted when limit is reached.
- Enable backends to handle multiple requests in parallel (if supported) @@ -263,7 +263,7 @@Number of threads to use for model inference (0 = auto)
- @@ -273,7 +273,7 @@Default context window size for models
- @@ -286,7 +286,7 @@Enable tracing of requests and responses
+Maximum number of tracing items to keep
+ +Comma-separated list of allowed origins
- @@ -347,7 +373,7 @@Authentication token for P2P network (set to 0 to generate a new token)
- @@ -379,7 +405,7 @@Network identifier for P2P connections
- @@ -391,7 +417,7 @@Number of days to keep job history (default: 30)
- @@ -437,7 +463,7 @@List of API keys (one per line or comma-separated)
- @@ -464,7 +490,7 @@Array of gallery objects with 'url' and 'name' fields
- @@ -497,7 +523,7 @@Array of backend gallery objects with 'url' and 'name' fields
- @@ -521,7 +547,7 @@