gui/pkg/display/ml.go
Snider d54a57e158
Some checks are pending
Security Scan / security (push) Waiting to run
Test / test (push) Waiting to run
Harden display routing and window aliases
2026-04-15 23:03:11 +01:00

73 lines
1.8 KiB
Go

package display
import (
"context"
"os"
"strings"
core "dappco.re/go/core"
"forge.lthn.ai/core/gui/pkg/chat"
)
// ModelRuntimeState is the JSON snapshot of the ML runtime that the display
// layer hands to the frontend: where the API lives, which models exist and
// which are loaded, plus derived VRAM/backend summaries.
type ModelRuntimeState struct {
	// APIURL is the base ML API endpoint (CORE_ML_API_URL or the local default).
	APIURL string `json:"api_url"`
	// Loaded holds only the models currently resident (Loaded == true).
	Loaded []chat.ModelEntry `json:"loaded"`
	// Available holds every model reported by the chat service.
	Available []chat.ModelEntry `json:"available"`
	// VRAMBytes is the summed SizeBytes of loaded models — an estimate, not a
	// live GPU measurement (see estimateVRAM).
	VRAMBytes int64 `json:"vram_bytes"`
	// Backend is the first non-blank backend name among the models, or "local".
	Backend string `json:"backend"`
	// InferenceURL is APIURL plus the OpenAI-compatible chat-completions path.
	InferenceURL string `json:"inference_url"`
}
// modelState assembles a ModelRuntimeState snapshot for the display layer:
// resolves the ML API endpoint, fetches the model list from the chat service,
// and derives the loaded subset plus VRAM/backend summaries.
func (s *Service) modelState() ModelRuntimeState {
	// CORE_ML_API_URL overrides the default local endpoint; trailing slashes
	// are stripped so the path concatenation below stays well-formed.
	apiURL := strings.TrimRight(strings.TrimSpace(os.Getenv("CORE_ML_API_URL")), "/")
	if apiURL == "" {
		apiURL = "http://localhost:8090"
	}
	models := s.chatModels()
	// Pre-size with the known upper bound to avoid append re-allocations;
	// kept non-nil so it encodes as [] rather than null in JSON.
	loaded := make([]chat.ModelEntry, 0, len(models))
	for _, model := range models {
		if model.Loaded {
			loaded = append(loaded, model)
		}
	}
	return ModelRuntimeState{
		APIURL:       apiURL,
		Loaded:       loaded,
		Available:    models,
		VRAMBytes:    estimateVRAM(models),
		Backend:      dominantBackend(models),
		InferenceURL: apiURL + "/v1/chat/completions",
	}
}
// chatModels asks the core action bus for the chat service's model list.
// It is nil-safe: a nil receiver, a missing runtime, or an unexpected action
// result type all yield nil.
func (s *Service) chatModels() []chat.ModelEntry {
	if s == nil || s.ServiceRuntime == nil {
		return nil
	}
	res := s.Core().Action("gui.chat.models").Run(context.Background(), core.NewOptions())
	if entries, ok := res.Value.([]chat.ModelEntry); ok {
		return entries
	}
	// Value was absent or of another type; treat as "no models".
	return nil
}
// estimateVRAM sums the on-disk sizes of all loaded models as a rough proxy
// for VRAM consumption; it is not a live GPU measurement.
func estimateVRAM(models []chat.ModelEntry) int64 {
	var sum int64
	for i := range models {
		if !models[i].Loaded {
			continue
		}
		sum += models[i].SizeBytes
	}
	return sum
}
// dominantBackend picks a representative backend name: the first model whose
// Backend field is non-blank wins (returned untrimmed), otherwise "local".
func dominantBackend(models []chat.ModelEntry) string {
	for i := range models {
		if backend := models[i].Backend; strings.TrimSpace(backend) != "" {
			return backend
		}
	}
	return "local"
}
// jsEscaper rewrites the characters that would terminate or corrupt a
// double-quoted JavaScript string literal. strings.NewReplacer performs a
// single pass (no re-scanning of already-inserted escapes) and is compiled
// once here; a Replacer is safe for concurrent use.
var jsEscaper = strings.NewReplacer(
	`\`, `\\`,
	"\n", `\n`,
	"\r", `\r`, // previously unescaped: a raw CR breaks the JS literal on CRLF input
	`"`, `\"`,
)

// quoteJS returns value wrapped in double quotes with backslashes, quotes,
// and line breaks escaped so it can be embedded inside inline JavaScript.
// NOTE(review): U+2028/U+2029 remain unescaped; they are line terminators in
// classic JS string literals — confirm consumers only target environments
// (ES2019+) where they are legal inside strings.
func quoteJS(value string) string {
	return `"` + jsEscaper.Replace(value) + `"`
}