feat: port 11 LEM data management commands into core ml
Ports all remaining LEM pipeline commands from pkg/lem into core ml,
eliminating the standalone LEM CLI dependency. Each command is split
into reusable business logic (pkg/ml/) and a thin cobra wrapper
(internal/cmd/ml/).
New commands: query, inventory, metrics, ingest, normalize, seed-influx,
consolidate, import-all, approve, publish, coverage.
Adds Path(), Exec(), QueryRowScan() convenience methods to DB type.
Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
2026-02-16 04:02:28 +00:00
|
|
|
package ml
|
|
|
|
|
|
|
|
|
|
import (
|
|
|
|
|
"fmt"
|
|
|
|
|
"os"
|
|
|
|
|
|
2026-02-16 14:24:37 +00:00
|
|
|
"forge.lthn.ai/core/go/pkg/cli"
|
|
|
|
|
"forge.lthn.ai/core/go/pkg/ml"
|
feat: port 11 LEM data management commands into core ml
Ports all remaining LEM pipeline commands from pkg/lem into core ml,
eliminating the standalone LEM CLI dependency. Each command is split
into reusable business logic (pkg/ml/) and a thin cobra wrapper
(internal/cmd/ml/).
New commands: query, inventory, metrics, ingest, normalize, seed-influx,
consolidate, import-all, approve, publish, coverage.
Adds Path(), Exec(), QueryRowScan() convenience methods to DB type.
Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
2026-02-16 04:02:28 +00:00
|
|
|
)
|
|
|
|
|
|
|
|
|
|
var seedInfluxCmd = &cli.Command{
|
|
|
|
|
Use: "seed-influx",
|
|
|
|
|
Short: "Seed InfluxDB golden_gen from DuckDB golden_set",
|
|
|
|
|
Long: "One-time migration: batch-loads DuckDB golden_set records into InfluxDB golden_gen measurement.",
|
|
|
|
|
RunE: runSeedInflux,
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// Flag storage for the seed-influx command; both values are bound to their
// command-line flags in init.
var (
	// seedInfluxBatchSize receives the value of --batch-size.
	seedInfluxBatchSize int
	// seedInfluxForce receives the value of --force.
	seedInfluxForce bool
)
|
|
|
|
|
|
|
|
|
|
func init() {
|
|
|
|
|
seedInfluxCmd.Flags().BoolVar(&seedInfluxForce, "force", false, "Re-seed even if InfluxDB already has data")
|
|
|
|
|
seedInfluxCmd.Flags().IntVar(&seedInfluxBatchSize, "batch-size", 500, "Lines per InfluxDB write batch")
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
func runSeedInflux(cmd *cli.Command, args []string) error {
|
|
|
|
|
path := dbPath
|
|
|
|
|
if path == "" {
|
|
|
|
|
path = os.Getenv("LEM_DB")
|
|
|
|
|
}
|
|
|
|
|
if path == "" {
|
|
|
|
|
return fmt.Errorf("--db or LEM_DB required")
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
db, err := ml.OpenDB(path)
|
|
|
|
|
if err != nil {
|
|
|
|
|
return fmt.Errorf("open db: %w", err)
|
|
|
|
|
}
|
|
|
|
|
defer db.Close()
|
|
|
|
|
|
|
|
|
|
influx := ml.NewInfluxClient(influxURL, influxDB)
|
|
|
|
|
|
|
|
|
|
return ml.SeedInflux(db, influx, ml.SeedInfluxConfig{
|
|
|
|
|
Force: seedInfluxForce,
|
|
|
|
|
BatchSize: seedInfluxBatchSize,
|
|
|
|
|
}, os.Stdout)
|
|
|
|
|
}
|