54 lines
1.2 KiB
Go
54 lines
1.2 KiB
Go
|
|
package ml
|
||
|
|
|
||
|
|
import (
|
||
|
|
"fmt"
|
||
|
|
"os"
|
||
|
|
"path/filepath"
|
||
|
|
|
||
|
|
"forge.lthn.ai/core/cli/pkg/cli"
|
||
|
|
"forge.lthn.ai/core/cli/pkg/ml"
|
||
|
|
)
|
||
|
|
|
||
|
|
var (
|
||
|
|
approveOutput string
|
||
|
|
approveThreshold float64
|
||
|
|
)
|
||
|
|
|
||
|
|
var approveCmd = &cli.Command{
|
||
|
|
Use: "approve",
|
||
|
|
Short: "Filter scored expansions into training JSONL",
|
||
|
|
Long: "Filters scored expansion responses by quality threshold and exports approved ones as chat-format training JSONL.",
|
||
|
|
RunE: runApprove,
|
||
|
|
}
|
||
|
|
|
||
|
|
func init() {
|
||
|
|
approveCmd.Flags().StringVar(&approveOutput, "output", "", "Output JSONL file (defaults to expansion-approved.jsonl in db dir)")
|
||
|
|
approveCmd.Flags().Float64Var(&approveThreshold, "threshold", 6.0, "Min judge average to approve")
|
||
|
|
}
|
||
|
|
|
||
|
|
func runApprove(cmd *cli.Command, args []string) error {
|
||
|
|
path := dbPath
|
||
|
|
if path == "" {
|
||
|
|
path = os.Getenv("LEM_DB")
|
||
|
|
}
|
||
|
|
if path == "" {
|
||
|
|
return fmt.Errorf("--db or LEM_DB required")
|
||
|
|
}
|
||
|
|
|
||
|
|
output := approveOutput
|
||
|
|
if output == "" {
|
||
|
|
output = filepath.Join(filepath.Dir(path), "expansion-approved.jsonl")
|
||
|
|
}
|
||
|
|
|
||
|
|
db, err := ml.OpenDB(path)
|
||
|
|
if err != nil {
|
||
|
|
return fmt.Errorf("open db: %w", err)
|
||
|
|
}
|
||
|
|
defer db.Close()
|
||
|
|
|
||
|
|
return ml.ApproveExpansions(db, ml.ApproveConfig{
|
||
|
|
Output: output,
|
||
|
|
Threshold: approveThreshold,
|
||
|
|
}, cmd.OutOrStdout())
|
||
|
|
}
|