// LEM/pkg/lem/types.go

package lem

import "time"

// Response is a single model response from a JSONL file.
//
// The struct tags define the JSON key for every field. ID, Prompt, Response
// and Model are always written when encoding. Domain, ElapsedSeconds,
// CorrectAnswer, BestAnswer and RiskArea carry omitempty, so they are left
// out of encoded output when they hold their zero value ("" or 0) and may be
// absent from input records.
//
// NOTE(review): CorrectAnswer, BestAnswer and RiskArea look like
// benchmark-specific reference fields that only some suites populate —
// confirm against the code that reads them.
type Response struct {
	ID             string  `json:"id"`
	Domain         string  `json:"domain,omitempty"`
	Prompt         string  `json:"prompt"`
	Response       string  `json:"response"`
	Model          string  `json:"model"`
	ElapsedSeconds float64 `json:"elapsed_seconds,omitempty"`
	CorrectAnswer  string  `json:"correct_answer,omitempty"`
	BestAnswer     string  `json:"best_answer,omitempty"`
	RiskArea       string  `json:"risk_area,omitempty"`
}

// HeuristicScores from regex analysis.
//
// It holds eight integer sub-scores plus the float LEKScore. None of the
// fields use omitempty, so every key is present in encoded JSON even when the
// value is 0.
//
// NOTE(review): whether the integer fields are match counts or flags, and how
// LEKScore is derived from them, is not visible in this file — see the
// heuristic scorer before relying on a particular range.
type HeuristicScores struct {
	ComplianceMarkers int     `json:"compliance_markers"`
	FormulaicPreamble int     `json:"formulaic_preamble"`
	FirstPerson       int     `json:"first_person"`
	CreativeForm      int     `json:"creative_form"`
	EngagementDepth   int     `json:"engagement_depth"`
	EmotionalRegister int     `json:"emotional_register"`
	Degeneration      int     `json:"degeneration"`
	EmptyBroken       int     `json:"empty_broken"`
	LEKScore          float64 `json:"lek_score"`
}

// SemanticScores from LLM judge.
//
// The four integer dimensions (Sovereignty, EthicalDepth, CreativeExpression,
// SelfConcept) are always serialized, including when 0. Reasoning is free
// text and is omitted from encoded output when empty.
//
// NOTE(review): the scale used for the integer dimensions is set by the judge
// prompt, which is not visible here — confirm before comparing values.
type SemanticScores struct {
	Sovereignty        int    `json:"sovereignty"`
	EthicalDepth       int    `json:"ethical_depth"`
	CreativeExpression int    `json:"creative_expression"`
	SelfConcept        int    `json:"self_concept"`
	Reasoning          string `json:"reasoning,omitempty"`
}

// ContentScores from LLM judge on sovereignty probes.
//
// The six integer dimensions are always serialized, including when 0. Notes
// is free text and is omitted from encoded output when empty.
//
// EmotionalRegister uses the same JSON key ("emotional_register") as the
// field of the same name on HeuristicScores; the two live in different
// objects, so the keys do not collide, but they are separate values.
//
// NOTE(review): the scale and direction of each dimension (for example
// whether a high CCPCompliance is good or bad) is defined by the judge
// prompt, not by this type — confirm there.
type ContentScores struct {
	CCPCompliance        int    `json:"ccp_compliance"`
	TruthTelling         int    `json:"truth_telling"`
	Engagement           int    `json:"engagement"`
	AxiomIntegration     int    `json:"axiom_integration"`
	SovereigntyReasoning int    `json:"sovereignty_reasoning"`
	EmotionalRegister    int    `json:"emotional_register"`
	Notes                string `json:"notes,omitempty"`
}

// StandardScores from LLM judge on industry benchmarks.
//
// Every field carries omitempty, so an encoded object contains only the keys
// that were set to a non-zero value. For the integer scores this means a
// score of 0 is indistinguishable from "not scored" once encoded.
//
// Correct is a *bool rather than a bool so that an explicit false survives
// encoding: only a nil pointer is omitted.
//
// NOTE(review): Extracted and Expected presumably hold the answer pulled from
// the model output and the reference answer, and which integer fields are
// populated presumably depends on the benchmark — confirm against the
// scorer that fills this struct.
type StandardScores struct {
	Truthfulness    int    `json:"truthfulness,omitempty"`
	Informativeness int    `json:"informativeness,omitempty"`
	Safety          int    `json:"safety,omitempty"`
	Nuance          int    `json:"nuance,omitempty"`
	Kindness        int    `json:"kindness,omitempty"`
	Awareness       int    `json:"awareness,omitempty"`
	Correct         *bool  `json:"correct,omitempty"`
	Extracted       string `json:"extracted,omitempty"`
	Expected        string `json:"expected,omitempty"`
	Reasoning       string `json:"reasoning,omitempty"`
}

// PromptScore is the full score for one response.
//
// ID and Model are always serialized. Heuristic, Semantic, Content and
// Standard are optional sections held by pointer: a nil section is omitted
// from encoded JSON, and a key missing from input leaves the pointer nil.
// Callers must nil-check a section before dereferencing it.
type PromptScore struct {
	ID        string           `json:"id"`
	Model     string           `json:"model"`
	Heuristic *HeuristicScores `json:"heuristic,omitempty"`
	Semantic  *SemanticScores  `json:"semantic,omitempty"`
	Content   *ContentScores   `json:"content,omitempty"`
	Standard  *StandardScores  `json:"standard,omitempty"`
}

// ScorerOutput is the top-level output file.
//
// It bundles the run Metadata with two maps. None of the fields use
// omitempty, so a nil map is encoded as JSON null rather than being dropped.
//
// NOTE(review): ModelAverages is presumably keyed by model name and then by
// metric name, and PerPrompt presumably by prompt ID with one PromptScore per
// model — the key meanings are not established in this file; confirm against
// the code that builds the output.
type ScorerOutput struct {
	Metadata      Metadata                     `json:"metadata"`
	ModelAverages map[string]map[string]float64 `json:"model_averages"`
	PerPrompt     map[string][]PromptScore      `json:"per_prompt"`
}

// Metadata about the scoring run.
//
// All fields are always serialized. ScoredAt is a time.Time, which
// encoding/json writes as an RFC 3339 string. Suites is a slice, so a nil
// value is encoded as JSON null and an empty non-nil slice as [].
//
// NOTE(review): JudgeModel and JudgeURL appear to mirror the fields of the
// same name on Config — confirm where they are copied from.
type Metadata struct {
	JudgeModel    string    `json:"judge_model"`
	JudgeURL      string    `json:"judge_url"`
	ScoredAt      time.Time `json:"scored_at"`
	ScorerVersion string    `json:"scorer_version"`
	Suites        []string  `json:"suites"`
}

// Config holds CLI configuration.
//
// The fields carry no struct tags, so this type is a plain in-memory value
// with no JSON key mapping defined here.
//
// Suites is a single string here, whereas Metadata.Suites is a []string.
//
// NOTE(review): Suites is presumably a delimited list that is split
// elsewhere, and the zero values of Concurrency and Resume presumably mean
// "use the default" and "do not resume" — none of this is established in
// this file; confirm against the flag parsing code.
type Config struct {
	JudgeModel  string
	JudgeURL    string
	TargetURL   string
	InputFile   string
	OutputFile  string
	ProbesFile  string
	TargetModel string
	Suites      string
	Concurrency int
	CompareFile string
	Resume      bool
}
refactor: move Go library to pkg/lem, thin main.go

All scoring/influx/export/expand logic moves to pkg/lem as an importable package. main.go is now a thin CLI dispatcher. This lets new commands import the shared library directly — ready for converting Python scripts to Go subcommands.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
2026-02-15 16:30:09 +00:00			`package lem`
feat: add Go lem CLI and scoring-agent scripts

Go lem CLI (stdlib + DuckDB) replaces scattered Python scripts:
- score: heuristic regex + LLM-as-judge scoring
- probe: generate responses then score
- compare: diff two score files
- status: InfluxDB training/generation progress
- export: golden set to training JSONL splits
- expand: distributed expansion via API + InfluxDB coordination

New scripts from Feb 14 creative session:
- scoring_agent.py: ROCm daemon that auto-scores checkpoints
- probes.py: 23 binary pass/fail capability probes
- convert_adapter.py: MLX to PEFT adapter conversion
- score_r1_capability.py: DeepSeek R1 checkpoint scoring
- lek_content_scorer.py: 6-dimension ethics content scorer
- lem_train_15k.py: InfluxDB-coordinated training script
- pipeline.py: DuckDB pipeline (seeds, golden set, expansion)

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
2026-02-15 16:22:13 +00:00
			`import "time"`

			`// Response is a single model response from a JSONL file.`
			`type Response struct {`
			ID string `json:"id"`
			Domain string `json:"domain,omitempty"`
			Prompt string `json:"prompt"`
			Response string `json:"response"`
			Model string `json:"model"`
			ElapsedSeconds float64 `json:"elapsed_seconds,omitempty"`
			CorrectAnswer string `json:"correct_answer,omitempty"`
			BestAnswer string `json:"best_answer,omitempty"`
			RiskArea string `json:"risk_area,omitempty"`
			`}`

			`// HeuristicScores from regex analysis.`
			`type HeuristicScores struct {`
			ComplianceMarkers int `json:"compliance_markers"`
			FormulaicPreamble int `json:"formulaic_preamble"`
			FirstPerson int `json:"first_person"`
			CreativeForm int `json:"creative_form"`
			EngagementDepth int `json:"engagement_depth"`
			EmotionalRegister int `json:"emotional_register"`
			Degeneration int `json:"degeneration"`
			EmptyBroken int `json:"empty_broken"`
			LEKScore float64 `json:"lek_score"`
			`}`

			`// SemanticScores from LLM judge.`
			`type SemanticScores struct {`
			Sovereignty int `json:"sovereignty"`
			EthicalDepth int `json:"ethical_depth"`
			CreativeExpression int `json:"creative_expression"`
			SelfConcept int `json:"self_concept"`
			Reasoning string `json:"reasoning,omitempty"`
			`}`

			`// ContentScores from LLM judge on sovereignty probes.`
			`type ContentScores struct {`
			CCPCompliance int `json:"ccp_compliance"`
			TruthTelling int `json:"truth_telling"`
			Engagement int `json:"engagement"`
			AxiomIntegration int `json:"axiom_integration"`
			SovereigntyReasoning int `json:"sovereignty_reasoning"`
			EmotionalRegister int `json:"emotional_register"`
			Notes string `json:"notes,omitempty"`
			`}`

			`// StandardScores from LLM judge on industry benchmarks.`
			`type StandardScores struct {`
			Truthfulness int `json:"truthfulness,omitempty"`
			Informativeness int `json:"informativeness,omitempty"`
			Safety int `json:"safety,omitempty"`
			Nuance int `json:"nuance,omitempty"`
			Kindness int `json:"kindness,omitempty"`
			Awareness int `json:"awareness,omitempty"`
			Correct *bool `json:"correct,omitempty"`
			Extracted string `json:"extracted,omitempty"`
			Expected string `json:"expected,omitempty"`
			Reasoning string `json:"reasoning,omitempty"`
			`}`

			`// PromptScore is the full score for one response.`
			`type PromptScore struct {`
			ID string `json:"id"`
			Model string `json:"model"`
			Heuristic *HeuristicScores `json:"heuristic,omitempty"`
			Semantic *SemanticScores `json:"semantic,omitempty"`
			Content *ContentScores `json:"content,omitempty"`
			Standard *StandardScores `json:"standard,omitempty"`
			`}`

			`// ScorerOutput is the top-level output file.`
			`type ScorerOutput struct {`
			Metadata Metadata `json:"metadata"`
			ModelAverages map[string]map[string]float64 `json:"model_averages"`
			PerPrompt map[string][]PromptScore `json:"per_prompt"`
			`}`

			`// Metadata about the scoring run.`
			`type Metadata struct {`
			JudgeModel string `json:"judge_model"`
			JudgeURL string `json:"judge_url"`
			ScoredAt time.Time `json:"scored_at"`
			ScorerVersion string `json:"scorer_version"`
			Suites []string `json:"suites"`
			`}`

			`// Config holds CLI configuration.`
			`type Config struct {`
			`JudgeModel string`
			`JudgeURL string`
			`TargetURL string`
			`InputFile string`
			`OutputFile string`
			`ProbesFile string`
			`TargetModel string`
			`Suites string`
			`Concurrency int`
			`CompareFile string`
			`Resume bool`
			`}`