feat: infrastructure packages and lint cleanup (#281)
* ci: consolidate duplicate workflows and merge CodeQL configs
Remove 17 duplicate workflow files that were split copies of the
combined originals. Each family (CI, CodeQL, Coverage, PR Build,
Alpha Release) had the same job duplicated across separate
push/pull_request/schedule/manual trigger files.
Merge codeql.yml and codescan.yml into a single codeql.yml with
a language matrix covering go, javascript-typescript, python,
and actions — matching the previous default setup coverage.
Remaining workflows (one per family):
- ci.yml (push + PR + manual)
- codeql.yml (push + PR + schedule, all languages)
- coverage.yml (push + PR + manual)
- alpha-release.yml (push + manual)
- pr-build.yml (PR + manual)
- release.yml (tag push)
- agent-verify.yml, auto-label.yml, auto-project.yml
Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
* feat: add collect, config, crypt, plugin packages and fix all lint issues
Add four new infrastructure packages with CLI commands:
- pkg/config: layered configuration (defaults → file → env → flags)
- pkg/crypt: crypto primitives (Argon2id, AES-GCM, ChaCha20, HMAC, checksums)
- pkg/plugin: plugin system with GitHub-based install/update/remove
- pkg/collect: collection subsystem (GitHub, BitcoinTalk, market, papers, excavate)
Fix all golangci-lint issues across the entire codebase (~100 errcheck,
staticcheck SA1012/SA1019/ST1005, unused, ineffassign fixes) so that
`core go qa` passes with 0 issues.
Closes #167, #168, #170, #250, #251, #252, #253, #254, #255, #256
Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---------
Co-authored-by: Claude Opus 4.5 <noreply@anthropic.com>
2026-02-04 11:34:43 +00:00
|
|
|
package collect
|
|
|
|
|
|
|
|
|
|
import (
|
|
|
|
|
"encoding/json"
|
|
|
|
|
"sync"
|
|
|
|
|
"time"
|
|
|
|
|
|
2026-02-16 00:30:41 +00:00
|
|
|
core "forge.lthn.ai/core/cli/pkg/framework/core"
|
|
|
|
|
"forge.lthn.ai/core/cli/pkg/io"
|
feat: infrastructure packages and lint cleanup (#281)
* ci: consolidate duplicate workflows and merge CodeQL configs
Remove 17 duplicate workflow files that were split copies of the
combined originals. Each family (CI, CodeQL, Coverage, PR Build,
Alpha Release) had the same job duplicated across separate
push/pull_request/schedule/manual trigger files.
Merge codeql.yml and codescan.yml into a single codeql.yml with
a language matrix covering go, javascript-typescript, python,
and actions — matching the previous default setup coverage.
Remaining workflows (one per family):
- ci.yml (push + PR + manual)
- codeql.yml (push + PR + schedule, all languages)
- coverage.yml (push + PR + manual)
- alpha-release.yml (push + manual)
- pr-build.yml (PR + manual)
- release.yml (tag push)
- agent-verify.yml, auto-label.yml, auto-project.yml
Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
* feat: add collect, config, crypt, plugin packages and fix all lint issues
Add four new infrastructure packages with CLI commands:
- pkg/config: layered configuration (defaults → file → env → flags)
- pkg/crypt: crypto primitives (Argon2id, AES-GCM, ChaCha20, HMAC, checksums)
- pkg/plugin: plugin system with GitHub-based install/update/remove
- pkg/collect: collection subsystem (GitHub, BitcoinTalk, market, papers, excavate)
Fix all golangci-lint issues across the entire codebase (~100 errcheck,
staticcheck SA1012/SA1019/ST1005, unused, ineffassign fixes) so that
`core go qa` passes with 0 issues.
Closes #167, #168, #170, #250, #251, #252, #253, #254, #255, #256
Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---------
Co-authored-by: Claude Opus 4.5 <noreply@anthropic.com>
2026-02-04 11:34:43 +00:00
|
|
|
)
|
|
|
|
|
|
|
|
|
|
// State tracks collection progress for incremental runs.
|
|
|
|
|
// It persists entries to disk so that subsequent runs can resume
|
|
|
|
|
// where they left off.
|
|
|
|
|
type State struct {
|
|
|
|
|
mu sync.Mutex
|
|
|
|
|
medium io.Medium
|
|
|
|
|
path string
|
|
|
|
|
entries map[string]*StateEntry
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// StateEntry is the progress record kept for a single source. It is the
// value type serialised to JSON in the state file.
type StateEntry struct {
	// Source names the collector this record belongs to.
	Source string `json:"source"`

	// LastRun is when the source last completed a successful run.
	LastRun time.Time `json:"last_run"`

	// LastID is an opaque identifier of the most recently processed item.
	// It is omitted from the JSON output when empty.
	LastID string `json:"last_id,omitempty"`

	// Items is the running total of items collected for this source.
	Items int `json:"items"`

	// Cursor is an opaque pagination cursor used to resume a run.
	// It is omitted from the JSON output when empty.
	Cursor string `json:"cursor,omitempty"`
}
|
|
|
|
|
|
|
|
|
|
// NewState creates a state tracker that persists to the given path
|
|
|
|
|
// using the provided storage medium.
|
|
|
|
|
func NewState(m io.Medium, path string) *State {
|
|
|
|
|
return &State{
|
|
|
|
|
medium: m,
|
|
|
|
|
path: path,
|
|
|
|
|
entries: make(map[string]*StateEntry),
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// Load reads state from disk. If the file does not exist, the state
|
|
|
|
|
// is initialised as empty without error.
|
|
|
|
|
func (s *State) Load() error {
|
|
|
|
|
s.mu.Lock()
|
|
|
|
|
defer s.mu.Unlock()
|
|
|
|
|
|
|
|
|
|
if !s.medium.IsFile(s.path) {
|
|
|
|
|
return nil
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
data, err := s.medium.Read(s.path)
|
|
|
|
|
if err != nil {
|
|
|
|
|
return core.E("collect.State.Load", "failed to read state file", err)
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
var entries map[string]*StateEntry
|
|
|
|
|
if err := json.Unmarshal([]byte(data), &entries); err != nil {
|
|
|
|
|
return core.E("collect.State.Load", "failed to parse state file", err)
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if entries == nil {
|
|
|
|
|
entries = make(map[string]*StateEntry)
|
|
|
|
|
}
|
|
|
|
|
s.entries = entries
|
|
|
|
|
return nil
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// Save writes state to disk.
|
|
|
|
|
func (s *State) Save() error {
|
|
|
|
|
s.mu.Lock()
|
|
|
|
|
defer s.mu.Unlock()
|
|
|
|
|
|
|
|
|
|
data, err := json.MarshalIndent(s.entries, "", " ")
|
|
|
|
|
if err != nil {
|
|
|
|
|
return core.E("collect.State.Save", "failed to marshal state", err)
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if err := s.medium.Write(s.path, string(data)); err != nil {
|
|
|
|
|
return core.E("collect.State.Save", "failed to write state file", err)
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return nil
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// Get returns a copy of the state for a source. The second return value
|
|
|
|
|
// indicates whether the entry was found.
|
|
|
|
|
func (s *State) Get(source string) (*StateEntry, bool) {
|
|
|
|
|
s.mu.Lock()
|
|
|
|
|
defer s.mu.Unlock()
|
|
|
|
|
entry, ok := s.entries[source]
|
|
|
|
|
if !ok {
|
|
|
|
|
return nil, false
|
|
|
|
|
}
|
|
|
|
|
// Return a copy to avoid callers mutating internal state.
|
|
|
|
|
cp := *entry
|
|
|
|
|
return &cp, true
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// Set updates state for a source.
|
|
|
|
|
func (s *State) Set(source string, entry *StateEntry) {
|
|
|
|
|
s.mu.Lock()
|
|
|
|
|
defer s.mu.Unlock()
|
|
|
|
|
s.entries[source] = entry
|
|
|
|
|
}
|