chore: snapshot working tree - pty_exited notifications + in-flight inference WIP

feat(booterm): add structured pty_exited WS notifications. The plan and implementation are validated and code review is green (contracts build is clean, contracts tests pass 29/29, booterm and web typecheck are clean).

wip: inference/provider refactor still in progress (agents.ts, provider.ts, new llama-providers.ts, llama-args-validator removed), plus changes to arena, dispatcher, compaction, and schema.

openspec: pty-exit-notifications complete; x-agent-flags planned (not yet implemented).
This commit is contained in:
2026-06-14 12:48:47 +00:00
parent 0ed506f1da
commit b18de2a331
204 changed files with 25344 additions and 867 deletions

View File

@@ -137,6 +137,173 @@
- items_completed: integer (required)
- metadata: jsonb
### control_hosts
- provider_id: text (pk, fk)
- ssh_host: text
- ssh_user: text
- ssh_key_path: text
- config_path: text
- restart_cmd: text
- os: text
- gpu_label: text
- enabled: boolean (required)
### control_requests
- id: bigint(auto) (pk)
- provider_id: text (required, fk)
- swap_entry_id: integer (required, fk)
- ts: timestamp(tz) (required)
- model: text
- req_path: text
- status_code: integer
- duration_ms: integer
- cache_tokens: integer
- input_tokens: integer
- output_tokens: integer
- prompt_tps: real
- gen_tps: real
- has_capture: boolean (required)
- capture: jsonb
### control_perf_samples
- provider_id: text (required, fk)
- ts: timestamp(tz) (required)
- gpu: jsonb
- sys: jsonb
### control_perf_rollup_5m
- provider_id: text (required, fk)
- bucket: timestamp(tz) (required)
- gpu_agg: jsonb
- sys_agg: jsonb
### control_model_events
- provider_id: text (required, fk)
- model: text (required)
- state: text (required)
- ts: timestamp(tz) (required)
- detail: jsonb
### bench_suites
- id: text (pk)
- name: text (required)
- provider_id: text (required, fk)
- model: text (required)
- repetitions: integer (required)
- metadata: jsonb
### bench_runs
- id: text (pk)
- suite_id: text (required, fk)
- job_type: text (required)
- status: text (required)
- started_at: timestamp(tz)
- finished_at: timestamp(tz)
- total_samples: integer (required)
- completed_samples: integer (required)
- concurrent_foreign_requests: integer (required)
- temperature: real
- top_p: real
- aggregate: jsonb
- regression_flag: text
- error: text
### bench_samples
- id: bigint(auto) (pk)
- run_id: text (required, fk)
- prompt_tokens: integer (required)
- gen_tokens: integer (required)
- concurrency: integer (required)
- repetition: integer (required)
- ttft_ms: real
- total_ms: real
- prompt_tps: real
- gen_tps: real
- cache_n: integer
- error: text
### bench_baselines
- provider_id: text (required, fk)
- model: text (required)
- aggregate: jsonb (required)
- run_id: text (required, fk)
### eval_suites
- id: text (pk)
- name: text (required)
- kind: text (required)
- version: integer (required)
- tasks: jsonb (required)
- judge_model: text
- judge_model_version: text
- metadata: jsonb
### eval_runs
- id: text (pk)
- suite_id: text (required, fk)
- job_type: text (required)
- provider_id: text (required, fk)
- model: text (required)
- quant: text
- status: text (required)
- judge_model: text
- judge_model_version: text
- started_at: timestamp(tz)
- finished_at: timestamp(tz)
- total_tasks: integer (required)
- completed_tasks: integer (required)
- aggregate: jsonb
- error: text
### eval_results
- id: bigint(auto) (pk)
- run_id: text (required, fk)
- task_id: text (required, fk)
- task_index: integer (required)
- score: real
- max_score: real
- rationale: text
- sandbox_exit_code: integer
- sandbox_stderr: text
- sandbox_stdout: text
- execution_ms: integer
- error: text
### control_reports
- id: text (pk)
- kind: text (required)
- interval: text (required)
- period_start: timestamp(tz) (required)
- period_end: timestamp(tz) (required)
- markdown: text (required)
- stats: jsonb
### control_schedule_meta
- name: text (pk)
- interval: text (required)
- enabled: boolean (required)
- last_run_at: timestamp(tz)
### route_policies
- id: text (pk)
- name: text (required)
- virtual_model: text (required)
- candidates: jsonb (required)
- fallback: text
- enabled: boolean (required)
### route_dispatch_log
- id: bigint(auto) (pk)
- ts: timestamp(tz) (required)
- virtual_model: text (required)
- chosen_provider_id: text (fk)
- chosen_model: text
- candidates_tried: jsonb
- status: text (required)
- source: text
- error: text
- duration_ms: integer
### projects
- id: uuid (pk)
- name: text (required)
@@ -215,3 +382,12 @@
- turn_number: integer (required)
- messages: jsonb (required)
- tool_states: jsonb (required)
### memory_entries
- id: uuid (pk)
- project_id: uuid (required, fk)
- topic: text (required)
- title: text (required)
- content: text (required)
- date: date
- mood: text