- Enable bulk ingest job (run_examples_bulk_ingest=true) to populate the fire_example table from top/all + top/year across 12 FIRE subreddits. Job fire-planner-examples-bulk-202606042150 is currently running.
- Upgrade examples_llm_model from qwen3vl-4b to qwen3-8b; the GPU has 10.7 GB free (immich-ml is using ~4 GB of 15 GB total), so the higher-quality model fits.
- Add LLM_CONCURRENCY=3 to the bulk job container — claude-agent-service is now bounded-concurrency (MAX_CONCURRENCY=10) rather than single-flight, so strictly serial extraction (the default of 1) is no longer necessary.

TODO: flip run_examples_bulk_ingest=false after the job completes and re-apply to push the weekly CronJob model upgrade (qwen3vl-4b→qwen3-8b), which didn't land in this apply (TF timed out waiting for Job completion).

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
33 lines
699 B
HCL
33 lines
699 B
HCL
# Inherit the shared root Terragrunt configuration.
# Per the Terragrunt docs, find_in_parent_folders() with no arguments walks up
# the directory tree and returns the path of the first parent terragrunt.hcl.
include "root" {
  path = find_in_parent_folders()
}
|
|
|
|
# Ordering-only dependency on the ../platform unit.
# skip_outputs = true tells Terragrunt not to run `terragrunt output` against
# it, so no values are read from it here; the block only declares the dependency.
dependency "platform" {
  config_path  = "../platform"
  skip_outputs = true
}
|
|
|
|
# Ordering-only dependency on the ../vault unit.
# skip_outputs = true tells Terragrunt not to run `terragrunt output` against
# it, so no values are read from it here; the block only declares the dependency.
dependency "vault" {
  config_path  = "../vault"
  skip_outputs = true
}
|
|
|
|
# Ordering-only dependency on the ../external-secrets unit.
# skip_outputs = true tells Terragrunt not to run `terragrunt output` against
# it, so no values are read from it here; the block only declares the dependency.
dependency "external-secrets" {
  config_path  = "../external-secrets"
  skip_outputs = true
}
|
|
|
|
# Ordering-only dependency on the ../dbaas unit.
# skip_outputs = true tells Terragrunt not to run `terragrunt output` against
# it, so no values are read from it here; the block only declares the dependency.
dependency "dbaas" {
  config_path  = "../dbaas"
  skip_outputs = true
}
|
|
|
|
# Input variables handed to the Terraform module for this unit.
inputs = {
  # fire-planner repo HEAD — bump on every deploy.
  # NOTE(review): "latest" is a floating tag, so there is nothing to bump and
  # a re-apply may not roll out a new image. Confirm whether this should be
  # pinned to a commit SHA / immutable tag per deploy.
  image_tag = "latest"

  # Bulk ingest toggle — flip to true once, apply, monitor job, then reset to false.
  # TODO: currently enabled for the in-flight bulk ingest job; reset to false
  # once that job completes and re-apply.
  run_examples_bulk_ingest = true

  # qwen3-8b: GPU has ~10.7 GB free (immich-ml using ~4 GB of 15 GB total).
  examples_llm_model = "qwen3-8b"
}
|