feat: Improve agents config

2026-07-01 18:49:14 -04:00 · 2026-06-29 23:12:44 +02:00
parent 080947c0dc
commit 2a3fd4f5be
26 changed files with 274 additions and 15 deletions
--- a/sources/agents/llamacpp_completion_fim.toml
+++ b/sources/agents/llamacpp_completion_fim.toml
@@ -0,0 +1,15 @@
+schema_version = 1
+
+name        = "llama.cpp Completion — FIM"
+description = "Local llama.cpp native fill-in-the-middle via the /infill endpoint (input_prefix + input_suffix). Fast and clean, but the loaded GGUF MUST be a FIM-trained model (qwen2.5-coder, codellama-code, deepseek-coder, starcoder2, codegemma). A plain chat model produces garbage here — there is no native completion path for those. llama-server serves whichever model is loaded, so 'model' is only a label."
+
+provider_instance = "llama.cpp"
+endpoint          = "/infill"
+model             = "qwen2.5-coder-7b"
+tags              = ["completion", "llama.cpp", "local", "fim"]
+
+[body]
+input_prefix = """{{ tojson(ctx.prefix) }}"""
+input_suffix = """{% if existsIn(ctx, "suffix") %}{{ tojson(ctx.suffix) }}{% endif %}"""
+n_predict    = 256
+temperature  = 0.2