LLAMA: replace test_main with nitro agent application

Chris Warren-Smith · Chris Warren-Smith · commit 370e440b9a67 · 2026-05-20T20:21:38.000+09:30
diff --git a/llama/CMakeLists.txt b/llama/CMakeLists.txt
@@ -150,27 +150,79 @@ set_target_properties(llm PROPERTIES
 )
 
 # -----------------------------
-# Optional test application
+# nitro agent application
+# (only built when notcurses is available)
 # -----------------------------
-add_executable(llm_test
-  test_main.cpp
-)
+find_package(PkgConfig QUIET)
+
+set(NC_FOUND FALSE)
+set(NC_TARGET "")
+
+if(DEFINED NOTCURSES_DIR)
+  # Explicit path — create an imported target manually. The not-found check
+  # is spelled out because find_library(... REQUIRED) needs CMake >= 3.18.
+  find_library(NC_LIB      NAMES notcurses      HINTS "${NOTCURSES_DIR}/lib")
+  find_library(NC_CORE_LIB NAMES notcurses-core HINTS "${NOTCURSES_DIR}/lib")
+  if(NOT NC_LIB)
+    message(FATAL_ERROR "notcurses library not found (NOTCURSES_DIR=${NOTCURSES_DIR})")
+  endif()
+  add_library(notcurses_imported INTERFACE IMPORTED)
+  target_include_directories(notcurses_imported INTERFACE "${NOTCURSES_DIR}/include")
+  target_link_libraries(notcurses_imported INTERFACE "${NC_LIB}")
+  if(NC_CORE_LIB)
+    target_link_libraries(notcurses_imported INTERFACE "${NC_CORE_LIB}")
+  endif()
+  set(NC_TARGET notcurses_imported)
+  set(NC_FOUND TRUE)
+elseif(PkgConfig_FOUND)
+  # IMPORTED_TARGET gives a PkgConfig::NC target with full lib paths baked in
+  pkg_check_modules(NC QUIET IMPORTED_TARGET notcurses)
+  if(TARGET PkgConfig::NC)
+    set(NC_TARGET PkgConfig::NC)
+    set(NC_FOUND TRUE)
+  endif()
+endif()
 
-target_include_directories(llm_test PRIVATE
-  ${LLAMA_DIR}/include
-  ${LLAMA_DIR}/ggml/include
-  ${CMAKE_CURRENT_SOURCE_DIR}/../include
-)
+if(NOT NC_FOUND)
+  # Last resort: no pkg-config, or pkg-config does not know notcurses.
+  # Probe the default search paths for both libraries and the public header.
+  find_library(NC_LIB      NAMES notcurses)
+  find_library(NC_CORE_LIB NAMES notcurses-core)
+  find_path(NC_INCLUDE_DIR NAMES notcurses/notcurses.h)
+  if(NC_LIB AND NC_CORE_LIB)
+    add_library(notcurses_imported INTERFACE IMPORTED)
+    target_link_libraries(notcurses_imported INTERFACE "${NC_LIB}" "${NC_CORE_LIB}")
+    if(NC_INCLUDE_DIR)
+      target_include_directories(notcurses_imported INTERFACE "${NC_INCLUDE_DIR}")
+    endif()
+    set(NC_TARGET notcurses_imported)
+    set(NC_FOUND TRUE)
+  endif()
+endif()
 
-target_link_libraries(llm_test PRIVATE
-  llm
-  llama
-  ggml
-)
+if(NC_FOUND)
+  message(STATUS "notcurses found — building nitro")
 
-set_target_properties(llm_test PROPERTIES
-  RUNTIME_OUTPUT_DIRECTORY ${CMAKE_BINARY_DIR}/bin
-)
+  add_executable(nitro
+    nitro.cpp
+  )
+  target_include_directories(nitro PRIVATE
+    ${LLAMA_DIR}/include
+    ${LLAMA_DIR}/ggml/include
+    ${CMAKE_CURRENT_SOURCE_DIR}/../include
+  )
+  target_link_libraries(nitro PRIVATE
+    llm
+    llama
+    ggml
+    ${NC_TARGET}           # imported target carries lib paths (+ include dir when known)
+  )
+  set_target_properties(nitro PROPERTIES
+    RUNTIME_OUTPUT_DIRECTORY ${CMAKE_BINARY_DIR}/bin
+  )
+else()
+  message(STATUS "notcurses not found — skipping nitro (set -DNOTCURSES_DIR=... to enable)")
+endif()
 
 # -----------------------------
 # RAG indexer
diff --git a/llama/llama-sb-rag.cpp b/llama/llama-sb-rag.cpp
@@ -6,6 +6,7 @@
 // Copyright(C) 2026 Chris Warren-Smith
 
 #include "llama-sb.h"
+#include "llama-sb-rag.h"
 
 #include <algorithm>
 #include <cmath>
@@ -17,55 +18,6 @@
 #include <string>
 #include <vector>
 
-struct RagChunk {
-  std::string        text;
-  std::string        source;
-  std::string        type;
-  std::vector<float> embedding;
-};
-
-struct RagDB {
-  std::vector<RagChunk> chunks;
-  int embed_dim = 0;
-
-  int  size()  const { return (int)chunks.size(); }
-  bool empty() const { return chunks.empty(); }
-};
-
-//
-// per-session deduplication + token budget
-//
-struct RagSession {
-  std::vector<bool> seen;        /* sized to db.size() on init  */
-  int  tokens_used  = 0;
-  int  tokens_max   = 0;         /* set to your n_ctx           */
-  float score_threshold = 0.60f; /* skip weak matches           */
-
-  void init(int n_chunks, int ctx_size) {
-    seen.assign(n_chunks, false);
-    tokens_used = 0;
-    tokens_max  = ctx_size;
-  }
-
-  void reset() {
-    std::fill(seen.begin(), seen.end(), false);
-    tokens_used = 0;
-  }
-
-  bool is_seen(int idx)  const { return idx < (int)seen.size() && seen[idx]; }
-  void mark(int idx)           { if (idx < (int)seen.size()) seen[idx] = true; }
-
-  /* rough token estimate: 1 token ≈ 4 chars */
-  bool budget_ok(const std::string &text) const {
-    return tokens_max == 0 ||
-           (tokens_used + (int)text.size() / 4) < (int)(tokens_max * 0.85f);
-  }
-
-  void charge(const std::string &text) {
-    tokens_used += (int)text.size() / 4;
-  }
-};
-
 bool Llama::embed_text(const std::string &text, std::vector<float> &out, int embed_dim) {
   vector<llama_token> tokens = tokenize(text);
   if (tokens.size() == 0) {
diff --git a/llama/llama-sb-rag.h b/llama/llama-sb-rag.h
@@ -0,0 +1,74 @@
+// This file is part of SmallBASIC
+//
+// This program is distributed under the terms of the GPL v2.0 or later
+// Download the GNU Public License (GPL) from www.gnu.org
+//
+// Copyright(C) 2026 Chris Warren-Smith
+
+#pragma once
+
+// Pulled in here so the header compiles on its own, regardless of what the
+// including file has already included.
+#include <algorithm>
+#include <string>
+#include <vector>
+
+//
+// a piece of text plus its source, type and embedding vector
+//
+struct RagChunk {
+  std::string        text;
+  std::string        source;
+  std::string        type;
+  std::vector<float> embedding;
+};
+
+//
+// list of chunks together with embed_dim
+//
+struct RagDB {
+  std::vector<RagChunk> chunks;
+  int embed_dim = 0;
+
+  int  size()  const { return (int)chunks.size(); }
+  bool empty() const { return chunks.empty(); }
+};
+
+//
+// per-session deduplication + token budget
+//
+struct RagSession {
+  std::vector<bool> seen;        /* sized to db.size() on init  */
+  int  tokens_used  = 0;
+  int  tokens_max   = 0;         /* set to your n_ctx           */
+  float score_threshold = 0.60f; /* skip weak matches           */
+
+  /* start over: n_chunks unseen entries, zero tokens used, new budget */
+  void init(int n_chunks, int ctx_size) {
+    seen.assign(n_chunks, false);
+    tokens_used = 0;
+    tokens_max  = ctx_size;
+  }
+
+  /* clear seen flags and tokens_used; tokens_max and seen.size() are kept */
+  void reset() {
+    std::fill(seen.begin(), seen.end(), false);
+    tokens_used = 0;
+  }
+
+  /* an idx outside [0, seen.size()) is never seen and mark() ignores it */
+  bool is_seen(int idx)  const { return idx >= 0 && idx < (int)seen.size() && seen[idx]; }
+  void mark(int idx)           { if (idx >= 0 && idx < (int)seen.size()) seen[idx] = true; }
+
+  /* rough token estimate: 1 token ≈ 4 chars */
+  /* tokens_max == 0 disables the check; otherwise stay below 85% of it */
+  bool budget_ok(const std::string &text) const {
+    return tokens_max == 0 ||
+           (tokens_used + (int)text.size() / 4) < (int)(tokens_max * 0.85f);
+  }
+
+  /* add the estimated token count of text to tokens_used */
+  void charge(const std::string &text) {
+    tokens_used += (int)text.size() / 4;
+  }
+};
diff --git a/llama/llama-sb.cpp b/llama/llama-sb.cpp
@@ -130,10 +130,6 @@ void Llama::reset() {
   _min_p = 0.0f;
   _max_tokens = 150;
   _n_past = 0;
-  _is_gemma4 = false;
-  _grammar_src.clear();
-  _grammar_root.clear();
-  _template.clear();
   _seed = LLAMA_DEFAULT_SEED;
   if (_ctx) {
     llama_memory_clear(llama_get_memory(_ctx), true);
diff --git a/llama/llama.cpp b/llama/llama.cpp
@@ -1 +1 @@
-Subproject commit 3fbadb06dc867d3236937705477e090724ebbc6e
+Subproject commit 6db130445d29b243ee2171efb8cd61b84a1c5322
diff --git a/llama/nitro.cpp b/llama/nitro.cpp
diff --git a/llama/test_main.cpp b/llama/test_main.cpp