format codebase

Aaron Po
2026-04-02 21:46:46 -04:00
parent ba165d8aa7
commit 3af053f0eb
31 changed files with 1479 additions and 1445 deletions

View File

@@ -1,46 +1,49 @@
#include "data_generation/data_downloader.h"
#include "web_client/web_client.h"
#include <spdlog/spdlog.h>
#include <filesystem>
#include <fstream>
#include <spdlog/spdlog.h>
#include <sstream>
#include <stdexcept>
#include "web_client/web_client.h"
DataDownloader::DataDownloader(std::shared_ptr<WebClient> web_client)
: web_client_(std::move(web_client)) {}
DataDownloader::~DataDownloader() {}
bool DataDownloader::FileExists(const std::string &file_path) {
return std::filesystem::exists(file_path);
bool DataDownloader::FileExists(const std::string& file_path) {
return std::filesystem::exists(file_path);
}
std::string
DataDownloader::DownloadCountriesDatabase(const std::string &cache_path,
const std::string &commit) {
if (FileExists(cache_path)) {
spdlog::info("[DataDownloader] Cache hit: {}", cache_path);
return cache_path;
}
std::string DataDownloader::DownloadCountriesDatabase(
const std::string& cache_path, const std::string& commit) {
if (FileExists(cache_path)) {
spdlog::info("[DataDownloader] Cache hit: {}", cache_path);
return cache_path;
}
std::string short_commit = commit;
if (commit.length() > 7) {
short_commit = commit.substr(0, 7);
}
std::string short_commit = commit;
if (commit.length() > 7) {
short_commit = commit.substr(0, 7);
}
std::string url = "https://raw.githubusercontent.com/dr5hn/"
"countries-states-cities-database/" +
short_commit + "/json/countries+states+cities.json";
std::string url =
"https://raw.githubusercontent.com/dr5hn/"
"countries-states-cities-database/" +
short_commit + "/json/countries+states+cities.json";
spdlog::info("[DataDownloader] Downloading: {}", url);
spdlog::info("[DataDownloader] Downloading: {}", url);
web_client_->DownloadToFile(url, cache_path);
web_client_->DownloadToFile(url, cache_path);
std::ifstream file_check(cache_path, std::ios::binary | std::ios::ate);
std::streamsize size = file_check.tellg();
file_check.close();
std::ifstream file_check(cache_path, std::ios::binary | std::ios::ate);
std::streamsize size = file_check.tellg();
file_check.close();
spdlog::info("[DataDownloader] OK: Download complete: {} ({:.2f} MB)",
cache_path, (size / (1024.0 * 1024.0)));
return cache_path;
spdlog::info("[DataDownloader] OK: Download complete: {} ({:.2f} MB)",
cache_path, (size / (1024.0 * 1024.0)));
return cache_path;
}
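A minimal call-site sketch for this class (not part of the commit; it assumes WebClient is concrete and default-constructible, which the diff does not show):

#include <memory>
#include <string>

int main() {
  // Hypothetical setup: WebClient's constructor is not shown in this diff.
  auto client = std::make_shared<WebClient>();
  DataDownloader downloader(client);

  // Second and later runs take the cache-hit early return above.
  const std::string path = downloader.DownloadCountriesDatabase(
      "cache/countries+states+cities.json",
      "0123456789abcdef0123456789abcdef01234567");  // placeholder SHA; shortened to 7 chars for the raw URL
  return path.empty() ? 1 : 0;
}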

View File

@@ -1,17 +1,16 @@
#include "data_generation/llama_generator.h"
#include "llama.h"
#include "data_generation/llama_generator.h"
LlamaGenerator::~LlamaGenerator() {
if (context_ != nullptr) {
llama_free(context_);
context_ = nullptr;
}
if (context_ != nullptr) {
llama_free(context_);
context_ = nullptr;
}
if (model_ != nullptr) {
llama_model_free(model_);
model_ = nullptr;
}
if (model_ != nullptr) {
llama_model_free(model_);
model_ = nullptr;
}
llama_backend_free();
llama_backend_free();
}

View File

@@ -1,72 +1,74 @@
#include <spdlog/spdlog.h>
#include <stdexcept>
#include <string>
#include "data_generation/llama_generator.h"
#include "data_generation/llama_generator_helpers.h"

BreweryResult LlamaGenerator::GenerateBrewery(
    const std::string& city_name, const std::string& country_name,
    const std::string& region_context) {
  const std::string safe_region_context =
      PrepareRegionContextPublic(region_context);

  const std::string system_prompt =
      "You are the brewmaster and owner of a local craft brewery. "
      "Write a name and a short, soulful description for your brewery that "
      "reflects your pride in the local community and your craft. "
      "The tone should be authentic and welcoming, like a note on a "
      "chalkboard "
      "menu. Output ONLY a single JSON object with keys \"name\" and "
      "\"description\". "
      "Do not include markdown formatting or backticks.";

  std::string prompt =
      "Write a brewery name and place-specific description for a craft "
      "brewery in " +
      city_name +
      (country_name.empty() ? std::string("")
                            : std::string(", ") + country_name) +
      (safe_region_context.empty()
           ? std::string(".")
           : std::string(". Regional context: ") + safe_region_context);

  const int max_attempts = 3;
  std::string raw;
  std::string last_error;
  for (int attempt = 0; attempt < max_attempts; ++attempt) {
    raw = Infer(system_prompt, prompt, 384);
    spdlog::debug("LlamaGenerator: raw output (attempt {}): {}", attempt + 1,
                  raw);

    std::string name;
    std::string description;
    const std::string validation_error =
        ValidateBreweryJsonPublic(raw, name, description);
    if (validation_error.empty()) {
      return {std::move(name), std::move(description)};
    }

    last_error = validation_error;
    spdlog::warn("LlamaGenerator: malformed brewery JSON (attempt {}): {}",
                 attempt + 1, validation_error);

    prompt =
        "Your previous response was invalid. Error: " + validation_error +
        "\nReturn ONLY valid JSON with this exact schema: "
        "{\"name\": \"string\", \"description\": \"string\"}."
        "\nDo not include markdown, comments, or extra keys."
        "\n\nLocation: " +
        city_name +
        (country_name.empty() ? std::string("")
                              : std::string(", ") + country_name) +
        (safe_region_context.empty()
             ? std::string("")
             : std::string("\nRegional context: ") + safe_region_context);
  }

  spdlog::error(
      "LlamaGenerator: malformed brewery response after {} attempts: "
      "{}",
      max_attempts, last_error.empty() ? raw : last_error);
  throw std::runtime_error("LlamaGenerator: malformed brewery response");
}
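For orientation, a hypothetical call site; it assumes a LlamaGenerator that has already been configured via Load() and SetSamplingOptions():

void LogBreweryFor(LlamaGenerator& generator) {
  try {
    const BreweryResult brewery = generator.GenerateBrewery(
        "Portland", "United States", "Pacific Northwest hop country");
    spdlog::info("{}: {}", brewery.name, brewery.description);
  } catch (const std::runtime_error& e) {
    // Reached only after all three attempts fail JSON validation.
    spdlog::error("brewery generation failed: {}", e.what());
  }
}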

View File

@@ -1,56 +1,57 @@
#include <spdlog/spdlog.h>
#include <algorithm>
#include <stdexcept>
#include <string>
#include "data_generation/llama_generator.h"
#include "data_generation/llama_generator_helpers.h"

UserResult LlamaGenerator::GenerateUser(const std::string& locale) {
  const std::string system_prompt =
      "You generate plausible social media profiles for craft beer "
      "enthusiasts. "
      "Respond with exactly two lines: "
      "the first line is a username (lowercase, no spaces, 8-20 characters), "
      "the second line is a one-sentence bio (20-40 words). "
      "The profile should feel consistent with the locale. "
      "No preamble, no labels.";

  std::string prompt =
      "Generate a craft beer enthusiast profile. Locale: " + locale;

  const int max_attempts = 3;
  std::string raw;
  for (int attempt = 0; attempt < max_attempts; ++attempt) {
    raw = Infer(system_prompt, prompt, 128);
    spdlog::debug("LlamaGenerator (user): raw output (attempt {}): {}",
                  attempt + 1, raw);

    try {
      auto [username, bio] = ParseTwoLineResponsePublic(
          raw, "LlamaGenerator: malformed user response");

      username.erase(
          std::remove_if(username.begin(), username.end(),
                         [](unsigned char ch) { return std::isspace(ch); }),
          username.end());

      if (username.empty() || bio.empty()) {
        throw std::runtime_error("LlamaGenerator: malformed user response");
      }

      if (bio.size() > 200) bio = bio.substr(0, 200);
      return {username, bio};
    } catch (const std::exception& e) {
      spdlog::warn(
          "LlamaGenerator: malformed user response (attempt {}): {}",
          attempt + 1, e.what());
    }
  }

  spdlog::error(
      "LlamaGenerator: malformed user response after {} attempts: {}",
      max_attempts, raw);
  throw std::runtime_error("LlamaGenerator: malformed user response");
}

View File

@@ -1,367 +1,365 @@
#include <algorithm>
#include <array>
#include <boost/json.hpp>
#include <cctype>
#include <sstream>
#include <stdexcept>
#include <string>
#include <vector>
#include "data_generation/llama_generator.h"
#include "llama.h"

namespace {
std::string Trim(std::string value) {
  auto not_space = [](unsigned char ch) { return !std::isspace(ch); };

  value.erase(value.begin(),
              std::find_if(value.begin(), value.end(), not_space));
  value.erase(std::find_if(value.rbegin(), value.rend(), not_space).base(),
              value.end());

  return value;
}

std::string CondenseWhitespace(std::string text) {
  std::string out;
  out.reserve(text.size());

  bool in_whitespace = false;
  for (unsigned char ch : text) {
    if (std::isspace(ch)) {
      if (!in_whitespace) {
        out.push_back(' ');
        in_whitespace = true;
      }
      continue;
    }

    in_whitespace = false;
    out.push_back(static_cast<char>(ch));
  }

  return Trim(std::move(out));
}

std::string PrepareRegionContext(std::string_view region_context,
                                 std::size_t max_chars) {
  std::string normalized = CondenseWhitespace(std::string(region_context));
  if (normalized.size() <= max_chars) {
    return normalized;
  }

  normalized.resize(max_chars);
  const std::size_t last_space = normalized.find_last_of(' ');
  if (last_space != std::string::npos && last_space > max_chars / 2) {
    normalized.resize(last_space);
  }

  normalized += "...";
  return normalized;
}

std::string StripCommonPrefix(std::string line) {
  line = Trim(std::move(line));

  if (!line.empty() && (line[0] == '-' || line[0] == '*')) {
    line = Trim(line.substr(1));
  } else {
    std::size_t i = 0;
    while (i < line.size() &&
           std::isdigit(static_cast<unsigned char>(line[i]))) {
      ++i;
    }
    if (i > 0 && i < line.size() && (line[i] == '.' || line[i] == ')')) {
      line = Trim(line.substr(i + 1));
    }
  }

  auto strip_label = [&line](const std::string& label) {
    if (line.size() >= label.size()) {
      bool matches = true;
      for (std::size_t i = 0; i < label.size(); ++i) {
        if (std::tolower(static_cast<unsigned char>(line[i])) !=
            std::tolower(static_cast<unsigned char>(label[i]))) {
          matches = false;
          break;
        }
      }
      if (matches) {
        line = Trim(line.substr(label.size()));
      }
    }
  };

  strip_label("name:");
  strip_label("brewery name:");
  strip_label("description:");
  strip_label("username:");
  strip_label("bio:");

  return Trim(std::move(line));
}

std::pair<std::string, std::string> ParseTwoLineResponse(
    const std::string& raw, const std::string& error_message) {
  std::string normalized = raw;
  std::replace(normalized.begin(), normalized.end(), '\r', '\n');

  std::vector<std::string> lines;
  std::stringstream stream(normalized);
  std::string line;
  while (std::getline(stream, line)) {
    line = StripCommonPrefix(std::move(line));
    if (!line.empty()) lines.push_back(std::move(line));
  }

  std::vector<std::string> filtered;
  for (auto& l : lines) {
    std::string low = l;
    std::transform(low.begin(), low.end(), low.begin(), [](unsigned char c) {
      return static_cast<char>(std::tolower(c));
    });
    if (!l.empty() && l.front() == '<' && low.back() == '>') continue;
    if (low.rfind("okay,", 0) == 0 || low.rfind("hmm", 0) == 0) continue;
    filtered.push_back(std::move(l));
  }

  if (filtered.size() < 2) throw std::runtime_error(error_message);

  std::string first = Trim(filtered.front());
  std::string second;
  for (size_t i = 1; i < filtered.size(); ++i) {
    if (!second.empty()) second += ' ';
    second += filtered[i];
  }
  second = Trim(std::move(second));

  if (first.empty() || second.empty()) throw std::runtime_error(error_message);
  return {first, second};
}

std::string ToChatPrompt(const llama_model* model,
                         const std::string& user_prompt) {
  const char* tmpl = llama_model_chat_template(model, nullptr);
  if (tmpl == nullptr) {
    return user_prompt;
  }

  const llama_chat_message message{"user", user_prompt.c_str()};

  std::vector<char> buffer(
      std::max<std::size_t>(1024, user_prompt.size() * 4));
  int32_t required =
      llama_chat_apply_template(tmpl, &message, 1, true, buffer.data(),
                                static_cast<int32_t>(buffer.size()));
  if (required < 0) {
    throw std::runtime_error("LlamaGenerator: failed to apply chat template");
  }

  if (required >= static_cast<int32_t>(buffer.size())) {
    buffer.resize(static_cast<std::size_t>(required) + 1);
    required =
        llama_chat_apply_template(tmpl, &message, 1, true, buffer.data(),
                                  static_cast<int32_t>(buffer.size()));
    if (required < 0) {
      throw std::runtime_error(
          "LlamaGenerator: failed to apply chat template");
    }
  }

  return std::string(buffer.data(), static_cast<std::size_t>(required));
}

std::string ToChatPrompt(const llama_model* model,
                         const std::string& system_prompt,
                         const std::string& user_prompt) {
  const char* tmpl = llama_model_chat_template(model, nullptr);
  if (tmpl == nullptr) {
    return system_prompt + "\n\n" + user_prompt;
  }

  const llama_chat_message messages[2] = {{"system", system_prompt.c_str()},
                                          {"user", user_prompt.c_str()}};

  std::vector<char> buffer(std::max<std::size_t>(
      1024, (system_prompt.size() + user_prompt.size()) * 4));
  int32_t required =
      llama_chat_apply_template(tmpl, messages, 2, true, buffer.data(),
                                static_cast<int32_t>(buffer.size()));
  if (required < 0) {
    throw std::runtime_error("LlamaGenerator: failed to apply chat template");
  }

  if (required >= static_cast<int32_t>(buffer.size())) {
    buffer.resize(static_cast<std::size_t>(required) + 1);
    required =
        llama_chat_apply_template(tmpl, messages, 2, true, buffer.data(),
                                  static_cast<int32_t>(buffer.size()));
    if (required < 0) {
      throw std::runtime_error(
          "LlamaGenerator: failed to apply chat template");
    }
  }

  return std::string(buffer.data(), static_cast<std::size_t>(required));
}

void AppendTokenPiece(const llama_vocab* vocab, llama_token token,
                      std::string& output) {
  std::array<char, 256> buffer{};
  int32_t bytes =
      llama_token_to_piece(vocab, token, buffer.data(),
                           static_cast<int32_t>(buffer.size()), 0, true);
  if (bytes < 0) {
    std::vector<char> dynamic_buffer(static_cast<std::size_t>(-bytes));
    bytes = llama_token_to_piece(vocab, token, dynamic_buffer.data(),
                                 static_cast<int32_t>(dynamic_buffer.size()),
                                 0, true);
    if (bytes < 0) {
      throw std::runtime_error(
          "LlamaGenerator: failed to decode sampled token piece");
    }
    output.append(dynamic_buffer.data(), static_cast<std::size_t>(bytes));
    return;
  }

  output.append(buffer.data(), static_cast<std::size_t>(bytes));
}

bool ExtractFirstJsonObject(const std::string& text, std::string& json_out) {
  std::size_t start = std::string::npos;
  int depth = 0;
  bool in_string = false;
  bool escaped = false;

  for (std::size_t i = 0; i < text.size(); ++i) {
    const char ch = text[i];

    if (in_string) {
      if (escaped) {
        escaped = false;
      } else if (ch == '\\') {
        escaped = true;
      } else if (ch == '"') {
        in_string = false;
      }
      continue;
    }

    if (ch == '"') {
      in_string = true;
      continue;
    }

    if (ch == '{') {
      if (depth == 0) {
        start = i;
      }
      ++depth;
      continue;
    }

    if (ch == '}') {
      if (depth == 0) {
        continue;
      }
      --depth;
      if (depth == 0 && start != std::string::npos) {
        json_out = text.substr(start, i - start + 1);
        return true;
      }
    }
  }

  return false;
}

std::string ValidateBreweryJson(const std::string& raw, std::string& name_out,
                                std::string& description_out) {
  auto validate_object = [&](const boost::json::value& jv,
                             std::string& error_out) -> bool {
    if (!jv.is_object()) {
      error_out = "JSON root must be an object";
      return false;
    }

    const auto& obj = jv.get_object();
    if (!obj.contains("name") || !obj.at("name").is_string()) {
      error_out = "JSON field 'name' is missing or not a string";
      return false;
    }

    if (!obj.contains("description") || !obj.at("description").is_string()) {
      error_out = "JSON field 'description' is missing or not a string";
      return false;
    }

    name_out = Trim(std::string(obj.at("name").as_string().c_str()));
    description_out =
        Trim(std::string(obj.at("description").as_string().c_str()));

    if (name_out.empty()) {
      error_out = "JSON field 'name' must not be empty";
      return false;
    }

    if (description_out.empty()) {
      error_out = "JSON field 'description' must not be empty";
      return false;
    }

    std::string name_lower = name_out;
    std::string description_lower = description_out;
    std::transform(
        name_lower.begin(), name_lower.end(), name_lower.begin(),
        [](unsigned char c) { return static_cast<char>(std::tolower(c)); });
    std::transform(description_lower.begin(), description_lower.end(),
                   description_lower.begin(), [](unsigned char c) {
                     return static_cast<char>(std::tolower(c));
                   });

    if (name_lower == "string" || description_lower == "string") {
      error_out = "JSON appears to be a schema placeholder, not content";
      return false;
    }

    error_out.clear();
    return true;
  };

  boost::system::error_code ec;
  boost::json::value jv = boost::json::parse(raw, ec);
  std::string validation_error;
  if (ec) {
    std::string extracted;
    if (!ExtractFirstJsonObject(raw, extracted)) {
      return "JSON parse error: " + ec.message();
    }

    ec.clear();
    jv = boost::json::parse(extracted, ec);
    if (ec) {
      return "JSON parse error: " + ec.message();
    }

    if (!validate_object(jv, validation_error)) {
      return validation_error;
    }
    return {};
  }

  if (!validate_object(jv, validation_error)) {
    return validation_error;
  }
  return {};
}
} // namespace
@@ -369,33 +367,32 @@ std::string ValidateBreweryJson(const std::string& raw, std::string& name_out,
// Public wrappers around the anonymous-namespace helpers above, exposed to
// other translation units
std::string PrepareRegionContextPublic(std::string_view region_context,
                                       std::size_t max_chars) {
  return PrepareRegionContext(region_context, max_chars);
}

std::pair<std::string, std::string> ParseTwoLineResponsePublic(
    const std::string& raw, const std::string& error_message) {
  return ParseTwoLineResponse(raw, error_message);
}

std::string ToChatPromptPublic(const llama_model* model,
                               const std::string& user_prompt) {
  return ToChatPrompt(model, user_prompt);
}

std::string ToChatPromptPublic(const llama_model* model,
                               const std::string& system_prompt,
                               const std::string& user_prompt) {
  return ToChatPrompt(model, system_prompt, user_prompt);
}

void AppendTokenPiecePublic(const llama_vocab* vocab, llama_token token,
                            std::string& output) {
  AppendTokenPiece(vocab, token, output);
}

std::string ValidateBreweryJsonPublic(const std::string& raw,
                                      std::string& name_out,
                                      std::string& description_out) {
  return ValidateBreweryJson(raw, name_out, description_out);
}
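A small smoke test of the wrappers (illustrative only; the quoted model reply is invented):

bool WrapperSmokeTest() {
  std::string name;
  std::string description;
  const std::string err = ValidateBreweryJsonPublic(
      "Sure! {\"name\": \"Tide Line Ales\", "
      "\"description\": \"Salt-air saisons by the harbor.\"} Enjoy!",
      name, description);
  // err comes back empty: the surrounding chatter makes the raw string
  // invalid JSON, so the validator falls back to ExtractFirstJsonObject,
  // re-parses the balanced object, and fills both output fields.
  return err.empty() && name == "Tide Line Ales";
}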

View File

@@ -1,195 +1,199 @@
#include <spdlog/spdlog.h>
#include <algorithm>
#include <memory>
#include <stdexcept>
#include <string>
#include <vector>
#include "data_generation/llama_generator.h"
#include "data_generation/llama_generator_helpers.h"
#include "llama.h"

std::string LlamaGenerator::Infer(const std::string& prompt, int max_tokens) {
  if (model_ == nullptr || context_ == nullptr)
    throw std::runtime_error("LlamaGenerator: model not loaded");

  const llama_vocab* vocab = llama_model_get_vocab(model_);
  if (vocab == nullptr)
    throw std::runtime_error("LlamaGenerator: vocab unavailable");

  llama_memory_clear(llama_get_memory(context_), true);

  const std::string formatted_prompt = ToChatPromptPublic(model_, prompt);

  std::vector<llama_token> prompt_tokens(formatted_prompt.size() + 8);
  int32_t token_count = llama_tokenize(
      vocab, formatted_prompt.c_str(),
      static_cast<int32_t>(formatted_prompt.size()), prompt_tokens.data(),
      static_cast<int32_t>(prompt_tokens.size()), true, true);

  if (token_count < 0) {
    prompt_tokens.resize(static_cast<std::size_t>(-token_count));
    token_count = llama_tokenize(
        vocab, formatted_prompt.c_str(),
        static_cast<int32_t>(formatted_prompt.size()), prompt_tokens.data(),
        static_cast<int32_t>(prompt_tokens.size()), true, true);
  }

  if (token_count < 0)
    throw std::runtime_error("LlamaGenerator: prompt tokenization failed");

  const int32_t n_ctx = static_cast<int32_t>(llama_n_ctx(context_));
  const int32_t n_batch = static_cast<int32_t>(llama_n_batch(context_));
  if (n_ctx <= 1 || n_batch <= 0) {
    throw std::runtime_error("LlamaGenerator: invalid context or batch size");
  }

  const int32_t effective_max_tokens =
      std::max(1, std::min(max_tokens, n_ctx - 1));
  int32_t prompt_budget = std::min(n_batch, n_ctx - effective_max_tokens);
  prompt_budget = std::max<int32_t>(1, prompt_budget);

  prompt_tokens.resize(static_cast<std::size_t>(token_count));
  if (token_count > prompt_budget) {
    spdlog::warn(
        "LlamaGenerator: prompt too long ({} tokens), truncating to {} "
        "tokens to fit n_batch/n_ctx limits",
        token_count, prompt_budget);
    prompt_tokens.resize(static_cast<std::size_t>(prompt_budget));
    token_count = prompt_budget;
  }

  const llama_batch prompt_batch = llama_batch_get_one(
      prompt_tokens.data(), static_cast<int32_t>(prompt_tokens.size()));
  if (llama_decode(context_, prompt_batch) != 0)
    throw std::runtime_error("LlamaGenerator: prompt decode failed");

  llama_sampler_chain_params sampler_params =
      llama_sampler_chain_default_params();
  using SamplerPtr =
      std::unique_ptr<llama_sampler, decltype(&llama_sampler_free)>;
  SamplerPtr sampler(llama_sampler_chain_init(sampler_params),
                     &llama_sampler_free);
  if (!sampler)
    throw std::runtime_error("LlamaGenerator: failed to initialize sampler");

  llama_sampler_chain_add(sampler.get(),
                          llama_sampler_init_temp(sampling_temperature_));
  llama_sampler_chain_add(sampler.get(),
                          llama_sampler_init_top_p(sampling_top_p_, 1));
  llama_sampler_chain_add(sampler.get(),
                          llama_sampler_init_dist(sampling_seed_));

  std::vector<llama_token> generated_tokens;
  generated_tokens.reserve(static_cast<std::size_t>(max_tokens));

  for (int i = 0; i < effective_max_tokens; ++i) {
    const llama_token next =
        llama_sampler_sample(sampler.get(), context_, -1);
    if (llama_vocab_is_eog(vocab, next)) break;
    generated_tokens.push_back(next);
    llama_token token = next;
    const llama_batch one_token_batch = llama_batch_get_one(&token, 1);
    if (llama_decode(context_, one_token_batch) != 0)
      throw std::runtime_error(
          "LlamaGenerator: decode failed during generation");
  }

  std::string output;
  for (const llama_token token : generated_tokens)
    AppendTokenPiecePublic(vocab, token, output);
  return output;
}

std::string LlamaGenerator::Infer(const std::string& system_prompt,
                                  const std::string& prompt, int max_tokens) {
  if (model_ == nullptr || context_ == nullptr)
    throw std::runtime_error("LlamaGenerator: model not loaded");

  const llama_vocab* vocab = llama_model_get_vocab(model_);
  if (vocab == nullptr)
    throw std::runtime_error("LlamaGenerator: vocab unavailable");

  llama_memory_clear(llama_get_memory(context_), true);

  const std::string formatted_prompt =
      ToChatPromptPublic(model_, system_prompt, prompt);

  std::vector<llama_token> prompt_tokens(formatted_prompt.size() + 8);
  int32_t token_count = llama_tokenize(
      vocab, formatted_prompt.c_str(),
      static_cast<int32_t>(formatted_prompt.size()), prompt_tokens.data(),
      static_cast<int32_t>(prompt_tokens.size()), true, true);

  if (token_count < 0) {
    prompt_tokens.resize(static_cast<std::size_t>(-token_count));
    token_count = llama_tokenize(
        vocab, formatted_prompt.c_str(),
        static_cast<int32_t>(formatted_prompt.size()), prompt_tokens.data(),
        static_cast<int32_t>(prompt_tokens.size()), true, true);
  }

  if (token_count < 0)
    throw std::runtime_error("LlamaGenerator: prompt tokenization failed");

  const int32_t n_ctx = static_cast<int32_t>(llama_n_ctx(context_));
  const int32_t n_batch = static_cast<int32_t>(llama_n_batch(context_));
  if (n_ctx <= 1 || n_batch <= 0) {
    throw std::runtime_error("LlamaGenerator: invalid context or batch size");
  }

  const int32_t effective_max_tokens =
      std::max(1, std::min(max_tokens, n_ctx - 1));
  int32_t prompt_budget = std::min(n_batch, n_ctx - effective_max_tokens);
  prompt_budget = std::max<int32_t>(1, prompt_budget);

  prompt_tokens.resize(static_cast<std::size_t>(token_count));
  if (token_count > prompt_budget) {
    spdlog::warn(
        "LlamaGenerator: prompt too long ({} tokens), truncating to {} "
        "tokens to fit n_batch/n_ctx limits",
        token_count, prompt_budget);
    prompt_tokens.resize(static_cast<std::size_t>(prompt_budget));
    token_count = prompt_budget;
  }

  const llama_batch prompt_batch = llama_batch_get_one(
      prompt_tokens.data(), static_cast<int32_t>(prompt_tokens.size()));
  if (llama_decode(context_, prompt_batch) != 0)
    throw std::runtime_error("LlamaGenerator: prompt decode failed");

  llama_sampler_chain_params sampler_params =
      llama_sampler_chain_default_params();
  using SamplerPtr =
      std::unique_ptr<llama_sampler, decltype(&llama_sampler_free)>;
  SamplerPtr sampler(llama_sampler_chain_init(sampler_params),
                     &llama_sampler_free);
  if (!sampler)
    throw std::runtime_error("LlamaGenerator: failed to initialize sampler");

  llama_sampler_chain_add(sampler.get(),
                          llama_sampler_init_temp(sampling_temperature_));
  llama_sampler_chain_add(sampler.get(),
                          llama_sampler_init_top_p(sampling_top_p_, 1));
  llama_sampler_chain_add(sampler.get(),
                          llama_sampler_init_dist(sampling_seed_));

  std::vector<llama_token> generated_tokens;
  generated_tokens.reserve(static_cast<std::size_t>(max_tokens));

  for (int i = 0; i < effective_max_tokens; ++i) {
    const llama_token next =
        llama_sampler_sample(sampler.get(), context_, -1);
    if (llama_vocab_is_eog(vocab, next)) break;
    generated_tokens.push_back(next);
    llama_token token = next;
    const llama_batch one_token_batch = llama_batch_get_one(&token, 1);
    if (llama_decode(context_, one_token_batch) != 0)
      throw std::runtime_error(
          "LlamaGenerator: decode failed during generation");
  }

  std::string output;
  for (const llama_token token : generated_tokens)
    AppendTokenPiecePublic(vocab, token, output);
  return output;
}
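To make the clamp arithmetic concrete, a worked sketch; n_ctx = 2048 matches what Load() sets elsewhere in this commit, while n_batch = 512 is an assumption (the diff never sets it explicitly):

int32_t ExamplePromptBudget() {
  const int32_t n_ctx = 2048;      // value Load() configures in this commit
  const int32_t n_batch = 512;     // assumed default; not set in this diff
  const int32_t max_tokens = 384;  // the budget GenerateBrewery passes
  const int32_t effective_max_tokens =
      std::max(1, std::min(max_tokens, n_ctx - 1));  // 384
  int32_t prompt_budget = std::min(n_batch, n_ctx - effective_max_tokens);
  prompt_budget = std::max<int32_t>(1, prompt_budget);  // min(512, 1664) = 512
  return prompt_budget;  // a 600-token prompt would be truncated to 512
}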

View File

@@ -1,42 +1,42 @@
#include <spdlog/spdlog.h>
#include <stdexcept>
#include <string>
#include "data_generation/llama_generator.h"
#include "llama.h"

void LlamaGenerator::Load(const std::string& model_path) {
  if (model_path.empty())
    throw std::runtime_error("LlamaGenerator: model path must not be empty");

  if (context_ != nullptr) {
    llama_free(context_);
    context_ = nullptr;
  }
  if (model_ != nullptr) {
    llama_model_free(model_);
    model_ = nullptr;
  }

  llama_backend_init();

  llama_model_params model_params = llama_model_default_params();
  model_ = llama_model_load_from_file(model_path.c_str(), model_params);
  if (model_ == nullptr) {
    throw std::runtime_error(
        "LlamaGenerator: failed to load model from path: " + model_path);
  }

  llama_context_params context_params = llama_context_default_params();
  context_params.n_ctx = 2048;

  context_ = llama_init_from_model(model_, context_params);
  if (context_ == nullptr) {
    llama_model_free(model_);
    model_ = nullptr;
    throw std::runtime_error("LlamaGenerator: failed to create context");
  }

  spdlog::info("[LlamaGenerator] Loaded model: {}", model_path);
}

View File

@@ -1,26 +1,25 @@
#include <stdexcept>
#include "data_generation/llama_generator.h"
#include "llama.h"

void LlamaGenerator::SetSamplingOptions(float temperature, float top_p,
                                        int seed) {
  if (temperature < 0.0f) {
    throw std::runtime_error(
        "LlamaGenerator: sampling temperature must be >= 0");
  }
  if (!(top_p > 0.0f && top_p <= 1.0f)) {
    throw std::runtime_error(
        "LlamaGenerator: sampling top-p must be in (0, 1]");
  }
  if (seed < -1) {
    throw std::runtime_error(
        "LlamaGenerator: seed must be >= 0, or -1 for random");
  }

  sampling_temperature_ = temperature;
  sampling_top_p_ = top_p;
  sampling_seed_ = (seed < 0) ? static_cast<uint32_t>(LLAMA_DEFAULT_SEED)
                              : static_cast<uint32_t>(seed);
}
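A hypothetical configuration sequence (the model path and values are examples only; LlamaGenerator is assumed default-constructible):

void ConfigureGenerator() {
  LlamaGenerator generator;  // assumed default-constructible
  generator.Load("models/generator-q4.gguf");  // illustrative path
  generator.SetSamplingOptions(/*temperature=*/0.8f, /*top_p=*/0.95f,
                               /*seed=*/-1);
  // 0.8 and 0.95 pass the range checks above; per the ternary, -1 maps to
  // LLAMA_DEFAULT_SEED (nondeterministic sampling), while -2 would throw.
}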

View File

@@ -1,7 +1,7 @@
#include "data_generation/mock_generator.h"
#include <string>
#include <vector>
#include <functional>
#include <spdlog/spdlog.h>
#include "data_generation/mock_generator.h"
const std::vector<std::string> MockGenerator::kBreweryAdjectives = {
"Craft", "Heritage", "Local", "Artisan", "Pioneer", "Golden",
@@ -63,42 +63,3 @@ const std::vector<std::string> MockGenerator::kBios = {
"Craft beer fan mapping tasting notes and favorite brew routes.",
"Always ready to trade recommendations for underrated local breweries.",
"Keeping a running list of must-try collab releases and tap takeovers."};

View File

@@ -0,0 +1,12 @@
#include <string>
#include "data_generation/mock_generator.h"
std::size_t MockGenerator::DeterministicHash(const std::string& a,
const std::string& b) {
std::size_t seed = std::hash<std::string>{}(a);
const std::size_t mixed = std::hash<std::string>{}(b);
seed ^= mixed + 0x9e3779b97f4a7c15ULL + (seed << 6) + (seed >> 2);
seed = (seed << 13) | (seed >> ((sizeof(std::size_t) * 8) - 13));
return seed;
}
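Worth a note: std::hash is only guaranteed stable within a single standard-library build, so "deterministic" here means repeatable per platform rather than portable. A property sketch (it assumes DeterministicHash is accessible and static, which the diff does not show):

bool MixIsOrderSensitive() {
  // Same inputs and same build -> same value on every call.
  const std::size_t ab = MockGenerator::DeterministicHash("city", "region");
  const std::size_t ba = MockGenerator::DeterministicHash("region", "city");
  // The xor/shift mix folds b into a's seed asymmetrically, so swapping
  // the arguments almost always changes the result.
  return ab != ba;
}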

View File

@@ -0,0 +1,21 @@
#include <functional>
#include <string>
#include "data_generation/mock_generator.h"
BreweryResult MockGenerator::GenerateBrewery(
const std::string& city_name, const std::string& country_name,
const std::string& region_context) {
const std::string location_key =
country_name.empty() ? city_name : city_name + "," + country_name;
const std::size_t hash =
region_context.empty() ? std::hash<std::string>{}(location_key)
: DeterministicHash(location_key, region_context);
BreweryResult result;
result.name = kBreweryAdjectives[hash % kBreweryAdjectives.size()] + " " +
kBreweryNouns[(hash / 7) % kBreweryNouns.size()];
result.description =
kBreweryDescriptions[(hash / 13) % kBreweryDescriptions.size()];
return result;
}
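And the resulting behavior, sketched as a check (assumes a MockGenerator instance is at hand):

bool MockIsStable(MockGenerator& mock) {
  const BreweryResult a = mock.GenerateBrewery("Ghent", "Belgium", "");
  const BreweryResult b = mock.GenerateBrewery("Ghent", "Belgium", "");
  // The location key "Ghent,Belgium" hashes to the same table indices
  // both times, so the generated pair is identical across calls.
  return a.name == b.name && a.description == b.description;
}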

View File

@@ -0,0 +1,13 @@
#include <functional>
#include <string>
#include "data_generation/mock_generator.h"
UserResult MockGenerator::GenerateUser(const std::string& locale) {
const std::size_t hash = std::hash<std::string>{}(locale);
UserResult result;
result.username = kUsernames[hash % kUsernames.size()];
result.bio = kBios[(hash / 11) % kBios.size()];
return result;
}

View File

@@ -0,0 +1,9 @@
#include <spdlog/spdlog.h>
#include <string>
#include "data_generation/mock_generator.h"
void MockGenerator::Load(const std::string& /*modelPath*/) {
spdlog::info("[MockGenerator] No model needed");
}