mirror of
https://github.com/aaronpo97/the-biergarten-app.git
synced 2026-06-01 01:54:00 +00:00
Pipeline: Add Runpod docker configuration (#222)
* Begin work on Runpod docker config
* Reduce docker image size
* Create .dockerignore
This commit is contained in:
@@ -3,7 +3,8 @@
|
||||
|
||||
/**
|
||||
* @file data_model/models.h
|
||||
- * @brief Core data models: locations, application configuration, and generation inputs.
|
||||
+ * @brief Core data models: locations, application configuration, and generation
|
||||
+ * inputs.
|
||||
*/
|
||||
|
||||
#include <boost/program_options.hpp>
|
||||
@@ -94,6 +95,9 @@ struct GeneratorOptions {
|
||||
/// @brief Use mocked generator instead of actual LLM inference.
|
||||
bool use_mocked = false;
|
||||
|
||||
/// @brief Number of layers to offload to GPU.
|
||||
int n_gpu_layers = 0;
|
||||
|
||||
/// @brief Specific sampling parameters for this generator.
|
||||
/// If nullopt, the application should use global defaults.
|
||||
std::optional<SamplingOptions> sampling;
|
||||
|
||||
Reference in New Issue
Block a user