/*
╔═════════════════════════════════════════════════════════════════════╗
║ ThemisDB - Hybrid Database System                                   ║
╠═════════════════════════════════════════════════════════════════════╣
║ File:          lora_training_example.cpp                            ║
║ Version:       0.0.47                                               ║
║ Last Modified: 2026-04-15 18:43:54                                  ║
║ Author:        unknown                                              ║
╠═════════════════════════════════════════════════════════════════════╣
║ Quality Metrics:                                                    ║
║   • Maturity Level: 🟢 PRODUCTION-READY                             ║
║   • Quality Score:  99.0/100                                        ║
║   • Total Lines:    242                                             ║
║   • Open Issues:    TODOs: 0, Stubs: 0                              ║
╠═════════════════════════════════════════════════════════════════════╣
║ Status: ✅ Production Ready                                         ║
╚═════════════════════════════════════════════════════════════════════╝
*/
/**
* @file lora_training_example.cpp
* @brief Example demonstrating LoRA training with llama.cpp base models
*
* This example shows:
* 1. Loading a frozen base model (GGUF format)
* 2. Creating LoRA adapters
* 3. Loading and preparing training data
* 4. Training the LoRA adapters
* 5. Exporting the trained adapters
*/
#include "llm/lora_framework/base_model_adapter.h"
#include "llm/lora_framework/data_loader.h"
#include "llm/lora_framework/lora_layers.h"
#include <spdlog/spdlog.h>
#include <fmt/format.h>
#include <iostream>
using namespace themis::llm::lora;
int main(int argc, char** argv) {
    // Configure logging
    spdlog::set_level(spdlog::level::info);
    spdlog::info("=== LoRA Training Example ===");

    // ========================================
    // 1. Configure LoRA-Enhanced Model
    // ========================================
    LoRAEnhancedModel::Config model_config;

    // Base model settings
    // Note: This example uses a placeholder path. Update with actual model path.
    model_config.base_model_path = (argc > 1) ? argv[1] : "models/llama-2-7b.gguf";

    // LoRA hyperparameters
    model_config.lora_config.rank = 8;               // Small rank for quick testing
    model_config.lora_config.alpha = 16.0f;          // Scaling factor (2*rank; effective scale is alpha/rank)
    model_config.lora_config.learning_rate = 3e-4f;  // Learning rate

    // Target modules (which layers to adapt)
    model_config.target_modules = {
        "attention.wq",  // Query projection
        "attention.wv"   // Value projection
    };
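
    // Adapting only the query and value projections follows the original LoRA
    // paper (Hu et al., 2021), which found that tuning W_q and W_v alone
    // recovers most of the quality of adapting every attention matrix, at a
    // fraction of the trainable-parameter cost.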
spdlog::info("Configuration:");
spdlog::info(" Base model: {}", model_config.base_model_path);
spdlog::info(" LoRA rank: {}", model_config.lora_config.rank);
spdlog::info(" LoRA alpha: {}", model_config.lora_config.alpha);
spdlog::info(" Target modules: {}", fmt::join(model_config.target_modules, ", "));
// ========================================
// 2. Initialize Model
// ========================================
spdlog::info("\n=== Initializing Model ===");
LoRAEnhancedModel model(model_config);
if (!model.initialize()) {
spdlog::error("Failed to initialize model. Check if model file exists: {}",
model_config.base_model_path);
spdlog::info("\nNote: This example requires a GGUF model file.");
spdlog::info("You can:");
spdlog::info("1. Download a model from HuggingFace");
spdlog::info("2. Convert a model to GGUF format");
spdlog::info("3. Provide model path as command line argument");
spdlog::info("\nUsage: {} <path_to_model.gguf>", argv[0]);
return 1;
}
spdlog::info("Model initialized successfully!");
spdlog::info(" Base parameters: {:L}", model.getBaseModelParameterCount());
spdlog::info(" LoRA parameters: {:L}", model.getLoRAParameterCount());
float reduction = 100.0f * (1.0f -
static_cast<float>(model.getLoRAParameterCount()) /
static_cast<float>(model.getBaseModelParameterCount()));
spdlog::info(" Parameter reduction: {:.2f}%", reduction);
    // ========================================
    // 3. Setup Data Loader
    // ========================================
    spdlog::info("\n=== Setting Up Data Loader ===");

    // Create tokenizer (using a simple character-level tokenizer for the demo)
    auto tokenizer = std::make_shared<SimpleTokenizer>();

    // Configure data loader
    DataLoaderConfig data_config;
    data_config.batch_size = 2;
    data_config.max_sequence_length = 128;
    data_config.shuffle = true;

    DataLoader loader(tokenizer, data_config);

    // Create toy dataset for demonstration
    // In production, you would load from file: loader.loadFromFile("data/train.json")
    spdlog::info("Creating toy dataset (10 samples)...");
    auto samples = data_utils::createToyDataset(10);

    if (!loader.loadFromSamples(samples)) {
        spdlog::error("Failed to load training data");
        return 1;
    }

    spdlog::info("Dataset loaded:");
    spdlog::info("  Total samples: {}", loader.size());
    spdlog::info("  Batch size: {}", data_config.batch_size);
    spdlog::info("  Number of batches: {}", loader.num_batches());

    // ========================================
    // 4. Setup Optimizer
    // ========================================
    spdlog::info("\n=== Setting Up Optimizer ===");
    SGDOptimizer optimizer(
        model_config.lora_config.learning_rate,
        0.9f,   // momentum
        0.01f   // weight_decay
    );
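
    // Assuming a conventional momentum-SGD update (the exact formulation
    // depends on the SGDOptimizer implementation), each step applies roughly:
    //   v     <- momentum * v + grad + weight_decay * theta
    //   theta <- theta - learning_rate * v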
    // Register LoRA parameters for optimization
    auto params = model.getTrainableParameters();
    optimizer.add_parameters(params);

    spdlog::info("Optimizer configured:");
    spdlog::info("  Learning rate: {}", model_config.lora_config.learning_rate);
    spdlog::info("  Trainable parameters: {}", params.size());

    // ========================================
    // 5. Training Loop
    // ========================================
    spdlog::info("\n=== Starting Training ===");
    const int num_epochs = 2;  // Small number for demo

    for (int epoch = 0; epoch < num_epochs; ++epoch) {
        spdlog::info("\nEpoch {}/{}", epoch + 1, num_epochs);
        loader.reset();
        float epoch_loss = 0.0f;
        int step = 0;

        while (loader.hasNext()) {
            // Get batch
            auto batch = loader.getNextBatch();

            // NOTE: This is a simplified training loop.
            // In production, you would:
            // 1. Forward pass through model with batch
            // 2. Compute loss (e.g., cross-entropy)
            // 3. Backward pass to compute gradients
            // 4. Optimizer step to update parameters
            // For now, just simulate with a decreasing loss
            float step_loss = 1.0f / (step + 1);
            epoch_loss += step_loss;

            // Zero gradients
            optimizer.zero_grad();

            // Normally: forward, compute loss, backward
            // ... (actual training implementation)
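            //
            // A minimal sketch of what that step could look like. The names
            // forward(), crossEntropyLoss(), and backward() are illustrative
            // placeholders, not the actual LoRAEnhancedModel API:
            //
            //   auto logits = model.forward(batch);             // hypothetical
            //   float loss  = crossEntropyLoss(logits, batch);  // hypothetical
            //   model.backward(loss);  // would populate the gradients that
            //                          // optimizer.step() consumes below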
            // Optimizer step
            optimizer.step();

            // Log progress every step (the demo dataset is tiny)
            spdlog::info("  Step {}: Loss = {:.4f}", step, step_loss);
            step++;
        }

        float avg_loss = epoch_loss / step;
        spdlog::info("Epoch {} completed. Average loss: {:.4f}", epoch + 1, avg_loss);
    }
    // ========================================
    // 6. Export Trained Adapter
    // ========================================
    spdlog::info("\n=== Exporting Trained Adapter ===");

    auto weights = model.exportLoRAWeights();
    spdlog::info("Exported LoRA weights:");
    spdlog::info("  Number of layers: {}", weights.size());

    for (const auto& [layer_name, weight_pair] : weights) {
        const auto& B = weight_pair.first;
        const auto& A = weight_pair.second;
        spdlog::info("  Layer: {}", layer_name);
        spdlog::info("    B matrix: {} elements", B.size());
        spdlog::info("    A matrix: {} elements", A.size());
    }

    // In production, you would save these weights:
    // - To file (safetensors, GGUF, etc.)
    // - To ThemisDB blob store
    // - Along with metadata (hyperparameters, training stats, etc.)
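    //
    // A minimal, format-agnostic sketch (assuming the exported matrices are
    // contiguous float vectors; this is NOT the project's serialization
    // format):
    //
    //   #include <fstream>  // would go at the top of the file
    //
    //   std::ofstream out("adapter.bin", std::ios::binary);
    //   for (const auto& [name, bw] : weights) {
    //       const auto& [B, A] = bw;
    //       out.write(reinterpret_cast<const char*>(B.data()),
    //                 B.size() * sizeof(float));
    //       out.write(reinterpret_cast<const char*>(A.data()),
    //                 A.size() * sizeof(float));
    //   }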
spdlog::info("\n=== Training Complete ===");
spdlog::info("Next steps:");
spdlog::info("1. Save adapter weights to file");
spdlog::info("2. Load adapter for inference");
spdlog::info("3. Evaluate on validation set");
spdlog::info("4. Generate sample outputs");
return 0;
}