Fix msan error, uninitialized model_training

This arose when LoaderArgs was unpacked into individual ctor args: the ctor taking individual arguments never set the model_training member. Probably better to pass LoaderArgs in and have only a single ctor, to reduce confusion; a sketch of that alternative follows the change summary below.

Also fix includes.

PiperOrigin-RevId: 617386447
Jan Wassenberg 2024-03-20 05:12:06 +01:00
parent 52940d435f
commit f8baac80f9
3 changed files with 9 additions and 8 deletions
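
The single-ctor alternative suggested in the message above, sketched minimally in C++: the whole LoaderArgs is passed in, so every member, including model_training, is set in one initializer list. Everything below is a stand-in for illustration only; the enumerators, the LoaderArgs fields and accessors (Training() in particular), and the omission of the hwy::ThreadPool parameter are assumptions, not the repo's actual API.

// Sketch only. Stand-ins for the real Model/ModelTraining (configs.h) and
// LoaderArgs (run.cc); enumerators and accessor names are illustrative.
#include <string>

namespace gcpp {

enum class Model { GEMMA_2B, GEMMA_7B };
enum class ModelTraining { GEMMA_IT, GEMMA_PT };

struct LoaderArgs {
  std::string tokenizer, compressed_weights, weights;
  Model ModelType() const { return Model::GEMMA_2B; }  // stand-in accessor
  ModelTraining Training() const { return ModelTraining::GEMMA_IT; }
};

class Gemma {
 public:
  // One ctor taking LoaderArgs: every member, including model_training, is
  // set in a single initializer list, so a newly added field cannot be left
  // uninitialized the way the msan report caught. (The hwy::ThreadPool&
  // parameter of the real ctor is omitted to keep the sketch standalone.)
  explicit Gemma(const LoaderArgs& loader)
      : model_type_(loader.ModelType()), model_training_(loader.Training()) {
    // Tokenizer and weights would be loaded from loader.tokenizer,
    // loader.compressed_weights and loader.weights here.
  }

  Model Type() const { return model_type_; }
  ModelTraining Training() const { return model_training_; }

 private:
  Model model_type_;
  ModelTraining model_training_;  // the member that was left uninitialized
};

}  // namespace gcpp

The point is structural: with a single ctor there is exactly one place where members are initialized, so gaps like this one cannot appear silently when a new field is added.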

gemma.cc

@@ -25,6 +25,8 @@
 #include "compression/compress-inl.h"
 // copybara:import_next_line:gemma_cpp
 #include "ops.h"
+// copybara:import_next_line:gemma_cpp
+#include "util/args.h" // Path
 #include "hwy/contrib/matvec/matvec-inl.h"
 #include "hwy/highway.h"
 #include "hwy/profiler.h"
@@ -818,8 +820,9 @@ void GemmaImpl<ConfigGemma7B>::Generate(
 }
 
 Gemma::Gemma(const Path& tokenizer_path, const Path& compressed_weights_path,
-             const Path& weights_path, Model model_type,
-             hwy::ThreadPool& pool) {
+             const Path& weights_path, Model model_type, ModelTraining training,
+             hwy::ThreadPool& pool)
+    : model_training(training) {
   std::unique_ptr<sentencepiece::SentencePieceProcessor> tokenizer;
   {
     PROFILER_ZONE("Startup.tokenizer");

gemma.h

@@ -16,12 +16,9 @@
 #ifndef THIRD_PARTY_GEMMA_CPP_GEMMA_H_
 #define THIRD_PARTY_GEMMA_CPP_GEMMA_H_
 
-#include <algorithm>
-#include <cctype>
 #include <functional>
 #include <memory>
 #include <random>
-#include <string>
 #include <vector>
 
 // copybara:import_next_line:gemma_cpp
@@ -31,7 +28,7 @@
 #include "configs.h" // kSeqLen
 // copybara:end
 // copybara:import_next_line:gemma_cpp
-#include "util/args.h" // ArgsBase
+#include "util/args.h" // Path
 // copybara:end
 #include "hwy/aligned_allocator.h"
 #include "hwy/base.h" // hwy::bfloat16_t
@@ -75,7 +72,8 @@ struct GemmaInterface;
 
 struct Gemma {
   Gemma(const Path& tokenizer_path, const Path& compressed_weights_path,
-        const Path& weights_path, Model model_type, hwy::ThreadPool& pool);
+        const Path& weights_path, Model model_type, ModelTraining training,
+        hwy::ThreadPool& pool);
   ~Gemma(); // must be defined after GemmaInterface's dtor is defined.
   const sentencepiece::SentencePieceProcessor* Tokenizer() const;
   std::unique_ptr<GemmaInterface> impl_;

run.cc

@@ -236,7 +236,7 @@ void Run(LoaderArgs& loader, InferenceArgs& inference, AppArgs& app) {
   }
 
   gcpp::Gemma model(loader.tokenizer, loader.compressed_weights, loader.weights,
-                    loader.ModelType(), pool);
+                    loader.ModelType(), loader.ModelTraining(), pool);
   auto kv_cache = CreateKVCache(loader.ModelType());
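
Under the hypothetical single-ctor API sketched after the change summary above, this call site would no longer unpack loader field by field; it would reduce to roughly the following (the thread-pool argument, omitted from that sketch, would stay):

gcpp::Gemma model(loader, pool);
auto kv_cache = CreateKVCache(loader.ModelType());

That is an assumption about a possible follow-up; this commit keeps the unpacked-argument ctor and simply threads ModelTraining through it.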