No public description

PiperOrigin-RevId: 617315030
2024-03-19 23:35:58 +01:00 · 2024-03-19 23:35:58 +01:00 · ffd02c59ad
parent 7d5364bb80
commit ffd02c59ad
9 changed files with 41 additions and 27 deletions
--- a/.github/workflows/build.yml
+++ b/.github/workflows/build.yml
@@ -72,4 +72,4 @@ jobs:
        with:
          path: ~/.cache/bazel
          key: bazel-${{ runner.os }}
-      - run: bazel build --cxxopt=-std=c++20 //...
+      - run: bazel build -c opt --cxxopt=-std=c++20 //...
--- a/BUILD.bazel
+++ b/BUILD.bazel
@@ -4,9 +4,7 @@
 load("@rules_license//rules:license.bzl", "license")
 package(
-    default_applicable_licenses = [
-        "//:license",  # Placeholder comment, do not modify
-    ],
+    default_applicable_licenses = ["//:license"],
    default_visibility = ["//visibility:public"],
 )
--- a/bazel/BUILD
+++ b/bazel/BUILD
@@ -1,4 +1,3 @@
 # Required for referencing bazel:com_google_sentencepiece.patch
 package(
    default_applicable_licenses = ["//:license"],
    default_visibility = ["//:__subpackages__"],
--- a/compression/BUILD
+++ b/compression/BUILD
@@ -1,12 +1,10 @@
 # Weight compression, I/O and analysis
 package(
-    default_applicable_licenses = [
-        "//:license",  # Placeholder comment, do not modify
-    ],
+    default_applicable_licenses = ["//:license"],
    default_visibility = [
-        # Placeholder for internal visibility,
-        "//:__subpackages__",  # Placeholder, do not modify
+        "//learning/gemini/prod/contrib/gemini_cpp:__subpackages__",
+        "//:__subpackages__",
    ],
 )
--- a/examples/hello_world/run.cc
+++ b/examples/hello_world/run.cc
@@ -17,10 +17,13 @@
 // copybara:import_next_line:gemma_cpp
 #include "gemma.h"
-// copybara:import_next_line:gemma_cpp
+// copybara:end
 #include "util/app.h"  // LoaderArgs
 // copybara:import_next_line:gemma_cpp
 #include "util/args.h"
 // copybara:end
 // copybara:import_next_line:gemma_cpp
 #include "util/app.h" // LoaderArgs
 // copybara:end
 #include "hwy/contrib/thread_pool/thread_pool.h"
 std::vector<int> tokenize(
--- a/gemma.cc
+++ b/gemma.cc
@@ -25,8 +25,6 @@
 #include "compression/compress-inl.h"
 // copybara:import_next_line:gemma_cpp
 #include "ops.h"
 // copybara:import_next_line:gemma_cpp
 #include "util/args.h"  // Path
 #include "hwy/contrib/matvec/matvec-inl.h"
 #include "hwy/highway.h"
 #include "hwy/profiler.h"
@@ -52,8 +50,6 @@
 #include <string>
 #include <vector>
 // Placeholder for internal header, do not modify.
 // copybara:import_next_line:gemma_cpp
 #include "compression/compress.h"
 // copybara:import_next_line:gemma_cpp
@@ -817,9 +813,8 @@ void GemmaImpl<ConfigGemma7B>::Generate(
 }
 Gemma::Gemma(const Path& tokenizer_path, const Path& compressed_weights_path,
-             const Path& weights_path, Model model_type, ModelTraining training,
-             hwy::ThreadPool& pool)
-    : model_training(training) {
+             const Path& weights_path, Model model_type,
+             hwy::ThreadPool& pool) {
  std::unique_ptr<sentencepiece::SentencePieceProcessor> tokenizer;
  {
    PROFILER_ZONE("Startup.tokenizer");
@@ -844,6 +839,11 @@ Gemma::Gemma(const Path& tokenizer_path, const Path& compressed_weights_path,
  }
 }
 Gemma::Gemma(const Path& tokenizer_path, const Path& compressed_weights_path,
             Model model_type, hwy::ThreadPool& pool)
    : Gemma(tokenizer_path, compressed_weights_path, Path{""}, model_type,
            pool) {}
 Gemma::~Gemma() = default;  // after GemmaInterface is defined
 const sentencepiece::SentencePieceProcessor* Gemma::Tokenizer() const {
--- a/gemma.h
+++ b/gemma.h
@@ -16,20 +16,29 @@
 #ifndef THIRD_PARTY_GEMMA_CPP_GEMMA_H_
 #define THIRD_PARTY_GEMMA_CPP_GEMMA_H_
 #include <algorithm>
 #include <cctype>
 #include <functional>
 #include <memory>
 #include <random>
 #include <string>
 #include <vector>
 // copybara:import_next_line:gemma_cpp
 #include "compression/compress.h"  // SfpStream/NuqStream
 // copybara:end
 // copybara:import_next_line:gemma_cpp
-#include "util/args.h"             // Path
+#include "configs.h"  // kSeqLen
 // copybara:end
 // copybara:import_next_line:gemma_cpp
 #include "util/args.h"  // ArgsBase
 // copybara:end
 #include "hwy/aligned_allocator.h"
 #include "hwy/base.h"  // hwy::bfloat16_t
 #include "hwy/contrib/thread_pool/thread_pool.h"
 // copybara:import_next_line:sentencepiece
 #include "src/sentencepiece_processor.h"
 // copybara:end
 namespace gcpp {
@@ -66,8 +75,9 @@ struct GemmaInterface;
 struct Gemma {
  Gemma(const Path& tokenizer_path, const Path& compressed_weights_path,
-        const Path& weights_path, Model model_type, ModelTraining training,
-        hwy::ThreadPool& pool);
+        const Path& weights_path, Model model_type, hwy::ThreadPool& pool);
+  Gemma(const Path& tokenizer_path, const Path& compressed_weights_path,
+        Model model_type, hwy::ThreadPool& pool);
  ~Gemma();  // must be defined after GemmaInterface's dtor is defined.
  const sentencepiece::SentencePieceProcessor* Tokenizer() const;
  std::unique_ptr<GemmaInterface> impl_;
--- a/run.cc
+++ b/run.cc
@@ -22,15 +22,18 @@
 #include <thread>  // NOLINT
 #include <vector>
 // Placeholder for internal header, do not modify.
 // copybara:import_next_line:gemma_cpp
 #include "compression/compress.h"
 // copybara:end
 // copybara:import_next_line:gemma_cpp
 #include "gemma.h"  // Gemma
 // copybara:end
 // copybara:import_next_line:gemma_cpp
 #include "util/app.h"
 // copybara:end
 // copybara:import_next_line:gemma_cpp
 #include "util/args.h"  // HasHelp
 // copybara:end
 #include "hwy/base.h"
 #include "hwy/contrib/thread_pool/thread_pool.h"
 #include "hwy/highway.h"
@@ -231,8 +234,8 @@ void Run(LoaderArgs& loader, InferenceArgs& inference, AppArgs& app) {
             [](uint64_t /*task*/, size_t thread) { PinThreadToCore(thread); });
  }
-  gcpp::Gemma model(loader.tokenizer, loader.compressed_weights, loader.weights,
-                    loader.ModelType(), loader.ModelTraining(), pool);
+  gcpp::Gemma model(loader.tokenizer, loader.compressed_weights,
+                    loader.ModelType(), pool);
  auto kv_cache = CreateKVCache(loader.ModelType());
@@ -274,8 +277,6 @@ int main(int argc, char** argv) {
  {
    PROFILER_ZONE("Startup.misc");
    // Placeholder for internal init, do not modify.
    gcpp::LoaderArgs loader(argc, argv);
    gcpp::InferenceArgs inference(argc, argv);
    gcpp::AppArgs app(argc, argv);
--- a/util/app.h
+++ b/util/app.h
@@ -34,10 +34,15 @@
 // copybara:import_next_line:gemma_cpp
 #include "configs.h"
 // copybara:end
 // copybara:import_next_line:gemma_cpp
 #include "gemma.h"
 // copybara:end
 // copybara:import_next_line:gemma_cpp
 #include "util/args.h"
 // copybara:end
 #include "hwy/base.h"  // HWY_ASSERT
 namespace gcpp {