Merge remote-tracking branch 'remotes/nodchip/master' into trainer

2025-12-24 19:16:49 +08:00 · 2020-09-23 19:13:07 +08:00
parent 5be8b573be 2931463d3a
commit 9827411b7c
18 changed files with 253 additions and 570 deletions
--- a/src/nnue/evaluate_nnue_learner.cpp
+++ b/src/nnue/evaluate_nnue_learner.cpp
@@ -5,15 +5,12 @@
 #include <filesystem>

 #include "../learn/learn.h"
-#include "../learn/learning_tools.h"

 #include "../position.h"
 #include "../uci.h"
 #include "../misc.h"
 #include "../thread_win32_osx.h"

-#include "../eval/evaluate_common.h"
-
 #include "evaluate_nnue.h"
 #include "evaluate_nnue_learner.h"
 #include "trainer/features/factorizer_feature_set.h"
@@ -24,215 +21,191 @@
 #include "trainer/trainer_clipped_relu.h"
 #include "trainer/trainer_sum.h"

-namespace Eval {
-
-namespace NNUE {
-
-namespace {
-
-// learning data
-std::vector<Example> examples;
-
-// Mutex for exclusive control of examples
-std::mutex examples_mutex;
-
-// number of samples in mini-batch
-uint64_t batch_size;
-
-// random number generator
-std::mt19937 rng;
-
-// learner
-std::shared_ptr<Trainer<Network>> trainer;
-
 // Learning rate scale
-double global_learning_rate_scale;
+double global_learning_rate;

-// Get the learning rate scale
-double GetGlobalLearningRateScale() {
-  return global_learning_rate_scale;
-}
+namespace Eval::NNUE {

-// Tell the learner options such as hyperparameters
-void SendMessages(std::vector<Message> messages) {
-  for (auto& message : messages) {
-    trainer->SendMessage(&message);
-    assert(message.num_receivers > 0);
-  }
-}
+  namespace {

-}  // namespace
+    // learning data
+    std::vector<Example> examples;

-// Initialize learning
-void InitializeTraining(double eta1, uint64_t eta1_epoch,
-                        double eta2, uint64_t eta2_epoch, double eta3) {
-  std::cout << "Initializing NN training for "
-            << GetArchitectureString() << std::endl;
+    // Mutex for exclusive control of examples
+    std::mutex examples_mutex;

-  assert(feature_transformer);
-  assert(network);
-  trainer = Trainer<Network>::Create(network.get(), feature_transformer.get());
+    // number of samples in mini-batch
+    uint64_t batch_size;

-  if (Options["SkipLoadingEval"]) {
-    trainer->Initialize(rng);
-  }
+    // random number generator
+    std::mt19937 rng;

-  global_learning_rate_scale = 1.0;
-  EvalLearningTools::Weight::init_eta(eta1, eta2, eta3, eta1_epoch, eta2_epoch);
-}
+    // learner
+    std::shared_ptr<Trainer<Network>> trainer;

-// set the number of samples in the mini-batch
-void SetBatchSize(uint64_t size) {
-  assert(size > 0);
-  batch_size = size;
-}
-
-// set the learning rate scale
-void SetGlobalLearningRateScale(double scale) {
-  global_learning_rate_scale = scale;
-}
-
-// Set options such as hyperparameters
-void SetOptions(const std::string& options) {
-  std::vector<Message> messages;
-  for (const auto& option : Split(options, ',')) {
-    const auto fields = Split(option, '=');
-    assert(fields.size() == 1 || fields.size() == 2);
-    if (fields.size() == 1) {
-      messages.emplace_back(fields[0]);
-    } else {
-      messages.emplace_back(fields[0], fields[1]);
-    }
-  }
-  SendMessages(std::move(messages));
-}
-
-// Reread the evaluation function parameters for learning from the file
-void RestoreParameters(const std::string& dir_name) {
-  const std::string file_name = Path::Combine(dir_name, NNUE::savedfileName);
-  std::ifstream stream(file_name, std::ios::binary);
-#ifndef NDEBUG
-  bool result =
-#endif
-  ReadParameters(stream);
-#ifndef NDEBUG
-  assert(result);
-#endif
-
-  SendMessages({{"reset"}});
-}
-
-void FinalizeNet() {
-  SendMessages({{"clear_unobserved_feature_weights"}});
-}
-
-// Add 1 sample of learning data
-void AddExample(Position& pos, Color rootColor,
-                const Learner::PackedSfenValue& psv, double weight) {
-  Example example;
-  if (rootColor == pos.side_to_move()) {
-    example.sign = 1;
-  } else {
-    example.sign = -1;
-  }
-  example.psv = psv;
-  example.weight = weight;
-
-  Features::IndexList active_indices[2];
-  for (const auto trigger : kRefreshTriggers) {
-    RawFeatures::AppendActiveIndices(pos, trigger, active_indices);
-  }
-  if (pos.side_to_move() != WHITE) {
-    active_indices[0].swap(active_indices[1]);
-  }
-  for (const auto color : Colors) {
-    std::vector<TrainingFeature> training_features;
-    for (const auto base_index : active_indices[color]) {
-      static_assert(Features::Factorizer<RawFeatures>::GetDimensions() <
-                    (1 << TrainingFeature::kIndexBits), "");
-      Features::Factorizer<RawFeatures>::AppendTrainingFeatures(
-          base_index, &training_features);
-    }
-    std::sort(training_features.begin(), training_features.end());
-
-    auto& unique_features = example.training_features[color];
-    for (const auto& feature : training_features) {
-      if (!unique_features.empty() &&
-          feature.GetIndex() == unique_features.back().GetIndex()) {
-        unique_features.back() += feature;
-      } else {
-        unique_features.push_back(feature);
+    // Tell the learner options such as hyperparameters
+    void SendMessages(std::vector<Message> messages) {
+      for (auto& message : messages) {
+        trainer->SendMessage(&message);
+        assert(message.num_receivers > 0);
      }
    }
+
+  }  // namespace
+
+  // Initialize learning
+  void InitializeTraining(const std::string& seed) {
+    std::cout << "Initializing NN training for "
+              << GetArchitectureString() << std::endl;
+
+    assert(feature_transformer);
+    assert(network);
+    trainer = Trainer<Network>::Create(network.get(), feature_transformer.get());
+    rng.seed(PRNG(seed).rand<uint64_t>());
+
+    if (Options["SkipLoadingEval"]) {
+      trainer->Initialize(rng);
+    }
  }

-  std::lock_guard<std::mutex> lock(examples_mutex);
-  examples.push_back(std::move(example));
-}
+  // set the number of samples in the mini-batch
+  void SetBatchSize(uint64_t size) {
+    assert(size > 0);
+    batch_size = size;
+  }
+  
+  // Set options such as hyperparameters
+  void SetOptions(const std::string& options) {
+    std::vector<Message> messages;
+    for (const auto& option : Split(options, ',')) {
+      const auto fields = Split(option, '=');
+      assert(fields.size() == 1 || fields.size() == 2);
+      if (fields.size() == 1) {
+        messages.emplace_back(fields[0]);
+      } else {
+        messages.emplace_back(fields[0], fields[1]);
+      }
+    }
+    SendMessages(std::move(messages));
+  }

-// update the evaluation function parameters
-void UpdateParameters(uint64_t epoch) {
-  assert(batch_size > 0);
+  // Reread the evaluation function parameters for learning from the file
+  void RestoreParameters(const std::string& dir_name) {
+    const std::string file_name = Path::Combine(dir_name, NNUE::savedfileName);
+    std::ifstream stream(file_name, std::ios::binary);
+#ifndef NDEBUG
+    bool result =
+#endif
+    ReadParameters(stream);
+#ifndef NDEBUG
+    assert(result);
+#endif

-  EvalLearningTools::Weight::calc_eta(epoch);
-  const auto learning_rate = static_cast<LearnFloatType>(
-      get_eta() / batch_size);
+    SendMessages({{"reset"}});
+  }

-  std::lock_guard<std::mutex> lock(examples_mutex);
-  std::shuffle(examples.begin(), examples.end(), rng);
-  while (examples.size() >= batch_size) {
-    std::vector<Example> batch(examples.end() - batch_size, examples.end());
-    examples.resize(examples.size() - batch_size);
+  void FinalizeNet() {
+    SendMessages({{"clear_unobserved_feature_weights"}});
+  }

-    const auto network_output = trainer->Propagate(batch);
+  // Add 1 sample of learning data
+  void AddExample(Position& pos, Color rootColor,
+                  const Learner::PackedSfenValue& psv, double weight) {
+    Example example;
+    if (rootColor == pos.side_to_move()) {
+      example.sign = 1;
+    } else {
+      example.sign = -1;
+    }
+    example.psv = psv;
+    example.weight = weight;

-    std::vector<LearnFloatType> gradients(batch.size());
-    for (std::size_t b = 0; b < batch.size(); ++b) {
-      const auto shallow = static_cast<Value>(Round<std::int32_t>(
-          batch[b].sign * network_output[b] * kPonanzaConstant));
-      const auto& psv = batch[b].psv;
-      const double gradient = batch[b].sign * Learner::calc_grad(shallow, psv);
-      gradients[b] = static_cast<LearnFloatType>(gradient * batch[b].weight);
+    Features::IndexList active_indices[2];
+    for (const auto trigger : kRefreshTriggers) {
+      RawFeatures::AppendActiveIndices(pos, trigger, active_indices);
+    }
+    if (pos.side_to_move() != WHITE) {
+      active_indices[0].swap(active_indices[1]);
+    }
+    for (const auto color : Colors) {
+      std::vector<TrainingFeature> training_features;
+      for (const auto base_index : active_indices[color]) {
+        static_assert(Features::Factorizer<RawFeatures>::GetDimensions() <
+                      (1 << TrainingFeature::kIndexBits), "");
+        Features::Factorizer<RawFeatures>::AppendTrainingFeatures(
+            base_index, &training_features);
+      }
+      std::sort(training_features.begin(), training_features.end());
+
+      auto& unique_features = example.training_features[color];
+      for (const auto& feature : training_features) {
+        if (!unique_features.empty() &&
+            feature.GetIndex() == unique_features.back().GetIndex()) {
+          unique_features.back() += feature;
+        } else {
+          unique_features.push_back(feature);
+        }
+      }
    }

-    trainer->Backpropagate(gradients.data(), learning_rate);
+    std::lock_guard<std::mutex> lock(examples_mutex);
+    examples.push_back(std::move(example));
  }
-  SendMessages({{"quantize_parameters"}});
-}

-// Check if there are any problems with learning
-void CheckHealth() {
-  SendMessages({{"check_health"}});
-}
+  // update the evaluation function parameters
+  void UpdateParameters() {
+    assert(batch_size > 0);

-}  // namespace NNUE
+    const auto learning_rate = static_cast<LearnFloatType>(
+        global_learning_rate / batch_size);

-// save merit function parameters to a file
-void save_eval(std::string dir_name) {
-  auto eval_dir = Path::Combine(Options["EvalSaveDir"], dir_name);
-  std::cout << "save_eval() start. folder = " << eval_dir << std::endl;
+    std::lock_guard<std::mutex> lock(examples_mutex);
+    std::shuffle(examples.begin(), examples.end(), rng);
+    while (examples.size() >= batch_size) {
+      std::vector<Example> batch(examples.end() - batch_size, examples.end());
+      examples.resize(examples.size() - batch_size);

-  // mkdir() will fail if this folder already exists, but
-  // Apart from that. If not, I just want you to make it.
-  // Also, assume that the folders up to EvalSaveDir have been dug.
-  std::filesystem::create_directories(eval_dir);
+      const auto network_output = trainer->Propagate(batch);

-  const std::string file_name = Path::Combine(eval_dir, NNUE::savedfileName);
-  std::ofstream stream(file_name, std::ios::binary);
+      std::vector<LearnFloatType> gradients(batch.size());
+      for (std::size_t b = 0; b < batch.size(); ++b) {
+        const auto shallow = static_cast<Value>(Round<std::int32_t>(
+            batch[b].sign * network_output[b] * kPonanzaConstant));
+        const auto& psv = batch[b].psv;
+        const double gradient = batch[b].sign * Learner::calc_grad(shallow, psv);
+        gradients[b] = static_cast<LearnFloatType>(gradient * batch[b].weight);
+      }
+
+      trainer->Backpropagate(gradients.data(), learning_rate);
+    }
+    SendMessages({{"quantize_parameters"}});
+  }
+
+  // Check if there are any problems with learning
+  void CheckHealth() {
+    SendMessages({{"check_health"}});
+  }
+
+  // save evaluation function parameters to a file
+  void save_eval(std::string dir_name) {
+    auto eval_dir = Path::Combine(Options["EvalSaveDir"], dir_name);
+    std::cout << "save_eval() start. folder = " << eval_dir << std::endl;
+
+    // Create the folder if it does not exist yet; create_directories()
+    // does not treat an already existing folder as an error.
+    // Missing parent folders (up to EvalSaveDir) are created as well.
+    std::filesystem::create_directories(eval_dir);
+
+    const std::string file_name = Path::Combine(eval_dir, NNUE::savedfileName);
+    std::ofstream stream(file_name, std::ios::binary);
 #ifndef NDEBUG
-  bool result =
+    bool result =
 #endif
-  NNUE::WriteParameters(stream);
+    WriteParameters(stream);
 #ifndef NDEBUG
-  assert(result);
+    assert(result);
 #endif

-  std::cout << "save_eval() finished. folder = " << eval_dir << std::endl;
-}
-
-// get the current eta
-double get_eta() {
-  return NNUE::GetGlobalLearningRateScale() * EvalLearningTools::Weight::eta;
-}
-
-}  // namespace Eval
+    std::cout << "save_eval() finished. folder = " << eval_dir << std::endl;
+  }
+}  // namespace Eval::NNUE