Cleanup nnue

This commit is contained in:
Tomasz Sobczyk
2020-10-14 21:45:38 +02:00
committed by nodchip
parent c286f9cd7d
commit 497f689aa3
10 changed files with 1003 additions and 970 deletions

@@ -1,18 +1,10 @@
// Code for learning NNUE evaluation function
#include <random>
#include <fstream>
#include <filesystem>
#include "../learn/learn.h"
#include "../position.h"
#include "../uci.h"
#include "../misc.h"
#include "../thread_win32_osx.h"
#include "evaluate_nnue.h"
#include "evaluate_nnue_learner.h"
#include "trainer/features/factorizer_feature_set.h"
#include "trainer/features/factorizer_half_kp.h"
#include "trainer/trainer_feature_transformer.h"
@@ -21,191 +13,207 @@
#include "trainer/trainer_clipped_relu.h"
#include "trainer/trainer_sum.h"
#include "position.h"
#include "uci.h"
#include "misc.h"
#include "thread_win32_osx.h"
#include "learn/learn.h"
// Learning rate scale
double global_learning_rate;
namespace Eval::NNUE {
namespace {
// learning data
std::vector<Example> examples;
// Mutex for exclusive control of examples
std::mutex examples_mutex;
// number of samples in mini-batch
uint64_t batch_size;
// random number generator
std::mt19937 rng;
// learner
std::shared_ptr<Trainer<Network>> trainer;
// Send options such as hyperparameters to the learner as messages
void SendMessages(std::vector<Message> messages) {
for (auto& message : messages) {
trainer->SendMessage(&message);
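// Every message must be consumed by at least one trainer component;
// an unreceived message would indicate an unknown option.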
assert(message.num_receivers > 0);
}
}
} // namespace
// Initialize learning
void InitializeTraining(const std::string& seed) {
std::cout << "Initializing NN training for "
<< GetArchitectureString() << std::endl;
assert(feature_transformer);
assert(network);
trainer = Trainer<Network>::Create(network.get(), feature_transformer.get());
rng.seed(PRNG(seed).rand<uint64_t>());
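// With SkipLoadingEval set, no pre-existing network was loaded, so the
// trainer initializes its weights from scratch with the seeded RNG.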
if (Options["SkipLoadingEval"]) {
trainer->Initialize(rng);
}
}
// set the number of samples in the mini-batch
void SetBatchSize(uint64_t size) {
assert(size > 0);
batch_size = size;
}
// Set options such as hyperparameters
void SetOptions(const std::string& options) {
std::vector<Message> messages;
for (const auto& option : Split(options, ',')) {
const auto fields = Split(option, '=');
assert(fields.size() == 1 || fields.size() == 2);
if (fields.size() == 1) {
messages.emplace_back(fields[0]);
} else {
messages.emplace_back(fields[0], fields[1]);
}
}
SendMessages(std::move(messages));
}
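// Illustrative (hypothetical option names): a call such as
//   SetOptions("eta=0.1,reset");
// splits on ',' and then '=', producing Message("eta", "0.1") and
// Message("reset") for the trainer.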
// Re-read the evaluation function parameters for learning from a file
void RestoreParameters(const std::string& dir_name) {
const std::string file_name = Path::Combine(dir_name, NNUE::savedfileName);
std::ifstream stream(file_name, std::ios::binary);
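// The read result is consumed only by the assert below; the #ifndef
// NDEBUG guards avoid an unused-variable warning in release builds.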
#ifndef NDEBUG
bool result =
#endif
ReadParameters(stream);
#ifndef NDEBUG
assert(result);
#endif
SendMessages({{"reset"}});
}
void FinalizeNet() {
SendMessages({{"clear_unobserved_feature_weights"}});
}
// Add one sample of training data
void AddExample(Position& pos, Color rootColor,
const Learner::PackedSfenValue& psv, double weight) {
Example example;
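// The example is scored from the root color's perspective: sign is +1
// when the root color is to move and -1 otherwise.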
if (rootColor == pos.side_to_move()) {
example.sign = 1;
} else {
example.sign = -1;
}
example.psv = psv;
example.weight = weight;
Features::IndexList active_indices[2];
for (const auto trigger : kRefreshTriggers) {
RawFeatures::AppendActiveIndices(pos, trigger, active_indices);
}
if (pos.side_to_move() != WHITE) {
active_indices[0].swap(active_indices[1]);
}
for (const auto color : Colors) {
std::vector<TrainingFeature> training_features;
for (const auto base_index : active_indices[color]) {
static_assert(Features::Factorizer<RawFeatures>::GetDimensions() <
(1 << TrainingFeature::kIndexBits), "");
Features::Factorizer<RawFeatures>::AppendTrainingFeatures(
base_index, &training_features);
}
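// Sort so that duplicate indices become adjacent, then merge features
// with equal indices via operator+= so each index appears at most once.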
std::sort(training_features.begin(), training_features.end());
auto& unique_features = example.training_features[color];
for (const auto& feature : training_features) {
if (!unique_features.empty() &&
feature.GetIndex() == unique_features.back().GetIndex()) {
unique_features.back() += feature;
} else {
unique_features.push_back(feature);
}
}
}
std::lock_guard<std::mutex> lock(examples_mutex);
examples.push_back(std::move(example));
}
// update the evaluation function parameters
void UpdateParameters() {
assert(batch_size > 0);
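// Scale the step size by 1/batch_size; this suggests gradients are
// summed (not averaged) over the mini-batch in Backpropagate.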
const auto learning_rate = static_cast<LearnFloatType>(
global_learning_rate / batch_size);
std::lock_guard<std::mutex> lock(examples_mutex);
std::shuffle(examples.begin(), examples.end(), rng);
while (examples.size() >= batch_size) {
std::vector<Example> batch(examples.end() - batch_size, examples.end());
examples.resize(examples.size() - batch_size);
const auto network_output = trainer->Propagate(batch);
std::vector<LearnFloatType> gradients(batch.size());
for (std::size_t b = 0; b < batch.size(); ++b) {
const auto shallow = static_cast<Value>(Round<std::int32_t>(
batch[b].sign * network_output[b] * kPonanzaConstant));
const auto& psv = batch[b].psv;
const double gradient = batch[b].sign * Learner::calc_grad(shallow, psv);
gradients[b] = static_cast<LearnFloatType>(gradient * batch[b].weight);
}
trainer->Backpropagate(gradients.data(), learning_rate);
}
SendMessages({{"quantize_parameters"}});
}
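// Typical driver sequence (a sketch; batch size and weight are
// hypothetical values, not taken from this file):
//   SetBatchSize(10000);
//   AddExample(pos, rootColor, psv, 1.0);  // called repeatedly, possibly
//                                          // from multiple threads
//   UpdateParameters();                    // consumes whole mini-batches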
// Check if there are any problems with learning
void CheckHealth() {
SendMessages({{"check_health"}});
}
// Save evaluation function parameters to a file
void save_eval(std::string dir_name) {
auto eval_dir = Path::Combine(Options["EvalSaveDir"], dir_name);
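// Illustrative (hypothetical values): with EvalSaveDir == "evalsave" and
// dir_name == "final", parameters are written to
// "evalsave/final/" + NNUE::savedfileName.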
std::cout << "save_eval() start. folder = " << eval_dir << std::endl;
// Create the output folder if it does not already exist (it is fine if
// it does). Directories up to EvalSaveDir are assumed to exist already.
std::filesystem::create_directories(eval_dir);
const std::string file_name = Path::Combine(eval_dir, NNUE::savedfileName);
std::ofstream stream(file_name, std::ios::binary);
#ifndef NDEBUG
bool result =
#endif
WriteParameters(stream);
#ifndef NDEBUG
assert(result);
#endif
std::cout << "save_eval() finished. folder = " << eval_dir << std::endl;
}
} // namespace Eval::NNUE