Add new library for ML stuff & a neural net implementation

2022-01-19 19:22:46 +03:00 · 2022-01-19 19:22:46 +03:00 · b2fea97c8f
commit b2fea97c8f
parent 889fce973b
7 changed files with 267 additions and 0 deletions
--- a/libs/ml/CMakeLists.txt
+++ b/libs/ml/CMakeLists.txt
@ -0,0 +1,6 @@
+# Collect the library's headers and implementation files, with paths
+#   relative to this directory
+file(GLOB_RECURSE PSEMEK_ML_HEADERS RELATIVE "${CMAKE_CURRENT_SOURCE_DIR}" "include/*.hpp")
+file(GLOB_RECURSE PSEMEK_ML_SOURCES RELATIVE "${CMAKE_CURRENT_SOURCE_DIR}" "source/*.cpp")
+
+# psemek_add_library is a project helper defined outside this file
+psemek_add_library(psemek-ml ${PSEMEK_ML_HEADERS} ${PSEMEK_ML_SOURCES})
+# PUBLIC: the include directory and the linked libraries propagate to consumers of psemek-ml
+target_include_directories(psemek-ml PUBLIC "${CMAKE_CURRENT_SOURCE_DIR}/include")
+target_link_libraries(psemek-ml PUBLIC psemek-util psemek-geom psemek-random)
--- a/libs/ml/include/psemek/ml/activation.hpp
+++ b/libs/ml/include/psemek/ml/activation.hpp
@ -0,0 +1,55 @@
+#pragma once
+
+#include <cmath>
+#include <exception>
+
+namespace psemek::ml
+{
+
+	// All activation functions are chosen in a way so that the derivative
+	//   can be expressed as a function of the activation function's value, i.e.
+	//   f'(x) = G(f(x)) for some G: R -> R
+	enum class activation_type
+	{
+		sigmoid, // 1 / (1 + exp(-x))
+		tanh,    // hyperbolic tangent
+		relu,    // max(0, x)
+	};
+
+	// Thrown by activation() and activation_derivative() when they are given
+	//   an activation_type value that is not one of the enumerators
+	struct unknown_activation_type
+		: std::exception
+	{
+		// std::exception::what() is a const member function, so only a const
+		//   overload actually overrides it and is reached when the exception
+		//   is caught as std::exception const &
+		char const * what() const noexcept override { return "unknown activation type"; }
+
+		// Non-const overload kept for backward compatibility; it is defined in
+		//   the library's source file and returns the same message
+		char const * what() noexcept;
+	};
+
+	// Evaluates the activation function selected by `type` at the point `x`:
+	//   sigmoid -> 1 / (1 + exp(-x)), tanh -> hyperbolic tangent, relu -> max(0, x)
+	// Throws unknown_activation_type if `type` is not one of the enumerators.
+	template <typename T>
+	T activation(T x, activation_type type)
+	{
+		switch (type) {
+		case activation_type::sigmoid:
+			return T{1} / (T{1} + std::exp(-x));
+		case activation_type::tanh:
+			// Mathematically equal to 2 / (1 + exp(-2x)) - 1, but without
+			//   the cancellation that formula suffers from near zero
+			return std::tanh(x);
+		case activation_type::relu:
+			// Spelled out instead of std::max, which lives in <algorithm>
+			//   (not included by this header)
+			return T{0} < x ? x : T{0};
+		default:
+			throw unknown_activation_type{};
+		}
+	}
+
+	// Derivative of the activation function selected by `type`, computed from
+	//   the function's value: `value` is f(x) as returned by activation(), not x.
+	// Throws unknown_activation_type if `type` is not one of the enumerators.
+	template <typename T>
+	T activation_derivative(T value, activation_type type)
+	{
+		T const zero{0};
+		T const one{1};
+
+		if (type == activation_type::sigmoid)
+			return value * (one - value);
+
+		if (type == activation_type::tanh)
+			return one - value * value;
+
+		if (type == activation_type::relu)
+		{
+			// relu outputs exactly zero on its flat part
+			if (value == zero)
+				return zero;
+			return one;
+		}
+
+		throw unknown_activation_type{};
+	}
+
+}
--- a/libs/ml/include/psemek/ml/neural_net.hpp
+++ b/libs/ml/include/psemek/ml/neural_net.hpp
@ -0,0 +1,109 @@
+#pragma once
+
+#include <psemek/ml/activation.hpp>
+#include <psemek/random/uniform.hpp>
+
+#include <vector>
+#include <exception>
+
+namespace psemek::ml
+{
+
+	// Thrown when a neural net without any layers is requested or used
+	struct empty_neural_net_error
+		: std::exception
+	{
+		// std::exception::what() is a const member function, so only a const
+		//   overload actually overrides it and is reached when the exception
+		//   is caught as std::exception const &
+		char const * what() const noexcept override { return "neural net must have at least a single layer"; }
+
+		// Non-const overload kept for backward compatibility; it is defined in
+		//   the library's source file and returns the same message
+		char const * what() noexcept;
+	};
+
+	namespace detail
+	{
+
+		// Builds the argument pair for the private neural_net proxy constructor:
+		//   the layer sizes themselves plus one copy of `type` per pair of
+		//   adjacent layers.
+		// Throws empty_neural_net_error if `layer_sizes` is empty.
+		inline std::pair<std::vector<std::size_t>, std::vector<activation_type>> make_nn_ctor_args(std::vector<std::size_t> layer_sizes, activation_type type)
+		{
+			if (layer_sizes.empty())
+				throw empty_neural_net_error{};
+
+			// Must be computed before layer_sizes is moved from
+			std::size_t const transition_count = layer_sizes.size() - 1;
+
+			std::pair<std::vector<std::size_t>, std::vector<activation_type>> args;
+			args.second.assign(transition_count, type);
+			args.first = std::move(layer_sizes);
+			return args;
+		}
+
+		// Total number of weights of a fully connected net with the given layer
+		//   sizes: for every pair of adjacent layers, each neuron of the later
+		//   layer has one weight per neuron of the earlier layer plus a bias.
+		// Returns 0 when there are fewer than two layers.
+		inline std::size_t weight_count(std::vector<std::size_t> const & layer_sizes)
+		{
+			std::size_t total = 0;
+			for (std::size_t next = 1; next < layer_sizes.size(); ++next)
+			{
+				std::size_t const inputs_with_bias = layer_sizes[next - 1] + 1;
+				total += inputs_with_bias * layer_sizes[next];
+			}
+			return total;
+		}
+
+	}
+
+	// A fully connected feed-forward neural net: stores the layer sizes, one
+	//   activation type per pair of adjacent layers, and a flat array of weights
+	template <typename T>
+	struct neural_net
+	{
+		// Creates an empty net (no layers, no weights)
+		neural_net() = default;
+		// The constructors below throw empty_neural_net_error if layer_sizes is empty
+		neural_net(std::vector<std::size_t> layer_sizes);
+		neural_net(std::vector<std::size_t> layer_sizes, activation_type type);
+		neural_net(std::vector<std::size_t> layer_sizes, std::vector<activation_type> activation_types);
+
+		// An empty neural net (one without layers) is basically unusable
+		bool empty() const { return layer_sizes_.empty(); }
+
+		// layer_sizes() points to layer_count() values
+		std::size_t layer_count() const { return layer_sizes_.size(); }
+		std::size_t const * layer_sizes() const { return layer_sizes_.data(); }
+
+		// activation_types() points to activation_type_count() values
+		std::size_t activation_type_count() const { return activation_types_.size(); }
+		activation_type const * activation_types() const { return activation_types_.data(); }
+
+		// Weights are stored in a sequential manner, in the order in which they
+		//   appear in evaluation of the neural net, i.e. first come the weights
+		//   between layers 0 and 1 (including the bias) in row-major order, then
+		//   1-2 in row-major order, etc.
+		std::size_t weight_count() const { return weights_.size(); }
+		T const * weights() const { return weights_.data(); }
+		T * weights() { return weights_.data(); }
+
+	private:
+		// NB: weights_ is sized from layer_sizes_ in the constructor, so
+		//   layer_sizes_ has to be declared (and thus initialized) first
+		std::vector<std::size_t> layer_sizes_;
+		std::vector<activation_type> activation_types_;
+		std::vector<T> weights_;
+
+		// proxy constructor to overcome unspecified evaluation order in
+		//   neural_net(std::move(layer_sizes), std::vector{layer_sizes.size(), activation_type::tanh})
+		neural_net(std::pair<std::vector<std::size_t>, std::vector<activation_type>> args);
+
+		// Throws empty_neural_net_error if the net has no layers
+		void assert_nonempty() const
+		{
+			if (empty())
+				throw empty_neural_net_error{};
+		}
+	};
+
+	// Explicit instantiation declarations; the matching definitions are in
+	//   source/neural_net.cpp
+	extern template struct neural_net<float>;
+	extern template struct neural_net<double>;
+
+	// Creates a net with the given layer sizes, using tanh as the activation
+	//   for every pair of adjacent layers
+	template <typename T>
+	neural_net<T>::neural_net(std::vector<std::size_t> layer_sizes)
+		: neural_net(std::move(layer_sizes), activation_type::tanh)
+	{}
+
+	// Creates a net with the given layer sizes, using `type` as the activation
+	//   for every pair of adjacent layers. The arguments are prepared by
+	//   detail::make_nn_ctor_args, which throws empty_neural_net_error
+	//   if layer_sizes is empty.
+	template <typename T>
+	neural_net<T>::neural_net(std::vector<std::size_t> layer_sizes, activation_type type)
+		: neural_net(detail::make_nn_ctor_args(std::move(layer_sizes), type))
+	{}
+
+	// Creates a net with the given layer sizes and activation types; the
+	//   weights are value-initialized, one per connection plus one bias per
+	//   neuron of every layer but the first.
+	// Throws empty_neural_net_error if `layer_sizes` is empty.
+	// NOTE: the size of `activation_types` is not validated here.
+	template <typename T>
+	neural_net<T>::neural_net(std::vector<std::size_t> layer_sizes, std::vector<activation_type> activation_types)
+		// Both parameters are taken by value, so move them instead of copying again
+		: layer_sizes_(std::move(layer_sizes))
+		, activation_types_(std::move(activation_types))
+		// Reads the member, not the moved-from parameter
+		, weights_(detail::weight_count(layer_sizes_))
+	{
+		if (layer_sizes_.empty())
+			throw empty_neural_net_error{};
+	}
+
+	// Private proxy constructor: unpacks the pair and forwards its halves to
+	//   the (layer_sizes, activation_types) constructor
+	template <typename T>
+	neural_net<T>::neural_net(std::pair<std::vector<std::size_t>, std::vector<activation_type>> args)
+		: neural_net(std::move(args.first), std::move(args.second))
+	{}
+
+
+}
--- a/libs/ml/include/psemek/ml/neural_net_evaluator.hpp
+++ b/libs/ml/include/psemek/ml/neural_net_evaluator.hpp
@ -0,0 +1,57 @@
+#pragma once
+
+#include <psemek/ml/neural_net.hpp>
+
+#include <stdexcept>
+
+namespace psemek::ml
+{
+
+	// Thrown by neural_net_evaluator::evaluate when the size of the input
+	//   differs from the size of the net's first layer
+	struct wrong_neural_net_input_size
+		: std::runtime_error
+	{
+		// expected: size of the net's first layer, actual: size of the supplied input
+		wrong_neural_net_input_size(std::size_t expected, std::size_t actual);
+	};
+
+	// A class that stores temporary data to facilitate
+	//   allocation-free multiple evaluations of a neural net
+	// NOTE(review): evaluate() is const but writes to the mutable temp_ buffer,
+	//   so sharing one evaluator between threads is presumably unsafe - confirm
+	template <typename T>
+	struct neural_net_evaluator
+	{
+		// Returns the values of the last layer of nn for the given input
+		std::vector<T> evaluate(neural_net<T> const & nn, std::vector<T> input) const;
+	private:
+		// Scratch buffer for the layer being computed, reused between calls
+		mutable std::vector<T> temp_;
+	};
+
+	// Explicit instantiation declarations; the matching definitions are in
+	//   source/neural_net_evaluator.cpp
+	extern template struct neural_net_evaluator<float>;
+	extern template struct neural_net_evaluator<double>;
+
+	// Feeds `input` through the net layer by layer and returns the values of
+	//   the last layer. The weights are consumed sequentially: for every neuron
+	//   of the next layer first its bias, then one weight per neuron of the
+	//   current layer.
+	// Throws empty_neural_net_error if `nn` has no layers and
+	//   wrong_neural_net_input_size if `input` doesn't match the first layer.
+	template <typename T>
+	std::vector<T> neural_net_evaluator<T>::evaluate(neural_net<T> const & nn, std::vector<T> input) const
+	{
+		// A default-constructed net has no layer 0 to read the size of
+		if (nn.empty())
+			throw empty_neural_net_error{};
+
+		std::size_t const * layer_sizes = nn.layer_sizes();
+		activation_type const * activation_types = nn.activation_types();
+		T const * weights = nn.weights();
+
+		if (layer_sizes[0] != input.size())
+			throw wrong_neural_net_input_size{layer_sizes[0], input.size()};
+
+		for (std::size_t l = 0; l + 1 < nn.layer_count(); ++l)
+		{
+			// The same activation is used for the whole layer
+			activation_type const type = activation_types[l];
+
+			temp_.resize(layer_sizes[l + 1]);
+
+			for (std::size_t i = 0; i < layer_sizes[l + 1]; ++i)
+			{
+				// Bias comes first
+				temp_[i] = *weights++;
+
+				for (std::size_t j = 0; j < layer_sizes[l]; ++j)
+					temp_[i] += (*weights++) * input[j];
+
+				temp_[i] = activation(temp_[i], type);
+			}
+
+			// The freshly computed layer becomes the input of the next one,
+			//   while the old input buffer stays in temp_ for reuse
+			std::swap(temp_, input);
+		}
+
+		return input;
+	}
+}
--- a/libs/ml/source/activation.cpp
+++ b/libs/ml/source/activation.cpp
@ -0,0 +1,11 @@
+#include <psemek/ml/activation.hpp>
+
+namespace psemek::ml
+{
+
+	// Returns a fixed description of the error.
+	// NOTE: this overload is non-const, while std::exception::what() is a
+	//   const member function, so this one does not override it
+	char const * unknown_activation_type::what() noexcept
+	{
+		return "unknown activation type";
+	}
+
+}
--- a/libs/ml/source/neural_net.cpp
+++ b/libs/ml/source/neural_net.cpp
@ -0,0 +1,14 @@
+#include <psemek/ml/neural_net.hpp>
+
+namespace psemek::ml
+{
+
+	// Returns a fixed description of the error.
+	// NOTE: this overload is non-const, while std::exception::what() is a
+	//   const member function, so this one does not override it
+	char const * empty_neural_net_error::what() noexcept
+	{
+		return "neural net must have at least a single layer";
+	}
+
+	// Explicit instantiation definitions matching the extern template
+	//   declarations in psemek/ml/neural_net.hpp
+	template struct neural_net<float>;
+	template struct neural_net<double>;
+
+}
--- a/libs/ml/source/neural_net_evaluator.cpp
+++ b/libs/ml/source/neural_net_evaluator.cpp
@ -0,0 +1,15 @@
+#include <psemek/ml/neural_net_evaluator.hpp>
+
+#include <psemek/util/to_string.hpp>
+
+namespace psemek::ml
+{
+
+	// Builds the error message out of the expected and the actual input sizes
+	wrong_neural_net_input_size::wrong_neural_net_input_size(std::size_t expected, std::size_t actual)
+		: std::runtime_error(util::to_string("wrong neural net input size: expected ", expected, ", got ", actual))
+	{}
+
+	// Explicit instantiation definitions matching the extern template
+	//   declarations in psemek/ml/neural_net_evaluator.hpp
+	template struct neural_net_evaluator<float>;
+	template struct neural_net_evaluator<double>;
+
+}