Updated and renamed classes for custom module

This commit is contained in:
Alejandro Saucedo 2020-09-27 15:08:04 +01:00
parent 8959d90fa6
commit 104d7e8a6b
6 changed files with 207 additions and 85 deletions

View file

@ -5,73 +5,138 @@
#include "KomputeModelMLNode.h"
KomputeModelMLNode::KomputeModelMLNode() {
std::cout << "CALLING CONSTRUCTOR" << std::endl;
this->_init();
}
void KomputeModelMLNode::add(float value) {
// Set the new data in the local device
this->mSecondaryTensor->setData({value});
// Execute recorded sequence
if (std::shared_ptr<kp::Sequence> sq = this->mSequence.lock()) {
sq->eval();
void KomputeModelMLNode::train(Array yArr, Array xIArr, Array xJArr) {
assert(yArr.size() == xIArr.size());
assert(xIArr.size() == xJArr.size());
std::vector<float> yData;
std::vector<float> xIData;
std::vector<float> xJData;
std::vector<float> zerosData;
for (size_t i = 0; i < yArr.size(); i++) {
yData.push_back(yArr[i]);
xIData.push_back(xIArr[i]);
xJData.push_back(xJArr[i]);
zerosData.push_back(0);
}
else {
throw std::runtime_error("Sequence pointer no longer available");
uint32_t ITERATIONS = 100;
float learningRate = 0.1;
std::shared_ptr<kp::Tensor> xI{ new kp::Tensor(xIData) };
std::shared_ptr<kp::Tensor> xJ{ new kp::Tensor(xJData) };
std::shared_ptr<kp::Tensor> y{ new kp::Tensor(yData) };
std::shared_ptr<kp::Tensor> wIn{ new kp::Tensor({ 0.001, 0.001 }) };
std::shared_ptr<kp::Tensor> wOutI{ new kp::Tensor(zerosData) };
std::shared_ptr<kp::Tensor> wOutJ{ new kp::Tensor(zerosData) };
std::shared_ptr<kp::Tensor> bIn{ new kp::Tensor({ 0 }) };
std::shared_ptr<kp::Tensor> bOut{ new kp::Tensor(zerosData) };
std::shared_ptr<kp::Tensor> lOut{ new kp::Tensor(zerosData) };
std::vector<std::shared_ptr<kp::Tensor>> params = { xI, xJ, y,
wIn, wOutI, wOutJ,
bIn, bOut, lOut };
{
kp::Manager mgr;
if (std::shared_ptr<kp::Sequence> sq =
mgr.getOrCreateManagedSequence("createTensors").lock()) {
sq->begin();
sq->record<kp::OpTensorCreate>(params);
sq->end();
sq->eval();
// Record op algo base
sq->begin();
sq->record<kp::OpTensorSyncDevice>({ wIn, bIn });
sq->record<kp::OpAlgoBase<>>(
params, std::vector<char>(LR_SHADER.begin(), LR_SHADER.end()));
sq->record<kp::OpTensorSyncLocal>({ wOutI, wOutJ, bOut, lOut });
sq->end();
// Iterate across all expected iterations
for (size_t i = 0; i < ITERATIONS; i++) {
sq->eval();
for (size_t j = 0; j < bOut->size(); j++) {
wIn->data()[0] -= learningRate * wOutI->data()[j];
wIn->data()[1] -= learningRate * wOutJ->data()[j];
bIn->data()[0] -= learningRate * bOut->data()[j];
}
}
}
}
SPDLOG_INFO("RESULT: <<<<<<<<<<<<<<<<<<<");
SPDLOG_INFO(wIn->data()[0]);
SPDLOG_INFO(wIn->data()[1]);
SPDLOG_INFO(bIn->data()[0]);
this->mWeights = kp::Tensor(wIn->data());
this->mBias = kp::Tensor(bIn->data());
}
void KomputeModelMLNode::reset() {
Array KomputeModelMLNode::predict(Array xI, Array xJ) {
assert(xI.size() == xJ.size());
Array retArray;
// We run the inference in the CPU for simplicity
// BUt you can also implement the inference on GPU
// GPU implementation would speed up minibatching
for (size_t i = 0; i < xI.size(); i++) {
float xIVal = xI[i];
float xJVal = xJ[i];
float result = (xIVal * this->mWeights.data()[0]
+ xJVal * this->mWeights.data()[1]
+ this->mBias.data()[0]);
// Instead of using sigmoid we'll just return full numbers
Variant var = result > 0 ? 1 : 0;
retArray.push_back(var);
}
return retArray;
}
float KomputeModelMLNode::get_total() const {
return this->mPrimaryTensor->data()[0];
Array KomputeModelMLNode::get_params() {
Array retArray;
SPDLOG_INFO(this->mWeights.size() + this->mBias.size());
if(this->mWeights.size() + this->mBias.size() == 0) {
return retArray;
}
retArray.push_back(this->mWeights.data()[0]);
retArray.push_back(this->mWeights.data()[1]);
retArray.push_back(this->mBias.data()[0]);
retArray.push_back(99.0);
return retArray;
}
void KomputeModelMLNode::_init() {
std::cout << "CALLING INIT" << std::endl;
this->mPrimaryTensor = this->mManager.buildTensor({ 0.0 });
this->mSecondaryTensor = this->mManager.buildTensor({ 0.0 });
this->mSequence = this->mManager.getOrCreateManagedSequence("AdditionSeq");
// We now record the steps in the sequence
if (std::shared_ptr<kp::Sequence> sq = this->mSequence.lock())
{
std::string shader(R"(
#version 450
layout (local_size_x = 1) in;
layout(set = 0, binding = 0) buffer a { float pa[]; };
layout(set = 0, binding = 1) buffer b { float pb[]; };
void main() {
uint index = gl_GlobalInvocationID.x;
pa[index] = pb[index] + pa[index];
}
)");
sq->begin();
// First we ensure secondary tensor loads to GPU
// No need to sync the primary tensor as it should not be changed
sq->record<kp::OpTensorSyncDevice>(
{ this->mSecondaryTensor });
// Then we run the operation with both tensors
sq->record<kp::OpAlgoBase<>>(
{ this->mPrimaryTensor, this->mSecondaryTensor },
std::vector<char>(shader.begin(), shader.end()));
// We map the result back to local
sq->record<kp::OpTensorSyncLocal>(
{ this->mPrimaryTensor });
sq->end();
}
else {
throw std::runtime_error("Sequence pointer no longer available");
}
}
void KomputeModelMLNode::_process(float delta) {
@ -82,8 +147,8 @@ void KomputeModelMLNode::_bind_methods() {
ClassDB::bind_method(D_METHOD("_process", "delta"), &KomputeModelMLNode::_process);
ClassDB::bind_method(D_METHOD("_init"), &KomputeModelMLNode::_init);
ClassDB::bind_method(D_METHOD("add", "value"), &KomputeModelMLNode::add);
ClassDB::bind_method(D_METHOD("reset"), &KomputeModelMLNode::reset);
ClassDB::bind_method(D_METHOD("get_total"), &KomputeModelMLNode::get_total);
ClassDB::bind_method(D_METHOD("train", "yArr", "xIArr", "xJArr"), &KomputeModelMLNode::train);
ClassDB::bind_method(D_METHOD("predict", "xI", "xJ"), &KomputeModelMLNode::predict);
ClassDB::bind_method(D_METHOD("get_params"), &KomputeModelMLNode::get_params);
}

View file

@ -12,9 +12,11 @@ class KomputeModelMLNode : public Node {
public:
KomputeModelMLNode();
void add(float value);
void reset();
float get_total() const;
void train(Array y, Array xI, Array xJ);
Array predict(Array xI, Array xJ);
Array get_params();
void _process(float delta);
void _init();
@ -23,9 +25,64 @@ protected:
static void _bind_methods();
private:
kp::Manager mManager;
std::weak_ptr<kp::Sequence> mSequence;
std::shared_ptr<kp::Tensor> mPrimaryTensor;
std::shared_ptr<kp::Tensor> mSecondaryTensor;
kp::Tensor mWeights;
kp::Tensor mBias;
};
static std::string LR_SHADER = R"(
#version 450
layout (constant_id = 0) const uint M = 0;
layout (local_size_x = 1) in;
layout(set = 0, binding = 0) buffer bxi { float xi[]; };
layout(set = 0, binding = 1) buffer bxj { float xj[]; };
layout(set = 0, binding = 2) buffer by { float y[]; };
layout(set = 0, binding = 3) buffer bwin { float win[]; };
layout(set = 0, binding = 4) buffer bwouti { float wouti[]; };
layout(set = 0, binding = 5) buffer bwoutj { float woutj[]; };
layout(set = 0, binding = 6) buffer bbin { float bin[]; };
layout(set = 0, binding = 7) buffer bbout { float bout[]; };
layout(set = 0, binding = 8) buffer blout { float lout[]; };
float m = float(M);
float sigmoid(float z) {
return 1.0 / (1.0 + exp(-z));
}
float inference(vec2 x, vec2 w, float b) {
// Compute the linear mapping function
float z = dot(w, x) + b;
// Calculate the y-hat with sigmoid
float yHat = sigmoid(z);
return yHat;
}
float calculateLoss(float yHat, float y) {
return -(y * log(yHat) + (1.0 - y) * log(1.0 - yHat));
}
void main() {
uint idx = gl_GlobalInvocationID.x;
vec2 wCurr = vec2(win[0], win[1]);
float bCurr = bin[0];
vec2 xCurr = vec2(xi[idx], xj[idx]);
float yCurr = y[idx];
float yHat = inference(xCurr, wCurr, bCurr);
float dZ = yHat - yCurr;
vec2 dW = (1. / m) * xCurr * dZ;
float dB = (1. / m) * dZ;
wouti[idx] = dW.x;
woutj[idx] = dW.y;
bout[idx] = dB;
lout[idx] = calculateLoss(yHat, yCurr);
}
)";

View file

@ -5,10 +5,10 @@
#include "core/class_db.h"
#include "KomputeModelMLNode.h"
void register_kompute_summator_types() {
void register_kompute_model_ml_types() {
ClassDB::register_class<KomputeModelMLNode>();
}
void unregister_kompute_summator_types() {
void unregister_kompute_model_ml_types() {
// Nothing to do here in this example.
}

View file

@ -1,4 +1,4 @@
/* summator.cpp */
#pragma once
#include <vector>
#include <string>
@ -15,8 +15,8 @@ KomputeModelML::KomputeModelML() {
void KomputeModelML::train(Array yArr, Array xIArr, Array xJArr) {
assert(y.size() == xI.size());
assert(xI.size() == xJ.size());
assert(yArr.size() == xIArr.size());
assert(xIArr.size() == xJArr.size());
std::vector<float> yData;
std::vector<float> xIData;

View file

@ -5,4 +5,4 @@
[node name="Parent" type="Node2D"]
script = ExtResource( 1 )
[node name="CustomKomputeNode" type="KomputeSummatorNode" parent="."]
[node name="EditorKomputeModelMLNode" type="KomputeModelMLNode" parent="."]

View file

@ -2,27 +2,27 @@ extends Node2D
# Called when the node enters the scene tree for the first time.
func _ready():
print("hello")
var xi = [0, 1, 1, 1, 1, 1]
var xj = [0, 0, 0, 0, 1, 1]
var y = [0, 0, 0, 0, 1, 1]
# Use existing node
print($CustomKomputeNode.get_total())
print("Running training and predict on existing node")
$CustomKomputeNode.add(10)
print($CustomKomputeNode.get_total())
$EditorKomputeModelMLNode.train(y, xi, xj)
$CustomKomputeNode.add(10)
print($CustomKomputeNode.get_total())
var preds = $EditorKomputeModelMLNode.predict(xi, xj)
print(preds)
print("Running training and predict on new instance")
# Create new instance
var s = KomputeSummatorNode.new()
var s = KomputeModelMLNode.new()
# This will print 0 as it's a new instance
print(s.get_total())
s.train(y, xi, xj)
print("")
# Now we can again send further commands
s.add(10)
print(s.get_total())
preds = s.predict(xi, xj)
s.add(10)
print(s.get_total())
print(preds)