cpp/html/model_8cpp_source.html

 /*

     Beatmup image and signal processing library

     Copyright (C) 2020, lnstadrum


     This program is free software: you can redistribute it and/or modify

     it under the terms of the GNU General Public License as published by

     the Free Software Foundation, either version 3 of the License, or

     (at your option) any later version.


     This program is distributed in the hope that it will be useful,

     but WITHOUT ANY WARRANTY; without even the implied warranty of

     MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

     GNU General Public License for more details.


     You should have received a copy of the GNU General Public License

     along with this program.  If not, see <http://www.gnu.org/licenses/>.

 */


 #include "model.h"

 #include "../utils/bitset.h"

 #include <sstream>


 using namespace Beatmup;

 using namespace NNets;


 /**
     Builds a model out of a list of operations and chains them in a feedforward fashion:
     every operation gets connected to the one standing right before it in the list.
     \param context   a context instance passed to the underlying ProgramBank
     \param ops       the operations, in their execution order
 */
 Model::Model(Context& context, std::initializer_list<AbstractOperation*> ops):
     ProgramBank(context),
     profiler(nullptr),
     ops(ops.begin(), ops.end()),
     ready(false)
 {
     // link every operation to its predecessor
     const size_t count = this->ops.size();
     for (size_t next = 1; next < count; ++next) {
         AbstractOperation& source = *this->ops[next - 1];
         AbstractOperation& destination = *this->ops[next];
         addConnection(source, destination);
     }
 }


 // Creates a model without operations by delegating to the list-based constructor with an empty list.
 Model::Model(Context& context): Model(context, {}) {}


 /**
     Disconnects all the operations of the model, then releases the memory allocated by the model.
 */
 Model::~Model() {
     for (size_t i = 0; i < ops.size(); ++i)
         ops[i]->disconnect();
     freeMemory();
 }


 /**
     Adds a new operation to the end of the model.
     \param newOp     the operation to add
     \param connect   if `true`, output #0 of the operation that was last in the model is connected to input #0
                      of the new operation. If the model is empty, there is no operation to connect to and no
                      connection is made.
     Throws RuntimeError if the operation is already in the model, or if the model contains another operation
     having the same name.
 */
 void Model::append(AbstractOperation* newOp, bool connect) {
     for (auto op : ops) {
         if (op == newOp)
             throw RuntimeError("Cannot add operation " + newOp->getName() + " to the model: already added");
         if (op->getName() == newOp->getName())
             throw RuntimeError("Cannot add operation " + newOp->getName() + " to the model: an operation with the same name exists in the model");
     }
     ops.push_back(newOp);

     // Connect to the preceding operation only if there is one: for the very first operation
     // `ops.size() - 2` would wrap around and index the vector out of bounds.
     if (connect && ops.size() >= 2)
         addConnection(*ops[ops.size() - 2], *ops.back(), 0, 0, 0);

     // the model needs to be prepared again
     ready = false;
 }


 /**
     Adds several operations to the end of the model, one after another in the list order.
     \param newOps    the operations to add
     \param connect   passed as is to the single-operation append() for every entry of the list
 */
 void Model::append(std::initializer_list<AbstractOperation*> newOps, bool connect) {
     for (auto entry = newOps.begin(); entry != newOps.end(); ++entry)
         append(*entry, connect);
 }


 void Model::addOperation(const std::string& opName, AbstractOperation* newOp) {

     auto it = std::find_if(ops.begin(), ops.end(), [&opName](AbstractOperation* op){ return op->getName() == opName; });

     if (it == ops.end())

         throw InvalidArgument("Cannot find operation " + opName);

     ops.insert(it, newOp);

 }


 void Model::addOperation(const AbstractOperation& op, AbstractOperation* newOp) {

     auto it = std::find(ops.begin(), ops.end(), &op);

     if (it == ops.end())

         throw InvalidArgument("Operation " + op.getName() + " is not in the model");

     ops.insert(it, newOp);

 }


 /**
     Connects two operations of the model referred to by their names.
     The source operation is looked up first, then the destination one; the connection itself is
     established by the operation-based addConnection() overload.
     \param sourceOpName  name of the operation emitting the data
     \param destOpName    name of the operation receiving the data
     \param output        output number of the source operation
     \param input         input number of the destination operation
     \param shuffle       shuffling step
 */
 void Model::addConnection(const std::string& sourceOpName, const std::string& destOpName, int output, int input, int shuffle) {
     auto& from = getOperation(sourceOpName);
     auto& to = getOperation(destOpName);
     addConnection(from, to, output, input, shuffle);
 }


 /**
     Registers a connection from an output of one operation to an input of another one.
     The model is marked as not ready, so that the next prepare() call processes the new connection.
     \param source    the operation emitting the data
     \param dest      the operation receiving the data
     \param output    output number of the source operation
     \param input     input number of the destination operation
     \param shuffle   shuffling step
     Throws RuntimeError if the source has no such output or the destination has no such input.
 */
 void Model::addConnection(AbstractOperation& source, AbstractOperation& dest, int output, int input, int shuffle) {
     // validate the output number against the source operation
     const bool outputExists = 0 <= output && output < source.getOutputCount();
     RuntimeError::check(outputExists,
         "Operation " + source.getName() + " does not have output #" + std::to_string(output));

     // validate the input number against the destination operation
     const bool inputExists = 0 <= input && input < dest.getInputCount();
     RuntimeError::check(inputExists,
         "Operation " + dest.getName() + " does not have input #" + std::to_string(input));

     const Connection link{ &dest, output, input, shuffle };
     connections.emplace(&source, link);
     ready = false;
 }


 void Model::addOutput(const std::string& opName, int output) {

     auto op = (*this)[opName];

     auto outputs = userOutputs.equal_range(op);

     for (auto i = outputs.first; i != outputs.second; ++i)

         if (i->second.index == output)

             // already added

             return;

     userOutputs.emplace(op, UserOutput{ output });

     ready = false;

 }


 /**
     Marks an output of an operation as a user output.
     If the same output has been added before, nothing changes. Otherwise a new user output entry is
     stored and the model is marked as not ready.
     \param operation     the operation
     \param output        output number of the operation
     Throws RuntimeError if the operation is not in the model.
 */
 void Model::addOutput(const AbstractOperation& operation, int output) {
     RuntimeError::check(isOperationInModel(operation), "Operation " + operation.getName() + " is not in the model");

     // nothing to do if this very output is already registered
     const auto known = userOutputs.equal_range(&operation);
     auto entry = known.first;
     while (entry != known.second) {
         if (entry->second.index == output)
             return;
         ++entry;
     }

     userOutputs.emplace(&operation, UserOutput{ output });
     ready = false;
 }


 const float* Model::getOutputData(size_t& numSamples, const std::string& operation, int output) const {

     return getOutputData(numSamples, *(*this)[operation], output);

 }


 /**
     Gives access to the data stored for a user output of an operation.
     \param numSamples    receives the number of stored samples, or zero if the output is not a user output
     \param operation     the operation
     \param output        output number of the operation
     \return pointer to the stored samples, or `nullptr` if the given output is not among the user outputs.
 */
 const float* Model::getOutputData(size_t& numSamples, const AbstractOperation& operation, int output) const {
     const auto candidates = userOutputs.equal_range(&operation);
     for (auto entry = candidates.first; entry != candidates.second; ++entry) {
         const auto& userOutput = entry->second;
         if (userOutput.index != output)
             continue;
         numSamples = userOutput.data.size();
         return userOutput.data.data();
     }

     // no such user output
     numSamples = 0;
     return nullptr;
 }


 /**
     Prepares the model: binds storages, vectors and textures to operation inputs and outputs according
     to the connections, and prepares every operation.
     Returns immediately if the model is ready. Otherwise all the previously allocated memory is freed and
     the operations are processed in their execution order:
      - for every output, the maximum input padding over its connections is found;
      - for every connection, a storage, a vector or a texture is bound to both sides, depending on what
        the source output and the destination input accept. A storage no operation refers to anymore is
        recycled when its size, padding and reserved depth fit;
      - user outputs that are not connected to anything get their own storage or vector;
      - the operation itself is prepared, and its references to input storages are dropped.
     \param gpu       a graphic pipeline instance
     \param data      a chunk collection passed to the operations being prepared; it is opened before the
                      operations are processed and closed afterwards
     Throws RuntimeError if a connection cannot be established because of a storage type mismatch, and
     InvalidArgument if a user output refers to an operation output that does not exist.
 */
 void Model::prepare(GraphicPipeline& gpu,  ChunkCollection& data) {
     if (ready)
         return;
     freeMemory();

     // Contains ops that use a specific storage as input, meaning that it cannot be reused elsewhere.
     // If no ops refer to a storage, it can be recycled.
     std::map<Storage*, std::vector<AbstractOperation*>> refs;

     // find input depth capping
     // If too many channels are sampled by an op having multiple inputs, its input storages will have reserved channels.
     const int sampledChannelsLimit = 4 * gpu.getLimit(GraphicPipeline::Limit::TEXTURE_IMAGE_UNITS);
     std::map<AbstractOperation*, int> sampledChannels;   // op => number of sampled channels
     for (const auto& conn : connections) {
         auto* op = conn.second.dest;
         // get the number of sampled channels
         int min, max;
         op->getSampledChannels(conn.second.input, min, max);
         // cap the maximum: a storage will not have more channels than the limit anyway
         max = std::min(max, sampledChannelsLimit);
         // add to input channels
         sampledChannels[op] += max;
     }

     // loop through connected ops
     data.open();
     preparingProgress.reset(ops.size());
     for (auto src : ops) {
         std::vector<Beatmup::Object*> outputs(src->getOutputCount(), nullptr);  // src output index => storage/vector bound to the output
         std::vector<int> paddings(src->getOutputCount(), 0);    // src output index => max padding over all connections
         Bitset connectedOutputs(src->getOutputCount(), false);

         // loop over connections to find max paddings per output
         auto srcConnections = this->connections.equal_range(src);
         for (auto i = srcConnections.first; i != srcConnections.second; ++i) {
             const auto& conn = i->second;
             paddings[conn.output] = std::max(paddings[conn.output], conn.dest->getInputPadding(conn.input));
         }

         // loop over connections
         for (auto i = srcConnections.first; i != srcConnections.second; ++i) {
             const auto& conn = i->second;
             auto* dst = conn.dest;
             connectedOutputs.set(conn.output);

             // To avoid output type mismatch when connecting second time
             if (outputs[conn.output])
                 RuntimeError::check(src->acceptsStorageOutput(conn.output) ^ src->acceptsVectorOutput(conn.output) ^ src->acceptsTextureOutput(conn.output),
                     "Operation output accepting different types can only have a single connection");

             // if a regular Storage is accepted by both source and destination
             if (src->acceptsStorageOutput(conn.output) && dst->acceptsStorageInput(conn.input)) {
                 const Size size = src->getOutputSize(conn.output);
                 Storage* storage = nullptr;

                 // check if the output storage is already allocated
                 if (outputs[conn.output]) {
                     storage = static_cast<Storage*>(outputs[conn.output]);
                     refs[storage].push_back(dst);
                 }

                 else {
                     // decide on reserved depth (if capping)
                     int depthCapping = 0;
                     if (sampledChannels[dst] > sampledChannelsLimit) {
                         // the op exceeds the limit
                         int min, max;
                         dst->getSampledChannels(conn.input, min, max);
                         const int cappingMargin = std::min(sampledChannelsLimit, size[2]) - min;    // this is how much we can cap at the current input
                         if (cappingMargin > 0) {
                             depthCapping = std::min(cappingMargin, sampledChannels[dst] - sampledChannelsLimit);
                             // reduce the excess
                             sampledChannels[dst] -= depthCapping;
                         }
                     }

                     // try to recycle an existing storage first
                     for (auto& i : refs) {
                         auto candidate = i.first;
                         auto& users = i.second;
                         const int reservedDepth = sampledChannelsLimit - 4 * candidate->getNumberOfTextures();
                         // check if (1) size matches, (2) padding is sufficient, (3) reserved depth matches the number of channels to cap or no capping
                         if (candidate->getSize() == size && candidate->getPadding() >= dst->getInputPadding(conn.input) && (reservedDepth == depthCapping || depthCapping == 0)
                             && users.empty())
                         {
                             // found!
                             storage = candidate;
                             users.push_back(dst);
                             break;
                         }
                     }

                     // no matching storage found, allocate a new one
                     if (!storage) {
                         storage = (size[0] == 1 && size[1] == 1) ?
                             // allocate flat storage if the output size is of 1x1 pixels
                             &allocateFlatStorage(gpu, size[2]) :
                             &allocateStorage(gpu,
                                 size,
                                 src->usesGpu(), !src->usesGpu(),
                                 paddings[conn.output],
                                 depthCapping
                             );
                         refs.emplace(storage, std::vector<AbstractOperation*>{ dst });
                     }

                     // mark output as allocated
                     outputs[conn.output] = storage;
                 }

                 // connect
                 src->setOutput(*storage, conn.output);
                 if (conn.shuffle > 0)
                     dst->setInput(Storage::View(*storage, conn.shuffle), conn.input);
                 else
                     dst->setInput(*storage, conn.input);
             }

             // if a Vector is accepted
             else if (src->acceptsVectorOutput(conn.output) && dst->acceptsVectorInput(conn.input)) {
                 RuntimeError::check(conn.shuffle == 0, "Cannot shuffle vector");
                 GL::Vector* vector;

                 // check if the output storage is already allocated
                 if (outputs[conn.output])
                     vector = static_cast<GL::Vector*>(outputs[conn.output]);
                 else {
                     vector = &allocateVector(gpu, src->getOutputSize(conn.output).volume());
                     outputs[conn.output] = vector;
                 }

                 // connect
                 src->setOutput(*vector, conn.output);
                 dst->setInput(*vector, conn.input);
             }

             // if a texture is accepted
             else if (src->acceptsTextureOutput(conn.output) && dst->acceptsTextureInput(conn.input)) {
                 RuntimeError::check(conn.shuffle == 0, "Cannot shuffle texture");
                 InternalBitmap* texture;

                 // check if the output storage is already allocated
                 if (outputs[conn.output])
                     texture = static_cast<InternalBitmap*>(outputs[conn.output]);
                 else
                     outputs[conn.output] = texture = &allocateTexture(gpu, src->getOutputSize(conn.output));

                 // connect
                 src->setOutput(*texture, conn.output);
                 dst->setInput(*texture, conn.input);
             }

             else
                 throw RuntimeError("Cannot connect " + src->getName() + " (output #" + std::to_string(conn.output) + ") "
                     "to " + dst->getName() + " (input #" + std::to_string(conn.input) + "): storage type mismatch");
         }

         // allocate user outputs if not yet
         auto requestedOutputs = this->userOutputs.equal_range(src);
         for (auto i = requestedOutputs.first; i != requestedOutputs.second; ++i) {
             int idx = i->second.index;
             // a negative index is rejected as well: it would address the bitset below out of its range
             if (idx < 0 || idx >= src->getOutputCount())
                 throw InvalidArgument("Operation " + src->getName() + " does not have output #" + std::to_string(idx));
             if (!connectedOutputs[idx]) {
                 if (src->acceptsStorageOutput(idx)) {
                     src->setOutput(allocateStorage(gpu, src->getOutputSize(idx), src->usesGpu(), !src->usesGpu()), idx);
                 }
                 else if (src->acceptsVectorOutput(idx)) {
                     src->setOutput(allocateVector(gpu, src->getOutputSize(idx).volume()), idx);
                 }
             }
         }

         // prepare operation
         src->prepare(gpu, data, *this);

         // remove references to storages used by the current operation. This allows their reuse in other connections.
         for (auto& i : refs) {
             auto& users = i.second;
             for (auto op = users.begin(); op != users.end(); )
                 if (*op == src)
                     // erase() invalidates the iterator passed in: continue from the one it returns
                     op = users.erase(op);
                 else
                     ++op;
         }

         // advance the progress bar
         preparingProgress();
     }

     data.close();
     ready = true;
 }


 /**
     Runs the inference: executes the operations of the model one by one in their order.
     After an operation is executed with a GPU available, the content of its user outputs is copied
     into the corresponding user output buffers. The managing thread additionally drives the attached
     profiler (if any) and the inference progress tracker.
     The function returns early if the task is aborted.
     \param thread    the thread executing the task
     \param gpu       a graphic pipeline instance; may be null, in which case the operations are run
                      without it and the user outputs are not fetched
     Any exception derived from std::exception thrown by an operation is rethrown as InferenceTimeError.
 */
 void Model::execute(TaskThread& thread, GraphicPipeline* gpu) {
     if (gpu)
         gpu->switchMode(GraphicPipeline::Mode::INFERENCE);

     // reset the progress tracker
     inferenceProgress.reset(ops.size());

     // loop through ops
     for (auto op : ops) {
         if (thread.isTaskAborted())
             return;

         // start profiling
         if (thread.isManaging() && profiler)
             (*profiler)(op->getName());

         // run operation
         try {
             if (gpu)
                 op->execute(thread, *gpu);
             else
                 op->execute(thread);
         } catch (const std::exception& ex) {
             throw InferenceTimeError(*op, ex);
         }

         // get user outputs
         auto userOutputs = this->userOutputs.equal_range(op);
         for (auto it = userOutputs.first; it != userOutputs.second; ++it) {
             int idx = it->second.index;
             auto& data = it->second.data;
             if (gpu) {
                 if (op->acceptsStorageOutput(idx)) {
                     // get data pointer from storage
                     auto view = op->getOutput(idx);
                     if (!view.getStorage().isUpToDate(ProcessingTarget::CPU))
                         view.getStorage().pull(*gpu);

                     // copy to the vector
                     Storage::Scanner scan(view);
                     scan.move(0, 0);
                     data.resize(view.getSize().volume());
                     for (auto sample = data.begin(); sample != data.end(); sample += view.getDepth()) {
                         scan.fill(sample, data.end());
                         ++scan;
                     }
                 }
                 else if (op->acceptsVectorOutput(idx)) {
                     GL::Vector* vector;
                     op->getOutput(vector, idx);
                     vector->fetch(*gpu, data);
                 }
             }
         }

         if (thread.isManaging()) {
             // stop profiler
             if (profiler) {
                 // wait till GPU is done; there is nothing to wait for if running without a GPU
                 if (gpu)
                     gpu->flush();
                 profiler->lap();
             }

             // increase inference progress
             inferenceProgress();
         }
     }
 }


 bool Model::isOperationInModel(const AbstractOperation& operation) const {

     for (auto op : ops)

         if (op == &operation)

             return true;

     return false;

 }


 /**
     Destroys all the storages, vectors and textures allocated by the model and empties the
     corresponding lists.
 */
 void Model::freeMemory() {
     // storages
     for (size_t i = 0; i < storages.size(); ++i)
         delete storages[i];
     storages.clear();

     // vectors
     for (size_t i = 0; i < vectors.size(); ++i)
         delete vectors[i];
     vectors.clear();

     // textures
     for (size_t i = 0; i < textures.size(); ++i)
         delete textures[i];
     textures.clear();
 }


 /**
     Creates a new storage and adds it to the list of storages owned by the model.
     \param gpu               a graphic pipeline instance
     \param size              size of the storage
     \param forGpu            if `true`, allocate(gpu) is called on the new storage
     \param forCpu            if `true`, allocate() is called on the new storage
     \param pad               padding passed to the storage constructor
     \param reservedDepth     reserved depth passed to the storage constructor
     \return the new storage.
 */
 Storage& Model::allocateStorage(GraphicPipeline& gpu, const Size size, bool forGpu, bool forCpu, const int pad, const int reservedDepth) {
     Storage* const created = new Storage(context, gpu, size, pad, reservedDepth);
     if (forGpu) {
         created->allocate(gpu);
     }
     if (forCpu) {
         created->allocate();
     }
     storages.push_back(created);
     return *storages.back();
 }


 /**
     Creates a new storage of 1x1 spatial size, allocates it with allocate(gpu) and adds it to the
     list of storages owned by the model.
     \param gpu       a graphic pipeline instance
     \param size      depth of the storage (the third dimension of its size)
     \return the new storage.
 */
 Storage& Model::allocateFlatStorage(GraphicPipeline& gpu, int size) {
     const Size flatSize(1, 1, size);
     Storage* const created = new Storage(context, gpu, flatSize);
     created->allocate(gpu);
     storages.push_back(created);
     return *storages.back();
 }


 /**
     Creates a new vector and adds it to the list of vectors owned by the model.
     The vector format is FIXED16 if BEATMUP_OPENGLVERSION_GLES20 is defined, and FLOAT otherwise.
     \param gpu       a graphic pipeline instance
     \param size      size passed to the vector constructor
     \return the new vector.
 */
 GL::Vector& Model::allocateVector(GraphicPipeline& gpu, const int size) {
 #ifdef BEATMUP_OPENGLVERSION_GLES20
     const GL::Vector::Format format = GL::Vector::Format::FIXED16;
 #else
     const GL::Vector::Format format = GL::Vector::Format::FLOAT;
 #endif
     GL::Vector* const created = new GL::Vector(context, gpu, size, format);
     vectors.push_back(created);
     return *created;
 }


 /**
     Creates a new internal bitmap and adds it to the list of textures owned by the model.
     The pixel format is selected by the depth: SingleByte for 1, TripleByte for 3 and QuadByte for 4.
     \param gpu       a graphic pipeline instance (not used in this function)
     \param size      size of the texture; its width and height become the bitmap dimensions
     \return the new bitmap.
     Throws InvalidArgument if the depth is not 1, 3 or 4.
 */
 InternalBitmap& Model::allocateTexture(GraphicPipeline& gpu, const Size size) {
     const auto depth = size.getDepth();

     // map the depth onto a pixel format
     PixelFormat pixelFormat(PixelFormat::TripleByte);
     if (depth == 1)
         pixelFormat = PixelFormat::SingleByte;
     else if (depth == 3)
         pixelFormat = PixelFormat::TripleByte;
     else if (depth == 4)
         pixelFormat = PixelFormat::QuadByte;
     else
         throw InvalidArgument("Unsupported depth: " + std::to_string(depth));

     InternalBitmap* const created = new InternalBitmap(context, pixelFormat, size.getWidth(), size.getHeight());
     textures.push_back(created);
     return *created;
 }


 /**
     Tells whether an operation stands before another one in the list of operations of the model.
     \param first     the operation expected to go first
     \param second    the operation expected to go after
     \return `true` if `second` is found after the first occurrence of `first` in the list,
             `false` otherwise, including the case when `first` is not in the model.
 */
 bool Model::isPreceding(const AbstractOperation& first, const AbstractOperation& second) const {
     const auto firstPos = std::find(ops.begin(), ops.end(), &first);
     if (firstPos == ops.end())
         return false;
     // look for the second operation only among the ones following the first
     return std::find(firstPos + 1, ops.end(), &second) != ops.end();
 }


 /**
     Finds an operation of the model by its name.
     \param operationName     the name to look for
     \return the first operation in the list having the given name.
     Throws InvalidArgument if there is no such operation.
 */
 AbstractOperation* Model::operator[](const std::string& operationName) {
     const auto found = std::find_if(ops.begin(), ops.end(),
         [&operationName](AbstractOperation* candidate) { return candidate->getName() == operationName; });
     if (found == ops.end())
         throw InvalidArgument("Operation not found: " + operationName);
     return *found;
 }


 /**
     Finds an operation of the model by its name (constant access).
     \param operationName     the name to look for
     \return the first operation in the list having the given name.
     Throws InvalidArgument if there is no such operation.
 */
 const AbstractOperation* Model::operator[](const std::string& operationName) const {
     const auto found = std::find_if(ops.begin(), ops.end(),
         [&operationName](AbstractOperation* candidate) { return candidate->getName() == operationName; });
     if (found == ops.end())
         throw InvalidArgument("Operation not found: " + operationName);
     return *found;
 }


 unsigned long Model::countMultiplyAdds() const {

     unsigned long result = 0;

     for (auto op : ops)

         result += op->countMultiplyAdds();

     return result;

 }


 unsigned long Model::countTexelFetches() const {

     unsigned long result = 0;

     for (auto op : ops)

         result += op->countTexelFetches();

     return result;

 }


 size_t Model::getMemorySize() const {

     size_t size = 0;

     for (auto& entry : storages)

         size += entry->getMemorySize();

     for (auto& entry : vectors)

         size += entry->getMemorySize();

     for (auto& entry : textures)

         size += entry->getMemorySize();

     return size;

 }


 /**
     Builds a listing describing the model: the serialized operations go into the "ops" chapter in
     their execution order, the connections go into the "connections" chapter.
     Output number, input number and shuffling step of a connection are written only when positive.
     If the model has no connections, a single empty block is added to the "connections" chapter.
     \return the listing.
 */
 Listing Model::serialize() const {
     /** \page NNetsConnectionsSerialization  Connections serialization
         Every connection is serialized in a single block in \c connections part.

         Example:
         \code{yaml}
          - from: source operation name
            to: destination operation name
            from_output: 0       # output number of the source operation, defaults to 0
            to_input: 0          # input number of the destination operation, defaults to 0
            shuffle: 1           # shuffling step, defaults to 1
         \endcode
         Shuffling step description is given \ref NNetsShufflingExplained "here".
     */
     Listing result;

     // operations go first
     for (size_t i = 0; i < ops.size(); ++i)
         result.emplace("ops", ops[i]->serialize());

     // no connections: an empty block is put instead
     if (connections.empty()) {
         result.emplace("connections", {});
         return result;
     }

     // one block per connection
     for (const auto& entry : connections) {
         const auto& link = entry.second;
         Listing::Block block;
         block.set("from", entry.first->getName());
         block.set("to", link.dest->getName());
         if (link.output > 0) {
             block.set("from_output", link.output);
         }
         if (link.input > 0) {
             block.set("to_input", link.input);
         }
         if (link.shuffle > 0) {
             block.set("shuffle", link.shuffle);
         }
         result.emplace("connections", std::move(block));
     }

     return result;
 }


 /**
     Serializes the model and prints the resulting listing out into a string.
     \return the string with the printed listing.
 */
 std::string Model::serializeToString() const {
     std::stringstream buffer;
     Listing listing(serialize());
     listing.printOut(buffer);
     return buffer.str();
 }


 // Wraps an exception caught while running an operation: the message passed to the base Exception
 // combines the name of the operation with the what() text of the original exception.
 InferenceTimeError::InferenceTimeError(const AbstractOperation& op, const std::exception& ex):

     Exception("Error in %s: %s", op.getName().c_str(), ex.what())

 {}

Beatmup::Bitset
A set of boolean flags.
Definition: bitset.h:30

Beatmup::Bitset::set
void set(size_t i, bool value=true)
Definition: bitset.h:67

Beatmup::ChunkCollection
A key-value pair set storing pieces of arbitrary data (chunks) under string keys.
Definition: chunkfile.h:36

Beatmup::ChunkCollection::close
virtual void close()=0
Closes the collection after a reading session.

Beatmup::ChunkCollection::open
virtual void open()=0
Opens the collection to read chunks from it.

Beatmup::Context
Basic class: task and memory management, any kind of static data.
Definition: context.h:59

Beatmup::Exception
Base class for all exceptions.
Definition: exception.h:37

Beatmup::GL::ProgramBank::context
Context & context
Definition: program_bank.h:44

Beatmup::GL::Vector
Real-valued vector usable by GPU.
Definition: linear_mapping.h:29

Beatmup::GL::Vector::fetch
void fetch(GraphicPipeline &gpu, std::vector< float > &output) const
Grabs vector values back from GPU to user memory.
Definition: linear_mapping.cpp:489

Beatmup::GL::Vector::Format
Format
Vector data format.
Definition: linear_mapping.h:34

Beatmup::GL::Vector::Format::FIXED16
@ FIXED16
16 bit per element

Beatmup::GL::Vector::Format::FLOAT
@ FLOAT
32 bit per element, floating point

Beatmup::GraphicPipeline
Internal low-level GPU control API.
Definition: pipeline.h:33

Beatmup::GraphicPipeline::switchMode
void switchMode(Mode mode)
Switches GPU mode.
Definition: pipeline.cpp:941

Beatmup::GraphicPipeline::getLimit
int getLimit(Limit limit) const
Definition: pipeline.cpp:936

Beatmup::GraphicPipeline::Mode::INFERENCE
@ INFERENCE
Textures are feature maps computed in fragment shaders.

Beatmup::GraphicPipeline::Limit::TEXTURE_IMAGE_UNITS
@ TEXTURE_IMAGE_UNITS
maximum number of texture units per fragment shader

Beatmup::GraphicPipeline::flush
void flush()
Waits until all operations submitted to GPU are finished.
Definition: pipeline.cpp:931

Beatmup::InternalBitmap
Bitmap whose memory is managed by the Beatmup engine.
Definition: internal_bitmap.h:35

Beatmup::InvalidArgument
Definition: exception.h:70

Beatmup::Listing::Block
Set of key-value pairs.
Definition: listing.h:46

Beatmup::Listing::Block::set
void set(const std::string &key, T value)
Sets a value for a specific key.

Beatmup::Listing
Parser of simple YAML-like listings.
Definition: listing.h:40

Beatmup::Listing::printOut
void printOut(std::ostream &stream)
Prints out the listing to an output stream.
Definition: listing.cpp:184

Beatmup::Listing::emplace
void emplace(const std::string &key, Block &&block)
Adds a block to a chapter.
Definition: listing.cpp:200

Beatmup::NNets::AbstractOperation
Abstract neural net operation (layer).
Definition: operation.h:46

Beatmup::NNets::AbstractOperation::getOutputCount
virtual int getOutputCount() const
Returns number of operation outputs.
Definition: operation.h:135

Beatmup::NNets::AbstractOperation::getInputCount
virtual int getInputCount() const
Returns number of operation inputs.
Definition: operation.h:129

Beatmup::NNets::AbstractOperation::getName
std::string getName() const
Definition: operation.h:242

Beatmup::NNets::InferenceTimeError
Wrapper for exceptions occurring during the model inference.
Definition: model.h:357

Beatmup::NNets::InferenceTimeError::InferenceTimeError
InferenceTimeError(const AbstractOperation &op, const std::exception &ex)
Definition: model.cpp:587

Beatmup::NNets::Model
Neural net model.
Definition: model.h:92

Beatmup::NNets::Model::getMemorySize
size_t getMemorySize() const
Returns the amount of texture memory in bytes currently allocated by the model to run the inference.
Definition: model.cpp:524

Beatmup::NNets::Model::allocateFlatStorage
Storage & allocateFlatStorage(GraphicPipeline &gpu, const int size)
Allocates a new flat storage.
Definition: model.cpp:439

Beatmup::NNets::Model::ready
bool ready
if true, ops are connected to each other and storages are allocated
Definition: model.h:125

Beatmup::NNets::Model::ops
std::vector< AbstractOperation * > ops
model operations
Definition: model.h:122

Beatmup::NNets::Model::freeMemory
void freeMemory()
Frees all allocated storages.
Definition: model.cpp:415

Beatmup::NNets::Model::userOutputs
std::multimap< const AbstractOperation *, UserOutput > userOutputs
operation => user output mapping
Definition: model.h:114

Beatmup::NNets::Model::getOperation
OperationClass & getOperation(const std::string &operationName)
Retrieves an operation by its name.
Definition: model.h:303

Beatmup::NNets::Model::countTexelFetches
unsigned long countTexelFetches() const
Provides an estimation of the total number of texels fetched by all the operations in the model per i...
Definition: model.cpp:516

Beatmup::NNets::Model::allocateStorage
Storage & allocateStorage(GraphicPipeline &gpu, const Size size, bool forGpu=true, bool forCpu=false, const int pad=0, const int reservedChannels=0)
Allocates a new storage.
Definition: model.cpp:428

Beatmup::NNets::Model::inferenceProgress
ProgressTracking inferenceProgress
inference progress
Definition: model.h:124

Beatmup::NNets::Model::profiler
Profiler * profiler
pointer to a Profiler attached to the model
Definition: model.h:119

Beatmup::NNets::Model::addConnection
void addConnection(AbstractOperation &source, AbstractOperation &dest, int output=0, int input=0, int shuffle=0)
Definition: model.cpp:91

Beatmup::NNets::Model::serialize
Listing serialize() const
Returns serialized representation of the model as a Listing.

Beatmup::NNets::Model::preparingProgress
ProgressTracking preparingProgress
model preparation progress
Definition: model.h:123

Beatmup::NNets::Model::addOutput
void addOutput(const std::string &operation, int output=0)
Enables reading output data from the model memory through getOutputData().
Definition: model.cpp:101

Beatmup::NNets::Model::storages
std::vector< Storage * > storages
allocated storages used during the inference
Definition: model.h:116

Beatmup::NNets::Model::isOperationInModel
bool isOperationInModel(const AbstractOperation &operation) const
Checks if a specific operation makes part of the model.
Definition: model.cpp:407

Beatmup::NNets::Model::countMultiplyAdds
unsigned long countMultiplyAdds() const
Provides an estimation of the number of multiply-adds characterizing the model complexity.
Definition: model.cpp:508

Beatmup::NNets::Model::allocateVector
GL::Vector & allocateVector(GraphicPipeline &gpu, const int size)
Allocates a vector that can be used as operation input or output.
Definition: model.cpp:447

Beatmup::NNets::Model::Model
Model(Context &context, std::initializer_list< AbstractOperation * > ops)
Instantiates a model from a list of operations interconnecting them in a feedforward fashion.
Definition: model.cpp:27

Beatmup::NNets::Model::connections
std::multimap< const AbstractOperation *, Connection > connections
source operation => connection descriptor mapping
Definition: model.h:113

Beatmup::NNets::Model::prepare
virtual void prepare(GraphicPipeline &gpu, ChunkCollection &data)
Prepares all operations: reads the model data from chunks and builds GPU programs.
Definition: model.cpp:143

Beatmup::NNets::Model::serializeToString
std::string serializeToString() const
Returns serialized representation of the model as a string.
Definition: model.cpp:579

Beatmup::NNets::Model::operator[]
AbstractOperation * operator[](const std::string &operationName)
Definition: model.cpp:492

Beatmup::NNets::Model::execute
void execute(TaskThread &thread, GraphicPipeline *gpu)
Runs the inference.
Definition: model.cpp:339

Beatmup::NNets::Model::textures
std::vector< InternalBitmap * > textures
allocated images used during the inference
Definition: model.h:118

Beatmup::NNets::Model::addOperation
void addOperation(const std::string &opName, AbstractOperation *newOp)
Adds a new operation to the model before another operation in the execution order.
Definition: model.cpp:68

Beatmup::NNets::Model::isPreceding
bool isPreceding(const AbstractOperation &first, const AbstractOperation &second) const
Checks whether an operation goes before another operation in the model according the ops execution or...
Definition: model.cpp:480

Beatmup::NNets::Model::~Model
~Model()
Definition: model.cpp:40

Beatmup::NNets::Model::vectors
std::vector< GL::Vector * > vectors
allocated vectors used during the inference
Definition: model.h:117

Beatmup::NNets::Model::allocateTexture
InternalBitmap & allocateTexture(GraphicPipeline &gpu, const Size size)
Allocates a texture that can be used as operation input or output.
Definition: model.cpp:460

Beatmup::NNets::Model::append
void append(AbstractOperation *newOp, bool connect=false)
Adds a new operation to the model.
Definition: model.cpp:47

Beatmup::NNets::Model::getOutputData
const float * getOutputData(size_t &numSamples, const std::string &operation, int output=0) const
Reads data from the model memory.
Definition: model.cpp:125

Beatmup::NNets::Size
Operation 3D input/output size.
Definition: storage.h:37

Beatmup::NNets::Storage::Scanner
Scans a storageview in RAM for further computations on CPU.
Definition: storage.h:466

Beatmup::NNets::Storage::Scanner::move
void move(int x, int y)
Sets the pointer to a specific spatial position.
Definition: storage.cpp:663

Beatmup::NNets::Storage::Scanner::fill
void fill(T begin, T limit)
Extracts the content of feature maps at the current position.
Definition: storage.h:508

Beatmup::NNets::Storage::View
Maps a 3D tensor onto a storage.
Definition: storage.h:308

Beatmup::NNets::Storage
3D tensor stored in a set of textures.
Definition: storage.h:126

Beatmup::NNets::Storage::allocate
void allocate(GraphicPipeline &gpu)
Allocates the storage in GPU memory.
Definition: storage.cpp:167

Beatmup::Profiler::lap
void lap()
Definition: profiler.cpp:37

Beatmup::ProgressTracking::reset
void reset(unsigned int max)
Resets the progress to zero.
Definition: progress_tracking.h:38

Beatmup::RuntimeError
Definition: exception.h:61

Beatmup::RuntimeError::check
static void check(const bool condition, const std::string &message)
Definition: exception.h:64

Beatmup::TaskThread
Thread executing tasks.
Definition: parallelism.h:154

Beatmup::TaskThread::isManaging
bool isManaging() const
Definition: parallelism.h:172

Beatmup::TaskThread::isTaskAborted
virtual bool isTaskAborted() const =0
Returns true if the task is asked to stop from outside.

model.h

Beatmup
Definition: basic_types.h:22

Beatmup::PixelFormat
PixelFormat
Definition: abstract_bitmap.h:70

Beatmup::SingleByte
@ SingleByte
single channel of 8 bits per pixel (like grayscale), unsigned integer values
Definition: abstract_bitmap.h:71

Beatmup::QuadByte
@ QuadByte
4 channels of 8 bits per pixel (like RGBA), unsigned integer values
Definition: abstract_bitmap.h:73

Beatmup::TripleByte
@ TripleByte
3 channels of 8 bits per pixel (like RGB), unsigned integer values
Definition: abstract_bitmap.h:72

Beatmup::CPU
@ CPU
Definition: basic_types.h:55

std::to_string
std::string to_string(Beatmup::NNets::ActivationFunction function)

std::min
CustomPoint< numeric > min(const CustomPoint< numeric > &a, const CustomPoint< numeric > &b)
Definition: geometry.h:724

std::max
CustomPoint< numeric > max(const CustomPoint< numeric > &a, const CustomPoint< numeric > &b)
Definition: geometry.h:728

Beatmup::NNets::Model::Connection
Connection descriptor.
Definition: model.h:98

Beatmup::NNets::Model::UserOutput
A user-defined output descriptor.
Definition: model.h:108

format
JNIEnv jobject jint format
Definition: wrapper_audio.cpp:36

pixelFormat
jlong jint jint jint jint pixelFormat
Definition: wrapper_core.cpp:236

end
jlong jint jint end
Definition: wrapper_core.cpp:534

result
Beatmup::IntPoint result
Definition: wrapper_core.cpp:256

size
jlong jobject size
Definition: wrapper_imag.cpp:772

src
return(jlong) new Beatmup jlong jstring src
Definition: wrapper_imag.cpp:1152

op
jlong jint op
Definition: wrapper_imag.cpp:744

opName
JNIEnv jlong jobject jstring opName
Definition: wrapper_nnets.cpp:187