0
0
Fork 0
mirror of https://github.com/matrix-construct/construct synced 2025-01-16 09:36:54 +01:00
construct/include/ircd/gpt/pipe/model.h

121 lines
2.4 KiB
C
Raw Normal View History

2021-03-30 03:22:42 +02:00
// Matrix Construct
//
// Copyright (C) Matrix Construct Developers, Authors & Contributors
// Copyright (C) 2016-2021 Jason Volk <jason@zemos.net>
//
// Permission to use, copy, modify, and/or distribute this software for any
// purpose with or without fee is hereby granted, provided that the above
// copyright notice and this permission notice is present in all copies. The
// full license for this software is available in the LICENSE file.
#pragma once
#define HAVE_IRCD_GPT_PIPE_MODEL_H
struct ircd::gpt::pipe::model
{
struct matrix;
2021-03-30 03:22:42 +02:00
struct tensor;
struct norm;
struct proj;
struct fcon;
struct attn;
struct ffnn;
struct block;
2022-06-20 03:59:29 +02:00
struct embed;
2021-03-30 03:22:42 +02:00
struct decoder;
2022-06-20 03:59:29 +02:00
const gpt::model::decoder *decode_const {nullptr};
gpt::model::decoder *decode_mutable {nullptr};
2021-03-30 03:22:42 +02:00
std::unique_ptr<model::decoder> decode;
2022-06-20 03:59:29 +02:00
model(const gpt::model::decoder &);
model(gpt::model::decoder &);
2021-03-30 03:22:42 +02:00
~model() noexcept;
};
struct ircd::gpt::pipe::model::matrix
{
cl::data
param, // Weights
moment[2]; // Adaptive moment estimations
matrix(cl::data *, const off_t, const const_buffer &param);
matrix(cl::data *, const off_t, const mutable_buffer &param);
};
2021-03-30 03:22:42 +02:00
struct ircd::gpt::pipe::model::tensor
{
matrix
bias,
weight;
2021-03-30 03:22:42 +02:00
2022-06-20 03:59:29 +02:00
tensor(cl::data *, const off_t, const const_buffer &bias, const off_t, const const_buffer &weight);
tensor(cl::data *, const off_t, const mutable_buffer &bias, const off_t, const mutable_buffer &weight);
2021-03-30 03:22:42 +02:00
};
struct ircd::gpt::pipe::model::attn
{
tensor
norm,
fcon,
proj;
2022-06-20 03:59:29 +02:00
attn(cl::data *, const off_t, const gpt::model::attn &);
attn(cl::data *, const off_t, gpt::model::attn &);
2021-03-30 03:22:42 +02:00
};
struct ircd::gpt::pipe::model::ffnn
{
tensor
norm,
fcon,
proj;
2021-03-30 03:22:42 +02:00
2022-06-20 03:59:29 +02:00
ffnn(cl::data *, const off_t, const gpt::model::ffnn &);
ffnn(cl::data *, const off_t, gpt::model::ffnn &);
2021-03-30 03:22:42 +02:00
};
struct ircd::gpt::pipe::model::block
{
2022-06-20 03:59:29 +02:00
model::attn
attn;
2022-06-20 03:59:29 +02:00
model::ffnn
ffnn;
2021-03-30 03:22:42 +02:00
block(cl::data *, const off_t, const gpt::model::block &, const size_t);
block(cl::data *, const off_t, gpt::model::block &, const size_t);
2021-03-30 03:22:42 +02:00
};
2022-06-20 03:59:29 +02:00
struct ircd::gpt::pipe::model::embed
{
2022-06-20 03:59:29 +02:00
tensor
norm;
matrix
pos,
token;
2022-06-20 03:59:29 +02:00
embed(cl::data *, const off_t, const gpt::model::embed &);
embed(cl::data *, const off_t, gpt::model::embed &);
};
2021-03-30 03:22:42 +02:00
struct ircd::gpt::pipe::model::decoder
{
// Combined-layer memory roots
cl::data
master[3];
// Layer blocks
model::block
2022-06-20 03:59:29 +02:00
layer[12];
2022-06-20 03:59:29 +02:00
// Language model head
model::embed
embed;
2021-03-30 03:22:42 +02:00
decoder(const gpt::model::decoder &);
decoder(gpt::model::decoder &);
2021-03-30 03:22:42 +02:00
~decoder() noexcept;
};