construct/include/ircd/gpt/pipe/model.h

// Matrix Construct
//
// Copyright (C) Matrix Construct Developers, Authors & Contributors
// Copyright (C) 2016-2021 Jason Volk <jason@zemos.net>
//
// Permission to use, copy, modify, and/or distribute this software for any
// purpose with or without fee is hereby granted, provided that the above
// copyright notice and this permission notice is present in all copies. The
// full license for this software is available in the LICENSE file.

#pragma once
#define HAVE_IRCD_GPT_PIPE_MODEL_H

// Root of the pipe model. Aggregates the two top-level components -- the
// decoder and the language embedding -- each held through a unique_ptr.
// All nested component types are forward-declared here.
struct ircd::gpt::pipe::model
{
	// Nested component types.
	struct matrix;
	struct tensor;
	struct norm;
	struct proj;
	struct fcon;
	struct attn;
	struct ffnn;
	struct block;
	struct decoder;
	struct language;

	// Uniquely-owned decoder component.
	std::unique_ptr<model::decoder> decode;

	// Uniquely-owned language (embedding) component.
	std::unique_ptr<model::language> embed;

	// Invalidation flag; cleared on construction.
	// NOTE(review): presumably raised to request that the device copy be
	// resynchronized -- confirm against the code which writes it.
	bool invalid = false;

	// Construct from a gpt::model decoder and embedding. Two overloads are
	// offered: one taking read-only sources, one taking mutable sources.
	model(const gpt::model::decoder &, const gpt::model::embed &);
	model(gpt::model::decoder &, gpt::model::embed &);

	// Declared only; the definition lives out of line.
	~model() noexcept;
};

// A single parameter matrix: the weights together with two adaptive moment
// estimation buffers, all represented as cl::data.
struct ircd::gpt::pipe::model::matrix
{
	// Weights
	cl::data param;

	// Adaptive moment estimations
	cl::data moment[2];

	// Construct over a read-only or a mutable view of the parameter data.
	// NOTE(review): the leading cl::data pointer and off_t look like a parent
	// buffer and an offset into it -- confirm in the definitions.
	matrix(cl::data *, const off_t, const const_buffer &param);
	matrix(cl::data *, const off_t, const mutable_buffer &param);
};

// A bias/weight pair, each stored as a model::matrix. The bias is declared
// (and therefore initialized) ahead of the weight.
struct ircd::gpt::pipe::model::tensor
{
	// Bias component.
	matrix bias;

	// Weight component.
	matrix weight;

	// Construct from read-only or mutable views of the bias and the weight.
	// NOTE(review): the leading cl::data pointer and off_t look like a parent
	// buffer and an offset into it -- confirm in the definitions.
	tensor(cl::data *, const off_t, const const_buffer &bias, const const_buffer &weight);
	tensor(cl::data *, const off_t, const mutable_buffer &bias, const mutable_buffer &weight);
};

// Attention unit of a layer: three tensors (norm, fcon, proj) followed by a
// mask buffer. Built from a gpt::model::norm and a gpt::model::attn.
struct ircd::gpt::pipe::model::attn
{
	// Tensors of the unit, in declaration (initialization) order.
	tensor norm;
	tensor fcon;
	tensor proj;

	// Mask data.
	// NOTE(review): presumably the attention mask -- confirm in the definition.
	cl::data mask;

	// Construct from read-only or mutable source parameters.
	// NOTE(review): the leading cl::data pointer and off_t look like a parent
	// buffer and an offset into it -- confirm in the definitions.
	attn(cl::data *, const off_t, const gpt::model::norm &, const gpt::model::attn &);
	attn(cl::data *, const off_t, gpt::model::norm &, gpt::model::attn &);
};

// Feed-forward unit of a layer: three tensors (norm, fcon, proj). Built from
// a gpt::model::norm and a gpt::model::ffnn.
struct ircd::gpt::pipe::model::ffnn
{
	// Tensors of the unit, in declaration (initialization) order.
	tensor norm;
	tensor fcon;
	tensor proj;

	// Construct from read-only or mutable source parameters.
	// NOTE(review): the leading cl::data pointer and off_t look like a parent
	// buffer and an offset into it -- confirm in the definitions.
	ffnn(cl::data *, const off_t, const gpt::model::norm &, const gpt::model::ffnn &);
	ffnn(cl::data *, const off_t, gpt::model::norm &, gpt::model::ffnn &);
};

// One layer of the model: its own memory roots followed by the attention and
// feed-forward units.
struct ircd::gpt::pipe::model::block
{
	// Single layer memory roots
	// NOTE(review): three roots presumably line up with a matrix's param and
	// its two moment buffers -- confirm in the definitions.
	cl::data master[3];

	// Layer units
	model::attn attn;
	model::ffnn ffnn;

	// Overloads taking a cl::data pointer and an off_t ahead of the source
	// block and a size_t.
	// NOTE(review): these look like a parent buffer, an offset into it, and a
	// layer index -- confirm in the definitions.
	block(cl::data *, const off_t, const gpt::model::block &, const size_t);
	block(cl::data *, const off_t, gpt::model::block &, const size_t);

	// Overloads taking only the source block and a size_t.
	block(const gpt::model::block &, const size_t);
	block(gpt::model::block &, const size_t);
};

// Language (embedding) component: its memory roots followed by the `pos` and
// `token` matrices. Built from a gpt::model::embed.
struct ircd::gpt::pipe::model::language
{
	// Memory roots for this component.
	// NOTE(review): three roots presumably line up with a matrix's param and
	// its two moment buffers -- confirm in the definitions.
	cl::data master[3];

	// NOTE(review): presumably the positional embedding -- confirm.
	matrix pos;

	// NOTE(review): presumably the token embedding -- confirm.
	matrix token;

	// Overloads taking a cl::data pointer and an off_t ahead of the source.
	// NOTE(review): these look like a parent buffer and an offset into it --
	// confirm in the definitions.
	language(cl::data *, const off_t, const gpt::model::embed &);
	language(cl::data *, const off_t, gpt::model::embed &);

	// Overloads taking only the source embedding.
	language(const gpt::model::embed &);
	language(gpt::model::embed &);

	// Declared only; the definition lives out of line.
	~language() noexcept;
};

// Decoder component: memory roots shared across the layers, a fixed array of
// twelve layer blocks, and the final norm tensor. Built from a
// gpt::model::decoder.
struct ircd::gpt::pipe::model::decoder
{
	// Combined-layer memory roots
	cl::data master[3];

	// Layer blocks
	model::block block[12];

	// Final norm
	tensor norm;

	// Construct from a read-only or a mutable source decoder.
	decoder(const gpt::model::decoder &);
	decoder(gpt::model::decoder &);

	// Declared only; the definition lives out of line.
	~decoder() noexcept;
};
ircd::gpt: Transformer Pipe. 2021-03-30 03:22:42 +02:00			`// Matrix Construct`
			`//`
			`// Copyright (C) Matrix Construct Developers, Authors & Contributors`
			`// Copyright (C) 2016-2021 Jason Volk <jason@zemos.net>`
			`//`
			`// Permission to use, copy, modify, and/or distribute this software for any`
			`// purpose with or without fee is hereby granted, provided that the above`
			`// copyright notice and this permission notice is present in all copies. The`
			`// full license for this software is available in the LICENSE file.`

			`#pragma once`
			`#define HAVE_IRCD_GPT_PIPE_MODEL_H`

			`struct ircd::gpt::pipe::model`
			`{`
ircd::gpt: Add adaptive moment state to pipe model; move task prelim defs. 2021-04-17 20:53:50 +02:00			`struct matrix;`
ircd::gpt: Transformer Pipe. 2021-03-30 03:22:42 +02:00			`struct tensor;`
			`struct norm;`
			`struct proj;`
			`struct fcon;`
			`struct attn;`
			`struct ffnn;`
			`struct block;`
			`struct decoder;`
			`struct language;`

			`std::unique_ptr<model::decoder> decode;`
			`std::unique_ptr<model::language> embed;`
ircd::gpt::pipe: Add model invalidation for device resynchronization. 2021-04-22 21:11:25 +02:00			`bool invalid {false};`
ircd::gpt: Transformer Pipe. 2021-03-30 03:22:42 +02:00
			`model(const gpt::model::decoder &, const gpt::model::embed &);`
ircd::gpt: Add adaptive moment state to pipe model; move task prelim defs. 2021-04-17 20:53:50 +02:00			`model(gpt::model::decoder &, gpt::model::embed &);`
ircd::gpt: Transformer Pipe. 2021-03-30 03:22:42 +02:00			`~model() noexcept;`
			`};`

ircd::gpt: Add adaptive moment state to pipe model; move task prelim defs. 2021-04-17 20:53:50 +02:00			`struct ircd::gpt::pipe::model::matrix`
			`{`
			`cl::data`
			`param, // Weights`
			`moment[2]; // Adaptive moment estimations`

			`matrix(cl::data *, const off_t, const const_buffer &param);`
			`matrix(cl::data *, const off_t, const mutable_buffer &param);`
			`};`

ircd::gpt: Transformer Pipe. 2021-03-30 03:22:42 +02:00			`struct ircd::gpt::pipe::model::tensor`
			`{`
ircd::gpt: Add adaptive moment state to pipe model; move task prelim defs. 2021-04-17 20:53:50 +02:00			`matrix`
			`bias,`
			`weight;`
ircd::gpt: Transformer Pipe. 2021-03-30 03:22:42 +02:00
ircd::gpt: Add adaptive moment state to pipe model; move task prelim defs. 2021-04-17 20:53:50 +02:00			`tensor(cl::data *, const off_t, const const_buffer &bias, const const_buffer &weight);`
			`tensor(cl::data *, const off_t, const mutable_buffer &bias, const mutable_buffer &weight);`
ircd::gpt: Transformer Pipe. 2021-03-30 03:22:42 +02:00			`};`

			`struct ircd::gpt::pipe::model::attn`
			`{`
ircd::gpt: Add adaptive moment state to pipe model; move task prelim defs. 2021-04-17 20:53:50 +02:00			`tensor`
			`norm,`
			`fcon,`
			`proj;`

			`cl::data`
			`mask;`
ircd::gpt: Transformer Pipe. 2021-03-30 03:22:42 +02:00
ircd::gpt: Add adaptive moment state to pipe model; move task prelim defs. 2021-04-17 20:53:50 +02:00			`attn(cl::data *, const off_t, const gpt::model::norm &, const gpt::model::attn &);`
			`attn(cl::data *, const off_t, gpt::model::norm &, gpt::model::attn &);`
ircd::gpt: Transformer Pipe. 2021-03-30 03:22:42 +02:00			`};`

			`struct ircd::gpt::pipe::model::ffnn`
			`{`
ircd::gpt: Add adaptive moment state to pipe model; move task prelim defs. 2021-04-17 20:53:50 +02:00			`tensor`
			`norm,`
			`fcon,`
			`proj;`
ircd::gpt: Transformer Pipe. 2021-03-30 03:22:42 +02:00
ircd::gpt: Add adaptive moment state to pipe model; move task prelim defs. 2021-04-17 20:53:50 +02:00			`ffnn(cl::data *, const off_t, const gpt::model::norm &, const gpt::model::ffnn &);`
			`ffnn(cl::data *, const off_t, gpt::model::norm &, gpt::model::ffnn &);`
ircd::gpt: Transformer Pipe. 2021-03-30 03:22:42 +02:00			`};`

			`struct ircd::gpt::pipe::model::block`
			`{`
ircd::gpt: Add adaptive moment state to pipe model; move task prelim defs. 2021-04-17 20:53:50 +02:00			`// Single layer memory roots`
			`cl::data`
			`master[3];`

			`// Layer units`
ircd::gpt: Transformer Pipe. 2021-03-30 03:22:42 +02:00			`model::attn attn;`
			`model::ffnn ffnn;`

ircd::gpt: Add adaptive moment state to pipe model; move task prelim defs. 2021-04-17 20:53:50 +02:00			`block(cl::data *, const off_t, const gpt::model::block &, const size_t);`
			`block(cl::data *, const off_t, gpt::model::block &, const size_t);`
ircd::gpt: Transformer Pipe. 2021-03-30 03:22:42 +02:00			`block(const gpt::model::block &, const size_t);`
ircd::gpt: Add adaptive moment state to pipe model; move task prelim defs. 2021-04-17 20:53:50 +02:00			`block(gpt::model::block &, const size_t);`
ircd::gpt: Transformer Pipe. 2021-03-30 03:22:42 +02:00			`};`

ircd::gpt::pipe::model: Additional sub-buffering for lmhead. 2021-04-22 21:10:22 +02:00			`struct ircd::gpt::pipe::model::language`
			`{`
			`cl::data`
			`master[3];`

			`matrix`
			`pos,`
			`token;`

			`language(cl::data *, const off_t, const gpt::model::embed &);`
			`language(cl::data *, const off_t, gpt::model::embed &);`
			`language(const gpt::model::embed &);`
			`language( gpt::model::embed &);`
			`~language() noexcept;`
			`};`

ircd::gpt: Transformer Pipe. 2021-03-30 03:22:42 +02:00			`struct ircd::gpt::pipe::model::decoder`
			`{`
ircd::gpt: Add adaptive moment state to pipe model; move task prelim defs. 2021-04-17 20:53:50 +02:00			`// Combined-layer memory roots`
			`cl::data`
			`master[3];`

			`// Layer blocks`
			`model::block`
			`block[12];`

			`// Final norm`
ircd::gpt: Transformer Pipe. 2021-03-30 03:22:42 +02:00			`tensor norm;`

			`decoder(const gpt::model::decoder &);`
ircd::gpt: Add adaptive moment state to pipe model; move task prelim defs. 2021-04-17 20:53:50 +02:00			`decoder(gpt::model::decoder &);`
ircd::gpt: Transformer Pipe. 2021-03-30 03:22:42 +02:00			`~decoder() noexcept;`
			`};`