// Matrix Construct // // Copyright (C) Matrix Construct Developers, Authors & Contributors // Copyright (C) 2016-2021 Jason Volk // // Permission to use, copy, modify, and/or distribute this software for any // purpose with or without fee is hereby granted, provided that the above // copyright notice and this permission notice is present in all copies. The // full license for this software is available in the LICENSE file. #pragma once #define HAVE_IRCD_GPT_OPTS_H /// Task Options Page /// /// The option block is directly shared with task software as constant data. /// This stucture and its mutable companion in `task.h` determine the outcome /// of the next execution cycle; options are immutable to device software but /// may be changed by the host between executions cycles if desired. /// struct ircd_gpt_opts { #ifdef __cplusplus ircd_gpt_opts(const ircd::gpt::model::decoder * = nullptr) noexcept; #endif /// Reference to the model (currently not available in device software). #ifndef __cplusplus const void *model; #else const ircd::gpt::model::decoder *model; #endif /// Seed for the task's PRNG. ulong seed; /// Limit number of output tokens. Default of -1 is unlimited; the number /// of tokens generated will be limited by other factors. uint limit; /// Flip random coins over the top k logits each round. Setting to 1 /// deterministically selects the top logit. uint top_k; /// Flip a random coin between 0 and top_p ( = 90 = 0.9) for logit select. uint top_p; /// Registers the top n result logits in the ctrl block each cycle. uint top_n; /// Number of target labels to register results for in the ctrl block. uint labels; /// Bitbar toggling various debug modes uint debug; /// Specifies the token context size in tokens. uint context_tokens; /// Specifies the token buffer size in tokens. uint buffer_tokens; /// Decoding layers. uint layers; /// SIMD lane count. uint lanes; /// Embedding vector elements uint embed_elems; /// Cross-attention dimension uint attn_rank; /// Attention unit fcon width multiple uint attn_mult; /// (computed) MLP unit fcon width multiple uint ffnn_mult; /// (computed) attention unit width multiple uint attn_elems; /// FFNN unit width multiple uint ffnn_elems; /// SIMD lane count uint lanes; /// (computed) `embed_elems` / `lanes` uint embed_width; /// (computed) Attention unit X dimension uint attn_width; /// (computed) Attention unit Y dimension uint attn_height; /// (computed) MLP backend X dimension uint ffnn_width; /// (computed) MLP backend Y dimension uint ffnn_height; /// Number of possible target n-grams. uint logits; /// Training steps uint training_steps; /// Validation steps uint validation_steps; /// Testing steps uint testing_steps; /// Learning rate float alpha; /// Decay rate float beta[2]; /// Denorm smoothing float epsilon; } __attribute__((aligned(4096))); #ifdef __cplusplus namespace ircd::gpt { using opts = ::ircd_gpt_opts; } static_assert(sizeof(struct ircd_gpt_opts) == 4096); static_assert(std::is_standard_layout::value); #endif