ircd::gpt::pipe: Add model invalidation for device resynchronization.

2024-11-25 08:12:37 +01:00 · 2021-04-22 12:11:25 -07:00 · 2021-04-22 12:11:25 -07:00 · 2a3c54afa2
commit 2a3c54afa2
parent bd460a80ce
4 changed files with 28 additions and 2 deletions
--- a/include/ircd/gpt/pipe/exec.h
+++ b/include/ircd/gpt/pipe/exec.h
@ -29,7 +29,9 @@ struct ircd::gpt::pipe::exec

 	const_buffer
 	send_opts,         // Set when sending the options page.
-	send_ctrl;         // Set when sending the control page.
+	send_ctrl,         // Set when sending the control page.
+	send_coil,         // Set when sending the updated model.
+	send_head;         // Set when sending the updated model.

 	mutable_buffer
 	recv_ctrl;         // Set when receiving the control page.
@ -46,6 +48,8 @@ struct ircd::gpt::pipe::exec
 	cl::exec
 	release_opts,      // Release the options page.
 	release_ctrl,      // Release the control page.
+	release_coil,      // Release updates to the model.
+	release_head,      // Release updates to the model.
 	lm_embed,          // Compute token and positional embeddings.
 	coil[12 * 2],      // Pass over all layers.
 	lm_norm,           // Final normalization.
--- a/include/ircd/gpt/pipe/model.h
+++ b/include/ircd/gpt/pipe/model.h
@ -26,6 +26,7 @@ struct ircd::gpt::pipe::model

 	std::unique_ptr<model::decoder> decode;
 	std::unique_ptr<model::language> embed;
+	bool invalid {false};

 	model(const gpt::model::decoder &, const gpt::model::embed &);
 	model(gpt::model::decoder &, gpt::model::embed &);
--- a/ircd/gpt_model.cc
+++ b/ircd/gpt_model.cc
@ -161,7 +161,7 @@ ircd::gpt::model::init_from_cache(const string_view &cache_path)

 	const fs::fd fd
 	{
-		cache_path, std::ios::in | std::ios::out
+		cache_path, std::ios::in //| std::ios::out
 	};

 	fs::map::opts map_opts
@ -171,6 +171,7 @@ ircd::gpt::model::init_from_cache(const string_view &cache_path)

 	map_opts.huge2mb = true;
 	map_opts.locked = false;
+	map_opts.shared = false;
 	default_model_shm = fs::map
 	{
 		fd, map_opts, sizeof(decoder)
--- a/ircd/gpt_pipe.cc
+++ b/ircd/gpt_pipe.cc
@ -260,6 +260,16 @@ ircd::gpt::pipe::exec::exec(task &task,
 	reinterpret_cast<const char *>(task.ctrl),
 	release? sizeof(struct ircd_gpt_task): 0
 }
+,send_coil
+{
+	reinterpret_cast<const char *>(gpt::model::default_model),
+	release && desc->model->invalid? (sizeof(gpt::model::block) * 12 + sizeof(gpt::model::norm)): 0
+}
+,send_head
+{
+	reinterpret_cast<const char *>(&gpt::model::default_model->word),
+	release && desc->model->invalid? sizeof(gpt::model::embed): 0
+}
 ,recv_ctrl
 {
 	reinterpret_cast<char *>(task.ctrl),
@ -309,6 +319,14 @@ ircd::gpt::pipe::exec::exec(task &task,
 {
 	desc->ctrl, send_ctrl
 }
+,release_coil
+{
+	desc->model->decode->master[0], send_coil
+}
+,release_head
+{
+	desc->model->embed->master[0], send_head
+}
 ,lm_embed
 {
 	desc->lm_embed, range_lm_embed, anode_opts
@ -361,6 +379,8 @@ ircd::gpt::pipe::exec::exec(task &task,
 	desc->ctrl, recv_ctrl
 }
 {
+	if(release && desc->model->invalid)
+		desc->model->invalid = false;
 }

 ircd::gpt::pipe::exec::~exec()