2021-04-02 12:51:59 -07:00
|
|
|
// Matrix Construct
|
|
|
|
//
|
|
|
|
// Copyright (C) Matrix Construct Developers, Authors & Contributors
|
|
|
|
// Copyright (C) 2016-2021 Jason Volk <jason@zemos.net>
|
|
|
|
//
|
|
|
|
// Permission to use, copy, modify, and/or distribute this software for any
|
|
|
|
// purpose with or without fee is hereby granted, provided that the above
|
|
|
|
// copyright notice and this permission notice is present in all copies. The
|
|
|
|
// full license for this software is available in the LICENSE file.
|
|
|
|
|
2021-05-02 14:43:10 -07:00
|
|
|
#pragma once
|
|
|
|
#define HAVE_IRCD_SIMT_MEAN_H
|
|
|
|
|
2021-05-02 14:51:49 -07:00
|
|
|
/// Averaging state; this is for computing running averages
|
|
|
|
/// XXX eventually
|
|
|
|
struct ircd_math_mean
|
|
|
|
{
|
2022-06-19 18:51:50 -07:00
|
|
|
/// Summand spread. TODO XXX
|
|
|
|
float sum[4];
|
|
|
|
|
|
|
|
/// Divisor.
|
|
|
|
uint div;
|
|
|
|
|
|
|
|
/// Last addend.
|
|
|
|
float last;
|
|
|
|
|
|
|
|
/// Computed mean.
|
|
|
|
float mean;
|
2021-05-02 14:51:49 -07:00
|
|
|
};
|
|
|
|
|
2022-10-05 18:46:39 +00:00
|
|
|
#ifdef __OPENCL_VERSION__
|
|
|
|
/// Clear the `ircd_math_mean` state to zero.
|
|
|
|
inline void
|
|
|
|
ircd_simt_math_mean_clear(__local struct ircd_math_mean *const mean)
|
|
|
|
{
|
|
|
|
mean->sum[0] = 0.0f;
|
|
|
|
mean->sum[1] = 0.0f;
|
|
|
|
mean->sum[2] = 0.0f;
|
|
|
|
mean->sum[3] = 0.0f;
|
|
|
|
mean->div = 0;
|
|
|
|
mean->last = 0.0f;
|
|
|
|
mean->mean = 0.0f;
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
|
2021-11-09 15:47:27 -08:00
|
|
|
#ifdef __OPENCL_VERSION__
|
2021-04-02 12:51:59 -07:00
|
|
|
/// Compute average of all elements in the input. The result is broadcast
|
|
|
|
/// to all elements of the output.
|
2021-04-15 10:07:17 -07:00
|
|
|
///
|
|
|
|
/// provide:
|
|
|
|
/// li = local thread id
|
|
|
|
/// ln = local group size
|
|
|
|
///
|
2021-04-02 12:51:59 -07:00
|
|
|
inline void
|
2022-01-07 10:59:31 -08:00
|
|
|
ircd_simt_math_mean_f4lldr(__local float4 *const buf,
|
2021-11-05 19:26:39 -07:00
|
|
|
const uint ln,
|
|
|
|
const uint li)
|
2021-04-02 12:51:59 -07:00
|
|
|
{
|
2022-01-07 10:59:31 -08:00
|
|
|
ircd_simt_reduce_add_f4lldr(buf, ln, li);
|
2021-04-02 12:51:59 -07:00
|
|
|
|
2021-04-15 10:07:17 -07:00
|
|
|
if(li == 0)
|
2022-01-07 10:59:31 -08:00
|
|
|
{
|
|
|
|
const float
|
2022-12-28 02:13:36 +00:00
|
|
|
sum = ircd_simt_hadd_f4(buf[li]),
|
2022-01-23 11:04:23 -08:00
|
|
|
div = ln * 4,
|
|
|
|
res = sum / div;
|
2021-04-02 12:51:59 -07:00
|
|
|
|
2022-01-07 10:59:31 -08:00
|
|
|
buf[li] = res;
|
|
|
|
}
|
|
|
|
|
|
|
|
ircd_simt_broadcast_f4lldr(buf, ln, li);
|
2021-04-02 12:51:59 -07:00
|
|
|
}
|
2021-05-02 14:43:10 -07:00
|
|
|
#endif
|