1#undef __ae2f_MACRO_GENERATED
2#define __ae2f_MACRO_GENERATED 1
6#define ae2f_NEED_CLASS 0
8#include <ae2fVK/clspv_clkeys.h>
9#undef __ae2f_MACRO_GENERATED
10#define __ae2f_MACRO_GENERATED 1
11#include <ae2f/Ann/Slp.core.h>
12#undef __ae2f_MACRO_GENERATED
13#define __ae2f_MACRO_GENERATED 1
14#include <ae2f/Ann/Slp.auto.h>
15#undef __ae2f_MACRO_GENERATED
16#define __ae2f_MACRO_GENERATED 1
18#undef __ae2f_MACRO_GENERATED
19#define __ae2f_MACRO_GENERATED 1
38)\
39{
40 if((iidx) == 0
&& (oidx) < (osz)) {
41 _clSlpPredict_t _v_predict;
42 (_v_predict).m_tmp = 0
;
43 for((_v_predict).m_j = (isz); (_v_predict).m_j--;) {
45 += p_inp[(_v_predict).m_j] * p_weight[(_v_predict).m_j + (isz) * (oidx)];
48 (_v_predict).m_tmp += (p_bias)[oidx];
49 ACT(&(_v_predict).m_ret, (_v_predict).m_tmp);
50 (loc)[oidx] = (_v_predict).m_ret;
52}
59#define _clSlpPredict_Q(
74)\
75{
76 if((oidx) < (osz) && (iidx) < (isz)) {
78 (p_weight)[(oidx) * (isz) + (iidx)] * (p_inp)[iidx]
82 ACT((&(v_predict).m_ret), ((v_predict).m_sum + (p_bias)[oidx]));
83 (loc)[oidx] = (v_predict).m_ret;
86}
93#undef __ae2f_MACRO_GENERATED
95#define __ae2f_MACRO_GENERATED 0
#define ae2f_structdef(key, name)
__kernel void kTrainAuto(__global void *glob, __local ae2f_float_t *loc, lrlsz_t lr)
loc ae2f_float_t[lsz - 1][Page]: OutStream ae2f_float_t[lsz - 1][Page]: DeltaStream
#define p_weight
sizeof(ae2f_float_t) * pgsz_sqr * llsz
#define ACT(layer_idx, r, x)
#define ACT_DERIV(layer_idx, r, x)
#define p_outstream
sizeof(ae2f_float_t) * lsz * pgsz
__kernel void kPredictStream(__global void *glob, __local ae2f_float_t *loc, const uint32_t lsz)
loc ae2f_float_t[Page]: inp ae2f_float_t[Page]: out
#define p_deltastream
sizeof(ae2f_float_t) * pgsz * llsz
#define p_goal
sizeof(ae2f_float_t) * pgsz
#define p_bias
sizeof(ae2f_float_t) * pgsz * llsz
__kernel void kPredict(__global void *glob, __local ae2f_float_t *loc, const uint32_t lsz)
loc ae2f_float_t[Page]: inp ae2f_float_t[Page]: out
char STATIC_ASSERT_LRLSZEL_SZ[sizeof(lrlszel_t)==(sizeof(uint32_t) > sizeof(ae2f_float_t) ? sizeof(uint32_t) :sizeof(ae2f_float_t)) ? 1 :-1]
#define p_layerszlist
lsz * sizeof(uint32_t)
char STATIC_ASSERT_LRLSZ_SZ[sizeof(lrlsz_t)==sizeof(lrlszel_t) *3 ? 1 :-1]
__kernel void kFollow(__global void *glob, __local ae2f_float_t *loc, lrlsz_t lr)
loc ae2f_float_t[lsz - 1][Page]: OutStream ae2f_float_t[lsz - 1][Page]: DeltaStream
#define CLK_ALL_MEM_FENCE
Contains both LOCAL and GLOBAL.
size_t get_global_id(uint dimindx)
#define work_group_reduce_add(x)
size_t get_global_size(uint dimindx)
void barrier(cl_mem_fence_flags flags)
#define __ae2f_AnnSlpFollowOneW_imp(inp, delta, weight, learningrate, inp_sz, inp_idx, out_sz, out_idx)
Weights.
#define __ae2f_AnnSlpFollowOneB_imp(r_bias, delta, learningrate_bias)
#define __ae2f_AnnSlpFetchDeltaOne_imp(v_fetchdelta_0, v_fetchdelta_1, out, out_desired, actderiv_opt, lossderiv, retdelta, oidx, osz)
#define _clMlpGetHD1(r_delta_then, i_weight, i_delta, i_iidx, i_isz, i_oidx, i_osz)
#define _clMlpRvrse(v_tmp, r_delta_then, i_oidx, i_iidx, i_isz, i_actderiv_then, i_inp, i_deltaseed)
delta to delta Propagate
#define clMlpGetHD(...)
GetHidDelta Need no structure.
void clMlpGetHD1_t(ae2f_float_t *const r_delta, const ae2f_float_t *const i_weight, const ae2f_float_t *const i_delta, const size_t i_iidx, const size_t i_isz, const size_t i_oidx, const size_t i_osz)
#define _clMlpGetHD(ONE, r_delta_then, i_weight, i_delta, i_iidx, i_isz, i_oidx, i_osz)
#define _clSlpPredict(v_predict, loc, p_inp, p_weight, p_bias, iidx, isz, oidx, osz, ACT)
ae2f_AnnSlpPredictOne_t _clSlpPredict_t