Bug Summary

File:nnc/ccv_cnnp_model_addons.c
Warning:line 1149, column 2
The left operand of '%' is a garbage value

Annotated Source Code

Press '?' to see keyboard shortcuts

clang -cc1 -cc1 -triple x86_64-unknown-linux-gnu -analyze -disable-free -clear-ast-before-backend -disable-llvm-verifier -discard-value-names -main-file-name ccv_cnnp_model_addons.c -analyzer-checker=core -analyzer-checker=apiModeling -analyzer-checker=unix -analyzer-checker=deadcode -analyzer-checker=security.insecureAPI.UncheckedReturn -analyzer-checker=security.insecureAPI.getpw -analyzer-checker=security.insecureAPI.gets -analyzer-checker=security.insecureAPI.mktemp -analyzer-checker=security.insecureAPI.mkstemp -analyzer-checker=security.insecureAPI.vfork -analyzer-checker=nullability.NullPassedToNonnull -analyzer-checker=nullability.NullReturnedFromNonnull -analyzer-output plist -w -setup-static-analyzer -mrelocation-model pic -pic-level 2 -pic-is-pie -mframe-pointer=none -fmath-errno -ffp-contract=on -fno-rounding-math -mconstructor-aliases -funwind-tables=2 -target-cpu x86-64 -target-feature +sse2 -tune-cpu generic -debugger-tuning=gdb -fdebug-compilation-dir=/home/liu/actions-runner/_work/ccv/ccv/lib/nnc -fcoverage-compilation-dir=/home/liu/actions-runner/_work/ccv/ccv/lib/nnc -resource-dir /usr/local/lib/clang/19 -I ../ -I /usr/local/cuda/include -D HAVE_CBLAS -D HAVE_LIBPNG -D HAVE_LIBJPEG -D HAVE_FFTW3 -D HAVE_PTHREAD -D HAVE_LIBLINEAR -D HAVE_TESSERACT -D HAVE_AVCODEC -D HAVE_AVFORMAT -D HAVE_AVUTIL -D HAVE_SWSCALE -D HAVE_SSE2 -D HAVE_GSL -D HAVE_CUDA -D HAVE_CUDNN -D HAVE_NCCL -D USE_SYSTEM_CUB -I /usr/local/include -internal-isystem /usr/local/lib/clang/19/include -internal-isystem /usr/local/include -internal-isystem /usr/lib/gcc/x86_64-linux-gnu/12/../../../../x86_64-linux-gnu/include -internal-externc-isystem /usr/include/x86_64-linux-gnu -internal-externc-isystem /include -internal-externc-isystem /usr/include -O3 -ferror-limit 19 -fgnuc-version=4.2.1 -fskip-odr-check-in-gmf -vectorize-loops -vectorize-slp -analyzer-output=html -faddrsig -D__GCC_HAVE_DWARF2_CFI_ASM=1 -o /home/liu/actions-runner/_work/ccv/ccv/_analyze/2026-05-20-090030-2802958-1 -x c ccv_cnnp_model_addons.c
1#include "ccv_nnc.h"
2#include "ccv_nnc_easy.h"
3#include "ccv_nnc_internal.h"
4#include "ccv_internal.h"
5#include "_ccv_cnnp_model.h"
6
7// MARK - Add-on Functions
8
9static int _ccv_cnnp_model_clip_grad_norm_reduce_norm2(const ccv_nnc_cmd_t cmd, const ccv_nnc_hint_t hint, const int flags, ccv_nnc_tensor_t* const* const inputs, const int input_size, ccv_nnc_tensor_t* const* const outputs, const int output_size, ccv_nnc_stream_context_t* const stream_context)
10{
11 const int device_id = CCV_TENSOR_GET_DEVICE_ID(inputs[0]->info.type)(((inputs[0]->info.type) & 0xfff00) >> 8);
12 ccv_nnc_tensor_t* const old_norm2 = outputs[1 + device_id * 2];
13 ccv_nnc_tensor_t* const norm2 = outputs[1 + device_id * 2 + 1];
14 const int tensor_count = ccv_nnc_tensor_count(inputs[0]->info);
15 if (tensor_count == 1)
16 ccv_nnc_cmd_exec(CMD_MUL_FORWARD(1)ccv_nnc_cmd(CCV_NNC_MUL_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={1,}}}, 0)
, hint, flags, TENSOR_LIST(inputs[0], inputs[0])(ccv_nnc_tensor_t* []){inputs[0], inputs[0]}, (1 +1 +1 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_LIST(norm2)(ccv_nnc_tensor_t* []){norm2}, (1 +1 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, stream_context);
17 else {
18 ccv_nnc_cmd_exec(CMD_REDUCE_NORM2_FORWARD()ccv_nnc_cmd(CCV_NNC_REDUCE_NORM2_FORWARD, 0, ((ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.reduce={.count=(1 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1),.axis={}}}
), 0)
, hint, flags, TENSOR_LIST(inputs[0])(ccv_nnc_tensor_t* []){inputs[0]}, (1 +1 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_LIST(norm2)(ccv_nnc_tensor_t* []){norm2}, (1 +1 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, stream_context);
19 ccv_nnc_cmd_exec(CMD_MUL_FORWARD(1)ccv_nnc_cmd(CCV_NNC_MUL_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={1,}}}, 0)
, hint, flags, TENSOR_LIST(norm2, norm2)(ccv_nnc_tensor_t* []){norm2, norm2}, (1 +1 +1 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_LIST(norm2)(ccv_nnc_tensor_t* []){norm2}, (1 +1 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, stream_context);
20 }
21 ccv_nnc_cmd_exec(CMD_ADD_FORWARD(1, 1)ccv_nnc_cmd(CCV_NNC_ADD_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={1, 1}}}, 0)
, hint, flags, TENSOR_LIST(old_norm2, norm2)(ccv_nnc_tensor_t* []){old_norm2, norm2}, (1 +1 +1 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_LIST(old_norm2)(ccv_nnc_tensor_t* []){old_norm2}, (1 +1 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, stream_context);
22 return CCV_NNC_EXEC_SUCCESS;
23}
24
25static ccv_nnc_cmd_vtab_t clip_grad_norm_reduce_norm2_vtab = {
26 .exec = _ccv_cnnp_model_clip_grad_norm_reduce_norm2
27};
28
29static int _ccv_cnnp_model_clip_grad_norm_scatter_norm2(const ccv_nnc_cmd_t cmd, const ccv_nnc_hint_t hint, const int flags, ccv_nnc_tensor_t* const* const inputs, const int input_size, ccv_nnc_tensor_t* const* const outputs, const int output_size, ccv_nnc_stream_context_t* const stream_context)
30{
31 const int device_id = CCV_TENSOR_GET_DEVICE_ID(inputs[0]->info.type)(((inputs[0]->info.type) & 0xfff00) >> 8);
32 ccv_nnc_tensor_t* const norm2 = inputs[1 + device_id * 2];
33 ccv_nnc_cmd_exec(CMD_MUL_FORWARD(1)ccv_nnc_cmd(CCV_NNC_MUL_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={1,}}}, 0)
, hint, flags, TENSOR_LIST(inputs[0], norm2)(ccv_nnc_tensor_t* []){inputs[0], norm2}, (1 +1 +1 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_LIST(outputs[0])(ccv_nnc_tensor_t* []){outputs[0]}, (1 +1 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, stream_context);
34 return CCV_NNC_EXEC_SUCCESS;
35}
36
37static ccv_nnc_cmd_vtab_t clip_grad_norm_scatter_norm2_vtab = {
38 .exec = _ccv_cnnp_model_clip_grad_norm_scatter_norm2
39};
40
41void ccv_cnnp_model_parameters_clip_grad_norm(ccv_cnnp_model_t* const model, const ccv_cnnp_model_io_t parameters, int norm_type, float max_norm, ccv_nnc_stream_context_t* const stream_context)
42{
43 assert(norm_type == 2)((void) sizeof ((norm_type == 2) ? 1 : 0), __extension__ ({ if
(norm_type == 2) ; else __assert_fail ("norm_type == 2", "ccv_cnnp_model_addons.c"
, 43, __extension__ __PRETTY_FUNCTION__); }))
;
44 ccv_cnnp_compiled_data_t* const compiled_data = model->compiled_data;
45 assert(compiled_data)((void) sizeof ((compiled_data) ? 1 : 0), __extension__ ({ if
(compiled_data) ; else __assert_fail ("compiled_data", "ccv_cnnp_model_addons.c"
, 45, __extension__ __PRETTY_FUNCTION__); }))
;
46 const int parallel_count = ccv_max(model->parallel_count, 1)({ typeof (model->parallel_count) _a = (model->parallel_count
); typeof (1) _b = (1); (_a > _b) ? _a : _b; })
;
47 ccv_nnc_tensor_t* norm2[parallel_count * 2];
48 ccv_nnc_tensor_t* max_normt[parallel_count];
49 const int stream_type = model->compiled_data->stream_type;
50 int i;
51 if (stream_type == CCV_STREAM_CONTEXT_GPU)
52 {
53 for (i = 0; i < parallel_count; i++)
54 {
55 ccv_nnc_tensor_param_t info = {
56 .type = CCV_TENSOR_GPU_MEMORY,
57 .format = CCV_TENSOR_FORMAT_NHWC,
58 .datatype = CCV_32F,
59 .dim = {1},
60 };
61 CCV_TENSOR_SET_DEVICE_ID(info.type, i)(info.type) = (((info.type) & ~0xfff00) | (((i) & 0xfff
) << 8))
;
62 norm2[i * 2] = ccv_nnc_tensor_new(ccv_nnc_xpu_alloc(&compiled_data->xpu_alloc, i, stream_context, ccv_nnc_tensor_data_size(info)), info, 0);
63 norm2[i * 2 + 1] = ccv_nnc_tensor_new(ccv_nnc_xpu_alloc(&compiled_data->xpu_alloc, i, stream_context, ccv_nnc_tensor_data_size(info)), info, 0);
64 max_normt[i] = ccv_nnc_tensor_new(ccv_nnc_xpu_alloc(&compiled_data->xpu_alloc, i, stream_context, ccv_nnc_tensor_data_size(info)), info, 0);
65 }
66 } else {
67 for (i = 0; i < parallel_count; i++)
68 {
69 ccv_nnc_tensor_param_t info = {
70 .type = CCV_TENSOR_CPU_MEMORY,
71 .format = CCV_TENSOR_FORMAT_NHWC,
72 .datatype = CCV_32F,
73 .dim = {1},
74 };
75 norm2[i * 2] = ccv_nnc_tensor_new(0, info, 0);
76 norm2[i * 2 + 1] = ccv_nnc_tensor_new(0, info, 0);
77 max_normt[i] = ccv_nnc_tensor_new(0, info, 0);
78 }
79 }
80 // zero out old norm2.
81 if (parallel_count > 1)
82 {
83 ccv_nnc_stream_context_t* streams[parallel_count];
84 ccv_nnc_stream_signal_t* signal;
85 if (stream_context)
86 signal = ccv_nnc_stream_context_emit_signal_new(stream_context);
87 for (i = 0; i < parallel_count; i++)
88 {
89 const int stream_type = CCV_TENSOR_GET_MEMORY(norm2[i * 2]->info.type)((norm2[i * 2]->info.type) & 0x3) == CCV_TENSOR_GPU_MEMORY ? CCV_STREAM_CONTEXT_GPU : CCV_STREAM_CONTEXT_CPU;
90 const int device_id = CCV_TENSOR_GET_DEVICE_ID(norm2[i * 2]->info.type)(((norm2[i * 2]->info.type) & 0xfff00) >> 8);
91 int type = stream_type;
92 CCV_STREAM_SET_DEVICE_ID(type, device_id)(type) = (((type) & ~0xfff00) | (((device_id) & 0xfff
) << 8))
;
93 ccv_nnc_stream_context_t* const stream_0 = ccv_cnnp_compiled_data_get_stream(compiled_data, type);
94 // Wait signal to finish.
95 if (stream_context)
96 ccv_nnc_stream_context_wait_signal(stream_0, signal);
97 ccv_nnc_cmd_exec(CMD_SET_FORWARD(0)ccv_nnc_cmd(CCV_NNC_SET_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={0,}}}, 0)
, ccv_nnc_no_hint, 0, 0, 0, TENSOR_LIST(norm2[i * 2])(ccv_nnc_tensor_t* []){norm2[i * 2]}, (1 +1 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, stream_0);
98 if (stream_context)
99 {
100 ccv_nnc_stream_signal_t* const signal = ccv_nnc_stream_context_emit_signal_new(stream_0);
101 ccv_nnc_stream_context_wait_signal(stream_context, signal);
102 }
103 streams[i] = stream_0;
104 }
105 // If this should be blocking, blocking it.
106 if (!stream_context)
107 for (i = 0; i < parallel_count; i++)
108 if (streams[i])
109 ccv_nnc_stream_context_wait(streams[i]);
110 } else {
111 ccv_nnc_cmd_exec(CMD_SET_FORWARD(0)ccv_nnc_cmd(CCV_NNC_SET_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={0,}}}, 0)
, ccv_nnc_no_hint, 0, 0, 0, TENSOR_LIST(norm2[0])(ccv_nnc_tensor_t* []){norm2[0]}, (1 +1 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, stream_context);
112 }
113 // Gather norm2.
114 ccv_nnc_cmd_t reduce_cmd = {
115 .cmd = CCV_NNC_CUSTOM_FORWARD,
116 .isa = &clip_grad_norm_reduce_norm2_vtab,
117 };
118 ccv_cnnp_model_parameter_gradients_map(model, parameters, reduce_cmd, ccv_nnc_no_hint, 0, 0, 0, norm2, parallel_count * 2, stream_context);
119 // Now compute max(max_norm / norm2, 1.0).
120 if (parallel_count > 1)
121 {
122 ccv_nnc_stream_context_t* streams[parallel_count];
123 ccv_nnc_stream_signal_t* signal;
124 if (stream_context)
125 signal = ccv_nnc_stream_context_emit_signal_new(stream_context);
126 for (i = 0; i < parallel_count; i++)
127 {
128 const int stream_type = CCV_TENSOR_GET_MEMORY(norm2[i * 2]->info.type)((norm2[i * 2]->info.type) & 0x3) == CCV_TENSOR_GPU_MEMORY ? CCV_STREAM_CONTEXT_GPU : CCV_STREAM_CONTEXT_CPU;
129 const int device_id = CCV_TENSOR_GET_DEVICE_ID(norm2[i * 2]->info.type)(((norm2[i * 2]->info.type) & 0xfff00) >> 8);
130 int type = stream_type;
131 CCV_STREAM_SET_DEVICE_ID(type, device_id)(type) = (((type) & ~0xfff00) | (((device_id) & 0xfff
) << 8))
;
132 ccv_nnc_stream_context_t* const stream_0 = ccv_cnnp_compiled_data_get_stream(compiled_data, type);
133 // Wait signal to finish.
134 if (stream_context)
135 ccv_nnc_stream_context_wait_signal(stream_0, signal);
136 ccv_nnc_cmd_exec(CMD_EWSQRT_FORWARD()ccv_nnc_cmd(CCV_NNC_EWSQRT_FORWARD, 0, ccv_nnc_cmd_auto, 0), ccv_nnc_no_hint, 0, TENSOR_LIST(norm2[i * 2])(ccv_nnc_tensor_t* []){norm2[i * 2]}, (1 +1 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_LIST(norm2[i * 2])(ccv_nnc_tensor_t* []){norm2[i * 2]}, (1 +1 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, stream_0);
137 ccv_nnc_cmd_exec(CMD_SET_FORWARD(max_norm)ccv_nnc_cmd(CCV_NNC_SET_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={max_norm,}}}, 0)
, ccv_nnc_no_hint, 0, 0, 0, TENSOR_LIST(max_normt[i])(ccv_nnc_tensor_t* []){max_normt[i]}, (1 +1 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, stream_0);
138 ccv_nnc_cmd_exec(CMD_EWDIV_FORWARD()ccv_nnc_cmd(CCV_NNC_EWDIV_FORWARD, 0, ccv_nnc_cmd_auto, 0), ccv_nnc_no_hint, 0, TENSOR_LIST(max_normt[i], norm2[i * 2])(ccv_nnc_tensor_t* []){max_normt[i], norm2[i * 2]}, (1 +1 +1 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1
)
, TENSOR_LIST(norm2[i * 2])(ccv_nnc_tensor_t* []){norm2[i * 2]}, (1 +1 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, stream_0);
139 ccv_nnc_cmd_exec(CMD_CLAMP_FORWARD(NAN, 1)ccv_nnc_cmd(CCV_NNC_CLAMP_FORWARD, 0, (ccv_nnc_cmd_param_t){.
size={.dim={1,1,1}},.clamp={.min=(__builtin_nanf ("")),.max=1
}}, 0)
, ccv_nnc_no_hint, 0, TENSOR_LIST(norm2[i * 2])(ccv_nnc_tensor_t* []){norm2[i * 2]}, (1 +1 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_LIST(norm2[i * 2])(ccv_nnc_tensor_t* []){norm2[i * 2]}, (1 +1 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, stream_0);
140 if (stream_context)
141 {
142 ccv_nnc_stream_signal_t* const signal = ccv_nnc_stream_context_emit_signal_new(stream_0);
143 ccv_nnc_stream_context_wait_signal(stream_context, signal);
144 }
145 streams[i] = stream_0;
146 }
147 // If this should be blocking, blocking it.
148 if (!stream_context)
149 for (i = 0; i < parallel_count; i++)
150 if (streams[i])
151 ccv_nnc_stream_context_wait(streams[i]);
152 } else {
153 ccv_nnc_cmd_exec(CMD_EWSQRT_FORWARD()ccv_nnc_cmd(CCV_NNC_EWSQRT_FORWARD, 0, ccv_nnc_cmd_auto, 0), ccv_nnc_no_hint, 0, TENSOR_LIST(norm2[0])(ccv_nnc_tensor_t* []){norm2[0]}, (1 +1 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_LIST(norm2[0])(ccv_nnc_tensor_t* []){norm2[0]}, (1 +1 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, stream_context);
154 ccv_nnc_cmd_exec(CMD_SET_FORWARD(max_norm)ccv_nnc_cmd(CCV_NNC_SET_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={max_norm,}}}, 0)
, ccv_nnc_no_hint, 0, 0, 0, TENSOR_LIST(max_normt[0])(ccv_nnc_tensor_t* []){max_normt[0]}, (1 +1 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, stream_context);
155 ccv_nnc_cmd_exec(CMD_EWDIV_FORWARD()ccv_nnc_cmd(CCV_NNC_EWDIV_FORWARD, 0, ccv_nnc_cmd_auto, 0), ccv_nnc_no_hint, 0, TENSOR_LIST(max_normt[0], norm2[0])(ccv_nnc_tensor_t* []){max_normt[0], norm2[0]}, (1 +1 +1 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_LIST(norm2[0])(ccv_nnc_tensor_t* []){norm2[0]}, (1 +1 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, stream_context);
156 ccv_nnc_cmd_exec(CMD_CLAMP_FORWARD(NAN, 1)ccv_nnc_cmd(CCV_NNC_CLAMP_FORWARD, 0, (ccv_nnc_cmd_param_t){.
size={.dim={1,1,1}},.clamp={.min=(__builtin_nanf ("")),.max=1
}}, 0)
, ccv_nnc_no_hint, 0, TENSOR_LIST(norm2[0])(ccv_nnc_tensor_t* []){norm2[0]}, (1 +1 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_LIST(norm2[0])(ccv_nnc_tensor_t* []){norm2[0]}, (1 +1 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, stream_context);
157 }
158 ccv_nnc_cmd_t scatter_cmd = {
159 .cmd = CCV_NNC_CUSTOM_FORWARD,
160 .isa = &clip_grad_norm_scatter_norm2_vtab,
161 };
162 ccv_cnnp_model_parameter_gradients_map(model, parameters, scatter_cmd, ccv_nnc_no_hint, 0, norm2, parallel_count * 2, 0, 0, stream_context);
163 if (stream_type == CCV_STREAM_CONTEXT_GPU)
164 for (i = 0; i < parallel_count; i++)
165 {
166 ccv_nnc_xpu_free(&compiled_data->xpu_alloc, norm2[i * 2]->data.u8);
167 ccv_nnc_xpu_free(&compiled_data->xpu_alloc, norm2[i * 2 + 1]->data.u8);
168 ccv_nnc_xpu_free(&compiled_data->xpu_alloc, max_normt[i]->data.u8);
169 }
170 for (i = 0; i < parallel_count; i++)
171 {
172 ccv_nnc_tensor_free(norm2[i * 2]);
173 ccv_nnc_tensor_free(norm2[i * 2 + 1]);
174 ccv_nnc_tensor_free(max_normt[i]);
175 }
176}
177
178// MARK - Add-on Functions
179
180static int _ccv_cnnp_model_isnan(const ccv_nnc_cmd_t cmd, const ccv_nnc_hint_t hint, const int flags, ccv_nnc_tensor_t* const* const inputs, const int input_size, ccv_nnc_tensor_t* const* const outputs, const int output_size, ccv_nnc_stream_context_t* const stream_context)
181{
182 const int device_id = CCV_TENSOR_GET_DEVICE_ID(inputs[0]->info.type)(((inputs[0]->info.type) & 0xfff00) >> 8);
183 ccv_nnc_tensor_t* const old_isnanr = outputs[1 + device_id * 2];
184 ccv_nnc_tensor_t* const isnanr = outputs[1 + device_id * 2 + 1];
185 ccv_nnc_cmd_t reduce_cmd = CMD_REDUCE_ISNAN_FORWARD()ccv_nnc_cmd(CCV_NNC_REDUCE_ISNAN_FORWARD, 0, ((ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.reduce={.count=(1 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1),.axis={}}}
), 0)
;
186 reduce_cmd.info.reduce.count = ccv_nnc_tensor_nd(inputs[0]->info.dim);
187 int i;
188 for (i = 0; i < cmd.info.reduce.count; i++)
189 reduce_cmd.info.reduce.axis[i] = i;
190 ccv_nnc_cmd_exec(reduce_cmd, hint, flags, TENSOR_LIST(inputs[0])(ccv_nnc_tensor_t* []){inputs[0]}, (1 +1 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_LIST(isnanr)(ccv_nnc_tensor_t* []){isnanr}, (1 +1 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, stream_context);
191 ccv_nnc_cmd_exec(CMD_EWSUM_FORWARD()ccv_nnc_cmd(CCV_NNC_EWSUM_FORWARD, 0, ccv_nnc_cmd_auto, 0), hint, flags, TENSOR_LIST(old_isnanr, isnanr)(ccv_nnc_tensor_t* []){old_isnanr, isnanr}, (1 +1 +1 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_LIST(old_isnanr)(ccv_nnc_tensor_t* []){old_isnanr}, (1 +1 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, stream_context);
192 return CCV_NNC_EXEC_SUCCESS;
193}
194
195static ccv_nnc_cmd_vtab_t reduce_isnan_vtab = {
196 .exec = _ccv_cnnp_model_isnan
197};
198
199int ccv_cnnp_model_parameter_gradients_isnan(ccv_cnnp_model_t* const model, const ccv_cnnp_model_io_t parameters, ccv_nnc_stream_context_t* const stream_context)
200{
201 ccv_cnnp_compiled_data_t* const compiled_data = model->compiled_data;
202 assert(compiled_data)((void) sizeof ((compiled_data) ? 1 : 0), __extension__ ({ if
(compiled_data) ; else __assert_fail ("compiled_data", "ccv_cnnp_model_addons.c"
, 202, __extension__ __PRETTY_FUNCTION__); }))
;
203 const int parallel_count = ccv_max(model->parallel_count, 1)({ typeof (model->parallel_count) _a = (model->parallel_count
); typeof (1) _b = (1); (_a > _b) ? _a : _b; })
;
204 ccv_nnc_tensor_t* isnanr[parallel_count * 2];
205 const int stream_type = model->compiled_data->stream_type;
206 int i;
207 if (stream_type == CCV_STREAM_CONTEXT_GPU)
208 {
209 for (i = 0; i < parallel_count; i++)
210 {
211 ccv_nnc_tensor_param_t info = {
212 .type = CCV_TENSOR_GPU_MEMORY,
213 .format = CCV_TENSOR_FORMAT_NHWC,
214 .datatype = CCV_32S,
215 .dim = {1},
216 };
217 CCV_TENSOR_SET_DEVICE_ID(info.type, i)(info.type) = (((info.type) & ~0xfff00) | (((i) & 0xfff
) << 8))
;
218 isnanr[i * 2] = ccv_nnc_tensor_new(ccv_nnc_xpu_alloc(&compiled_data->xpu_alloc, i, stream_context, ccv_nnc_tensor_data_size(info)), info, 0);
219 isnanr[i * 2 + 1] = ccv_nnc_tensor_new(ccv_nnc_xpu_alloc(&compiled_data->xpu_alloc, i, stream_context, ccv_nnc_tensor_data_size(info)), info, 0);
220 }
221 } else {
222 for (i = 0; i < parallel_count; i++)
223 {
224 ccv_nnc_tensor_param_t info = {
225 .type = CCV_TENSOR_CPU_MEMORY,
226 .format = CCV_TENSOR_FORMAT_NHWC,
227 .datatype = CCV_32S,
228 .dim = {1},
229 };
230 isnanr[i * 2] = ccv_nnc_tensor_new(0, info, 0);
231 isnanr[i * 2 + 1] = ccv_nnc_tensor_new(0, info, 0);
232 }
233 }
234 // zero out old isnanr.
235 if (parallel_count > 1)
236 {
237 ccv_nnc_stream_context_t* streams[parallel_count];
238 ccv_nnc_stream_signal_t* signal;
239 if (stream_context)
240 signal = ccv_nnc_stream_context_emit_signal_new(stream_context);
241 for (i = 0; i < parallel_count; i++)
242 {
243 const int stream_type = CCV_TENSOR_GET_MEMORY(isnanr[i * 2]->info.type)((isnanr[i * 2]->info.type) & 0x3) == CCV_TENSOR_GPU_MEMORY ? CCV_STREAM_CONTEXT_GPU : CCV_STREAM_CONTEXT_CPU;
244 const int device_id = CCV_TENSOR_GET_DEVICE_ID(isnanr[i * 2]->info.type)(((isnanr[i * 2]->info.type) & 0xfff00) >> 8);
245 int type = stream_type;
246 CCV_STREAM_SET_DEVICE_ID(type, device_id)(type) = (((type) & ~0xfff00) | (((device_id) & 0xfff
) << 8))
;
247 ccv_nnc_stream_context_t* const stream_0 = ccv_cnnp_compiled_data_get_stream(compiled_data, type);
248 // Wait signal to finish.
249 if (stream_context)
250 ccv_nnc_stream_context_wait_signal(stream_0, signal);
251 ccv_nnc_cmd_exec(CMD_SET_FORWARD(0)ccv_nnc_cmd(CCV_NNC_SET_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={0,}}}, 0)
, ccv_nnc_no_hint, 0, 0, 0, TENSOR_LIST(isnanr[i * 2])(ccv_nnc_tensor_t* []){isnanr[i * 2]}, (1 +1 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, stream_0);
252 if (stream_context)
253 {
254 ccv_nnc_stream_signal_t* const signal = ccv_nnc_stream_context_emit_signal_new(stream_0);
255 ccv_nnc_stream_context_wait_signal(stream_context, signal);
256 }
257 streams[i] = stream_0;
258 }
259 // If this should be blocking, blocking it.
260 if (!stream_context)
261 for (i = 0; i < parallel_count; i++)
262 if (streams[i])
263 ccv_nnc_stream_context_wait(streams[i]);
264 } else
265 ccv_nnc_cmd_exec(CMD_SET_FORWARD(0)ccv_nnc_cmd(CCV_NNC_SET_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={0,}}}, 0)
, ccv_nnc_no_hint, 0, 0, 0, TENSOR_LIST(isnanr[0])(ccv_nnc_tensor_t* []){isnanr[0]}, (1 +1 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, stream_context);
266 // Gather isnanr.
267 ccv_nnc_cmd_t reduce_cmd = {
268 .cmd = CCV_NNC_CUSTOM_FORWARD,
269 .isa = &reduce_isnan_vtab,
270 };
271 ccv_cnnp_model_parameter_gradients_map(model, parameters, reduce_cmd, ccv_nnc_no_hint, 0, 0, 0, isnanr, parallel_count * 2, stream_context);
272 for (i = 0; i < parallel_count; i++)
273 ccv_nnc_tensor_free(isnanr[i * 2 + 1]);
274 int retval = 0;
275 if (stream_type == CCV_TENSOR_GPU_MEMORY)
276 {
277 ccv_nnc_tensor_param_t info = {
278 .type = CCV_TENSOR_CPU_MEMORY,
279 .format = CCV_TENSOR_FORMAT_NHWC,
280 .datatype = CCV_32S,
281 .dim = {1},
282 };
283 ccv_nnc_tensor_t* checknan = ccv_nnc_tensor_new(0, info, 0);
284 for (i = 0; i < parallel_count; i++)
285 {
286 ccv_nnc_cmd_exec(CMD_DATA_TRANSFER_FORWARD()ccv_nnc_cmd(CCV_NNC_DATA_TRANSFER_FORWARD, 0, ccv_nnc_cmd_auto
, 0)
, ccv_nnc_no_hint, 0, TENSOR_LIST(isnanr[i * 2])(ccv_nnc_tensor_t* []){isnanr[i * 2]}, (1 +1 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_LIST(checknan)(ccv_nnc_tensor_t* []){checknan}, (1 +1 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, 0);
287 if (checknan->data.i32[0] > 0)
288 {
289 retval = 1;
290 break;
291 }
292 }
293 ccv_nnc_tensor_free(checknan);
294 } else {
295 for (i = 0; i < parallel_count; i++)
296 if (isnanr[i * 2]->data.i32[0] > 0)
297 {
298 retval = 1;
299 break;
300 }
301 }
302 for (i = 0; i < parallel_count; i++)
303 ccv_nnc_tensor_free(isnanr[i * 2]);
304 return retval;
305}
306
307// MARK - Core Layers
308
309static void _ccv_cnnp_sum_build(ccv_cnnp_model_t* const self, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
310{
311 PRINT(CCV_CLI_VERBOSE, "[cnnp_sum_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_sum_build] -\n"); fflush(stdout); } } while (
0)
;
312 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 312, __extension__ __PRETTY_FUNCTION__
); }))
;
313 outputs[0] = ccv_nnc_tensor_symbol_new(graph, ccv_nnc_tensor_symbol_params(graph, inputs[0]), 0);
314 ccv_nnc_graph_exec_symbol_new(graph, CMD_EWSUM_FORWARD()ccv_nnc_cmd(CCV_NNC_EWSUM_FORWARD, 0, ccv_nnc_cmd_auto, 0), inputs, input_size, outputs, output_size, 0);
315}
316
317static ccv_cnnp_model_t* _ccv_cnnp_sum_copy(const ccv_cnnp_model_t* const self, void* const context);
318
319static const ccv_cnnp_model_vtab_t ccv_cnnp_sum_isa = {
320 .build = _ccv_cnnp_sum_build,
321 .copy = _ccv_cnnp_sum_copy,
322};
323
324typedef struct {
325 ccv_cnnp_model_t super;
326 ccv_nnc_tensor_symbol_t output;
327} ccv_cnnp_model_sum_t;
328
329ccv_cnnp_model_t* ccv_cnnp_sum(const char* const name)
330{
331 ccv_cnnp_model_sum_t* const model_sum = (ccv_cnnp_model_sum_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_sum_t));
332 model_sum->super.isa = &ccv_cnnp_sum_isa;
333 model_sum->super.input_size = 0;
334 model_sum->super.outputs = &model_sum->output;
335 model_sum->super.output_size = 1;
336 ccv_cnnp_model_copy_name(&model_sum->super, name);
337 return (ccv_cnnp_model_t*)model_sum;
338}
339
340static ccv_cnnp_model_t* _ccv_cnnp_sum_copy(const ccv_cnnp_model_t* const self, void* const context)
341{
342 return ccv_cnnp_sum(self->name);
343}
344
345typedef struct {
346 ccv_cnnp_model_t super;
347 int axis;
348 ccv_nnc_tensor_symbol_t output;
349} ccv_cnnp_model_concat_t;
350
351static void _ccv_cnnp_concat_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
352{
353 const ccv_cnnp_model_concat_t* const self = (const ccv_cnnp_model_concat_t*)super;
354 PRINT(CCV_CLI_VERBOSE, "[cnnp_concat_build] 1. -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_concat_build] 1. -\n"); fflush(stdout); } } while
(0)
;
355 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 355, __extension__ __PRETTY_FUNCTION__
); }))
;
356 ccv_nnc_tensor_param_t output_params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
357 int i, j;
358 if (output_params.dim[0] == 0)
359 for (i = 1; i < input_size; i++)
360 {
361 output_params = ccv_nnc_tensor_symbol_params(graph, inputs[i]);
362 if (output_params.dim[0] != 0)
363 break;
364 }
365 const int nd = ccv_nnc_tensor_nd(output_params.dim);
366 const int axis = self->axis;
367 assert(axis < nd)((void) sizeof ((axis < nd) ? 1 : 0), __extension__ ({ if (
axis < nd) ; else __assert_fail ("axis < nd", "ccv_cnnp_model_addons.c"
, 367, __extension__ __PRETTY_FUNCTION__); }))
;
368 output_params.dim[axis] = 0;
369 int input_is_contiguous = 1;
370 for (i = 0; i < input_size; i++)
371 {
372 const ccv_nnc_tensor_param_t input_params = ccv_nnc_tensor_symbol_params(graph, inputs[i]);
373 const int input_nd = ccv_nnc_tensor_nd(input_params.dim);
374 if (input_nd == 0)
375 {
376 PRINT(CCV_CLI_VERBOSE, "[cnnp_concat_build] %d. input[%d]: -\n", i + 2, i)do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_concat_build] %d. input[%d]: -\n", i + 2, i)
; fflush(stdout); } } while (0)
;
377 input_is_contiguous = 0;
378 continue;
379 }
380 if (CCV_CLI_OUTPUT_LEVEL_IS(CCV_CLI_VERBOSE)(CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
381 {
382 PRINT(CCV_CLI_VERBOSE, "[cnnp_concat_build] %d. input[%d]: (%d", i + 2, i, input_params.dim[0])do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_concat_build] %d. input[%d]: (%d", i + 2, i,
input_params.dim[0]); fflush(stdout); } } while (0)
;
383 int i;
384 for (i = 1; i < CCV_NNC_MAX_DIM_ALLOC(12) && input_params.dim[i] > 0; i++)
385 PRINT(CCV_CLI_VERBOSE, ", %d", input_params.dim[i])do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf(", %d", input_params.dim[i]); fflush(stdout); } } while
(0)
;
386 PRINT(CCV_CLI_VERBOSE, ")\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf(")\n"); fflush(stdout); } } while (0)
;
387 }
388 assert(input_nd == nd)((void) sizeof ((input_nd == nd) ? 1 : 0), __extension__ ({ if
(input_nd == nd) ; else __assert_fail ("input_nd == nd", "ccv_cnnp_model_addons.c"
, 388, __extension__ __PRETTY_FUNCTION__); }))
;
389 for (j = 0; j < nd; j++)
390 if (j != axis)
391 { assert(input_params.dim[j] == output_params.dim[j])((void) sizeof ((input_params.dim[j] == output_params.dim[j])
? 1 : 0), __extension__ ({ if (input_params.dim[j] == output_params
.dim[j]) ; else __assert_fail ("input_params.dim[j] == output_params.dim[j]"
, "ccv_cnnp_model_addons.c", 391, __extension__ __PRETTY_FUNCTION__
); }))
; }
392 output_params.dim[axis] += input_params.dim[axis];
393 }
394 outputs[0] = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
395 int ofs[CCV_NNC_MAX_DIM_ALLOC(12)] = {};
396 int stride[CCV_NNC_MAX_DIM_ALLOC(12)] = {};
397 ccv_nnc_tensor_get_stride(output_params.dim, stride);
398 if (input_is_contiguous)
399 {
400 ccv_nnc_tensor_symbol_t aliases[input_size];
401 for (i = 0; i < input_size; i++)
402 {
403 const ccv_nnc_tensor_param_t input_params = ccv_nnc_tensor_symbol_params(graph, inputs[i]);
404 aliases[i] = ccv_nnc_tensor_symbol_alias_new(graph, outputs[0], ofs, stride, input_params, 0);
405 ofs[axis] += input_params.dim[axis];
406 }
407 // Format transform is more flexible.
408 ccv_nnc_graph_exec_symbol_new(graph, CMD_FORMAT_TRANSFORM_FORWARD()ccv_nnc_cmd(CCV_NNC_FORMAT_TRANSFORM_FORWARD, 0, ccv_nnc_cmd_auto
, 0)
, inputs, input_size, aliases, input_size, "concat");
409 } else {
410 ccv_nnc_tensor_symbol_t aliases[input_size];
411 for (i = 0; i < input_size; i++)
412 {
413 const ccv_nnc_tensor_param_t input_params = ccv_nnc_tensor_symbol_params(graph, inputs[i]);
414 if (input_params.dim[0] == 0)
415 {
416 // Create a new alias anyway, but not going to use it, in this way, the alias count will match during absorb.
417 aliases[i] = ccv_nnc_tensor_symbol_alias_new(graph, outputs[0], ofs, stride, input_params, 0);
418 continue;
419 }
420 aliases[i] = ccv_nnc_tensor_symbol_alias_new(graph, outputs[0], ofs, stride, input_params, 0);
421 ofs[axis] += input_params.dim[axis];
422 }
423 // Format transform is more flexible.
424 ccv_nnc_graph_exec_symbol_new(graph, CMD_FORMAT_TRANSFORM_FORWARD()ccv_nnc_cmd(CCV_NNC_FORMAT_TRANSFORM_FORWARD, 0, ccv_nnc_cmd_auto
, 0)
, inputs, input_size, aliases, input_size, "concat");
425 }
426}
427
428static ccv_cnnp_model_t* _ccv_cnnp_concat_copy(const ccv_cnnp_model_t* const self, void* const context);
429
430static const ccv_cnnp_model_vtab_t ccv_cnnp_concat_isa = {
431 .build = _ccv_cnnp_concat_build,
432 .copy = _ccv_cnnp_concat_copy,
433};
434
435ccv_cnnp_model_t* ccv_cnnp_concat(const int axis, const char* const name)
436{
437 ccv_cnnp_model_concat_t* const model_concat = (ccv_cnnp_model_concat_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_concat_t));
438 model_concat->super.isa = &ccv_cnnp_concat_isa;
439 model_concat->super.input_size = 0;
440 model_concat->super.outputs = &model_concat->output;
441 model_concat->super.output_size = 1;
442 model_concat->axis = axis;
443 ccv_cnnp_model_copy_name(&model_concat->super, name);
444 return (ccv_cnnp_model_t*)model_concat;
445}
446
447static ccv_cnnp_model_t* _ccv_cnnp_concat_copy(const ccv_cnnp_model_t* const super, void* const context)
448{
449 const ccv_cnnp_model_concat_t* const self = (const ccv_cnnp_model_concat_t*)super;
450 return ccv_cnnp_concat(self->axis, self->super.name);
451}
452
453typedef struct {
454 ccv_cnnp_model_t super;
455 int axis;
456 ccv_nnc_tensor_symbol_t outputs[1];
457} ccv_cnnp_model_chunk_t;
458
459static void _ccv_cnnp_chunk_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
460{
461 const ccv_cnnp_model_concat_t* const self = (const ccv_cnnp_model_concat_t*)super;
462 PRINT(CCV_CLI_VERBOSE, "[cnnp_chunk_build] 1. axis: %d\n", self->axis)do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_chunk_build] 1. axis: %d\n", self->axis);
fflush(stdout); } } while (0)
;
463 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 463, __extension__ __PRETTY_FUNCTION__); }))
;
464 const ccv_nnc_tensor_param_t input_params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
465 if (CCV_CLI_OUTPUT_LEVEL_IS(CCV_CLI_VERBOSE)(CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
466 {
467 PRINT(CCV_CLI_VERBOSE, "[cnnp_chunk_build] 2. input: (%d", input_params.dim[0])do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_chunk_build] 2. input: (%d", input_params.dim
[0]); fflush(stdout); } } while (0)
;
468 int i;
469 for (i = 1; i < CCV_NNC_MAX_DIM_ALLOC(12) && input_params.dim[i] > 0; i++)
470 PRINT(CCV_CLI_VERBOSE, ", %d", input_params.dim[i])do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf(", %d", input_params.dim[i]); fflush(stdout); } } while
(0)
;
471 PRINT(CCV_CLI_VERBOSE, ")\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf(")\n"); fflush(stdout); } } while (0)
;
472 }
473 ccv_nnc_tensor_param_t output_params = input_params;
474 int i;
475 const int nd = ccv_nnc_tensor_nd(output_params.dim);
476 const int axis = self->axis;
477 assert(axis < nd)((void) sizeof ((axis < nd) ? 1 : 0), __extension__ ({ if (
axis < nd) ; else __assert_fail ("axis < nd", "ccv_cnnp_model_addons.c"
, 477, __extension__ __PRETTY_FUNCTION__); }))
;
478 const int n = self->super.output_size;
479 assert(n == output_size)((void) sizeof ((n == output_size) ? 1 : 0), __extension__ ({
if (n == output_size) ; else __assert_fail ("n == output_size"
, "ccv_cnnp_model_addons.c", 479, __extension__ __PRETTY_FUNCTION__
); }))
;
480 assert(output_params.dim[axis] % n == 0)((void) sizeof ((output_params.dim[axis] % n == 0) ? 1 : 0), __extension__
({ if (output_params.dim[axis] % n == 0) ; else __assert_fail
("output_params.dim[axis] % n == 0", "ccv_cnnp_model_addons.c"
, 480, __extension__ __PRETTY_FUNCTION__); }))
;
481 output_params.dim[axis] = output_params.dim[axis] / n;
482 int ofs[CCV_NNC_MAX_DIM_ALLOC(12)] = {};
483 int stride[CCV_NNC_MAX_DIM_ALLOC(12)] = {};
484 ccv_nnc_tensor_get_stride(input_params.dim, stride);
485 ccv_nnc_tensor_symbol_t to = ccv_nnc_tensor_symbol_alias_to(graph, inputs[0]);
486 if (to.d == CCV_NNC_NO_TENSOR_SYMBOL) // If we are not reshape an alias, it is straightforward.
487 {
488 for (i = 0; i < output_size; i++)
489 {
490 outputs[i] = ccv_nnc_tensor_symbol_alias_new(graph, inputs[0], ofs, stride, output_params, 0);
491 ofs[axis] += output_params.dim[axis];
492 }
493 } else {
494 // Otherwise, we need to check if it is permute. For permute, we cannot do alias directly.
495 // We need to first materialize the permute and then run reshape on top of it, otherwise it will be wrong.
496 int old_stride[CCV_NNC_MAX_DIM_ALLOC(12)];
497 ccv_nnc_tensor_symbol_alias_params(graph, inputs[0], 0, old_stride);
498 // We identify permute by checking if the stride is not in descending order.
499 // This also covered "permute" through reshape, rather than using ccv_cnnp_permute directly.
500 int i, no_permute = 1;
501 for (i = 1; no_permute && i < nd; i++)
502 if (old_stride[i - 1] < old_stride[i])
503 no_permute = 0;
504 if (no_permute)
505 { // Just straightforward reshape if there is no no permute.
506 for (i = 0; i < output_size; i++)
507 {
508 outputs[i] = ccv_nnc_tensor_symbol_alias_new(graph, inputs[0], ofs, old_stride, output_params, 0);
509 ofs[axis] += output_params.dim[axis];
510 }
511 } else {
512 // Otherwise, we first do format transform to plain tensor and then do reshape.
513 ccv_nnc_tensor_symbol_t permuted = ccv_nnc_tensor_symbol_new(graph, input_params, 0);
514 ccv_nnc_graph_exec_symbol_new(graph, CMD_FORMAT_TRANSFORM_FORWARD()ccv_nnc_cmd(CCV_NNC_FORMAT_TRANSFORM_FORWARD, 0, ccv_nnc_cmd_auto
, 0)
, TENSOR_SYMBOL_LIST(inputs[0])(const ccv_nnc_tensor_symbol_t []){inputs[0]}, (1 +1 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(permuted)(const ccv_nnc_tensor_symbol_t []){permuted}, (1 +1 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, "reshape");
515 for (i = 0; i < output_size; i++)
516 {
517 outputs[i] = ccv_nnc_tensor_symbol_alias_new(graph, permuted, ofs, stride, output_params, 0);
518 ofs[axis] += output_params.dim[axis];
519 }
520 }
521 }
522}
523
524static ccv_cnnp_model_t* _ccv_cnnp_chunk_copy(const ccv_cnnp_model_t* const self, void* const context);
525
526static const ccv_cnnp_model_vtab_t ccv_cnnp_chunk_isa = {
527 .build = _ccv_cnnp_chunk_build,
528 .copy = _ccv_cnnp_chunk_copy,
529};
530
531ccv_cnnp_model_t* ccv_cnnp_chunk(const int n, const int axis, const char* const name)
532{
533 assert(n >= 1)((void) sizeof ((n >= 1) ? 1 : 0), __extension__ ({ if (n >=
1) ; else __assert_fail ("n >= 1", "ccv_cnnp_model_addons.c"
, 533, __extension__ __PRETTY_FUNCTION__); }))
;
534 ccv_cnnp_model_chunk_t* const model_chunk = (ccv_cnnp_model_chunk_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_chunk_t) + sizeof(ccv_nnc_tensor_symbol_t) * (n - 1));
535 model_chunk->super.isa = &ccv_cnnp_chunk_isa;
536 model_chunk->super.input_size = 1;
537 model_chunk->super.outputs = model_chunk->outputs;
538 model_chunk->super.output_size = n;
539 model_chunk->axis = axis;
540 ccv_cnnp_model_copy_name(&model_chunk->super, name);
541 return (ccv_cnnp_model_t*)model_chunk;
542}
543
544static ccv_cnnp_model_t* _ccv_cnnp_chunk_copy(const ccv_cnnp_model_t* const super, void* const context)
545{
546 const ccv_cnnp_model_chunk_t* const self = (const ccv_cnnp_model_chunk_t*)super;
547 return ccv_cnnp_chunk(self->super.output_size, self->axis, self->super.name);
548}
549
550typedef struct {
551 ccv_cnnp_model_t super;
552 ccv_nnc_tensor_symbol_t output;
553 int format;
554 int dim[CCV_NNC_MAX_DIM_ALLOC(12)];
555 int ofs[CCV_NNC_MAX_DIM_ALLOC(12)];
556 int stride[CCV_NNC_MAX_DIM_ALLOC(12)];
557} ccv_cnnp_model_reshape_t;
558
559static void _ccv_cnnp_reshape_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
560{
561 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 561, __extension__ __PRETTY_FUNCTION__); }))
;
562 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 562, __extension__ __PRETTY_FUNCTION__
); }))
;
563 ccv_cnnp_model_reshape_t* const self = (ccv_cnnp_model_reshape_t*)super;
564 if (CCV_CLI_OUTPUT_LEVEL_IS(CCV_CLI_VERBOSE)(CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
565 {
566 PRINT(CCV_CLI_VERBOSE, "[cnnp_reshape_build] 1. dim: (%d", self->dim[0])do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_reshape_build] 1. dim: (%d", self->dim[0]
); fflush(stdout); } } while (0)
;
567 int i;
568 for (i = 1; i < CCV_NNC_MAX_DIM_ALLOC(12) && self->dim[i] > 0; i++)
569 PRINT(CCV_CLI_VERBOSE, ", %d", self->dim[i])do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf(", %d", self->dim[i]); fflush(stdout); } } while
(0)
;
570 const int count = i;
571 PRINT(CCV_CLI_VERBOSE, "), ofs: (%d", self->ofs[0])do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("), ofs: (%d", self->ofs[0]); fflush(stdout); } }
while (0)
;
572 for (i = 1; i < count; i++)
573 PRINT(CCV_CLI_VERBOSE, ", %d", self->ofs[i])do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf(", %d", self->ofs[i]); fflush(stdout); } } while
(0)
;
574 PRINT(CCV_CLI_VERBOSE, "), stride: (%d", self->stride[0])do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("), stride: (%d", self->stride[0]); fflush(stdout
); } } while (0)
;
575 for (i = 1; i < count; i++)
576 PRINT(CCV_CLI_VERBOSE, ", %d", self->stride[i])do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf(", %d", self->stride[i]); fflush(stdout); } } while
(0)
;
577 PRINT(CCV_CLI_VERBOSE, ")\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf(")\n"); fflush(stdout); } } while (0)
;
578 }
579 ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
580 int dim[CCV_NNC_MAX_DIM_ALLOC(12)];
581 memcpy(dim, self->dim, sizeof(dim));
582 int i, auto_idx = -1;
583 size_t known = 1;
584 const size_t tensor_count = ccv_nnc_tensor_count(params);
585 for (i = 0; i < CCV_NNC_MAX_DIM_ALLOC(12) && dim[i]; i++)
586 if (dim[i] == -1)
587 auto_idx = i;
588 else
589 known *= dim[i];
590 if (auto_idx >= 0)
591 {
592 assert(known > 0 && tensor_count % known == 0)((void) sizeof ((known > 0 && tensor_count % known
== 0) ? 1 : 0), __extension__ ({ if (known > 0 &&
tensor_count % known == 0) ; else __assert_fail ("known > 0 && tensor_count % known == 0"
, "ccv_cnnp_model_addons.c", 592, __extension__ __PRETTY_FUNCTION__
); }))
;
593 dim[auto_idx] = tensor_count / known;
594 }
595 if (CCV_CLI_OUTPUT_LEVEL_IS(CCV_CLI_VERBOSE)(CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
596 {
597 PRINT(CCV_CLI_VERBOSE, "[cnnp_reshape_build] 2. input: (%d", params.dim[0])do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_reshape_build] 2. input: (%d", params.dim[0]
); fflush(stdout); } } while (0)
;
598 int i;
599 for (i = 1; i < CCV_NNC_MAX_DIM_ALLOC(12) && params.dim[i] > 0; i++)
600 PRINT(CCV_CLI_VERBOSE, ", %d", params.dim[i])do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf(", %d", params.dim[i]); fflush(stdout); } } while (
0)
;
601 PRINT(CCV_CLI_VERBOSE, ")\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf(")\n"); fflush(stdout); } } while (0)
;
602 }
603 assert(ccv_nnc_dimension_count(dim) <= ccv_nnc_tensor_count(params))((void) sizeof ((ccv_nnc_dimension_count(dim) <= ccv_nnc_tensor_count
(params)) ? 1 : 0), __extension__ ({ if (ccv_nnc_dimension_count
(dim) <= ccv_nnc_tensor_count(params)) ; else __assert_fail
("ccv_nnc_dimension_count(dim) <= ccv_nnc_tensor_count(params)"
, "ccv_cnnp_model_addons.c", 603, __extension__ __PRETTY_FUNCTION__
); }))
;
604 ccv_nnc_tensor_symbol_t to = ccv_nnc_tensor_symbol_alias_to(graph, inputs[0]);
605 int stride_from_dim[CCV_NNC_MAX_DIM_ALLOC(12)];
606 if (to.d == CCV_NNC_NO_TENSOR_SYMBOL) // If we are not reshape an alias, it is straightforward.
607 {
608 memcpy(params.dim, dim, sizeof(params.dim));
609 int* stride;
610 if (self->stride[0] == 0)
611 {
612 ccv_nnc_tensor_get_stride(dim, stride_from_dim);
613 stride = stride_from_dim;
614 } else
615 stride = self->stride;
616 if (self->format > 0)
617 params.format = self->format;
618 outputs[0] = ccv_nnc_tensor_symbol_alias_new(graph, inputs[0], self->ofs, stride, params, 0);
619 } else {
620 // Otherwise, we need to check if it is permute. For permute, we cannot do alias directly.
621 // We need to first materialize the permute and then run reshape on top of it, otherwise it will be wrong.
622 int old_stride[CCV_NNC_MAX_DIM_ALLOC(12)];
623 ccv_nnc_tensor_symbol_alias_params(graph, inputs[0], 0, old_stride);
624 // We identify permute by checking if the stride is not in descending order.
625 // This also covered "permute" through reshape, rather than using ccv_cnnp_permute directly.
626 const int nd = ccv_nnc_tensor_nd(params.dim);
627 const int new_nd = ccv_nnc_tensor_nd(dim);
628 int i, no_permute = 1;
629 // If the new dim has different nd, or we actually have a stride, we need to check if it is no permute or not.
630 if (new_nd != nd || (self->stride[0] != 0 && memcmp(self->stride, old_stride, sizeof(self->stride))))
631 for (i = 1; no_permute && i < nd; i++)
632 if (old_stride[i - 1] < old_stride[i])
633 no_permute = 0;
634 if (no_permute)
635 { // Just straightforward reshape if there is no no permute.
636 memcpy(params.dim, dim, sizeof(params.dim));
637 int* stride;
638 if (self->stride[0] == 0)
639 {
640 if (new_nd != nd) // Cannot use old stride.
641 {
642 ccv_nnc_tensor_get_stride(dim, stride_from_dim);
643 stride = stride_from_dim;
644 } else
645 stride = old_stride;
646 } else
647 stride = self->stride;
648 if (self->format > 0)
649 params.format = self->format;
650 outputs[0] = ccv_nnc_tensor_symbol_alias_new(graph, inputs[0], self->ofs, stride, params, 0);
651 } else {
652 // Otherwise, we first do format transform to plain tensor and then do reshape.
653 ccv_nnc_tensor_symbol_t permuted = ccv_nnc_tensor_symbol_new(graph, params, 0);
654 ccv_nnc_graph_exec_symbol_new(graph, CMD_FORMAT_TRANSFORM_FORWARD()ccv_nnc_cmd(CCV_NNC_FORMAT_TRANSFORM_FORWARD, 0, ccv_nnc_cmd_auto
, 0)
, TENSOR_SYMBOL_LIST(inputs[0])(const ccv_nnc_tensor_symbol_t []){inputs[0]}, (1 +1 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(permuted)(const ccv_nnc_tensor_symbol_t []){permuted}, (1 +1 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, "reshape");
655 memcpy(params.dim, dim, sizeof(params.dim));
656 int* stride;
657 if (self->stride[0] == 0)
658 {
659 ccv_nnc_tensor_get_stride(dim, stride_from_dim);
660 stride = stride_from_dim;
661 } else
662 stride = self->stride;
663 if (self->format > 0)
664 params.format = self->format;
665 // And then we create alias against the permuted one.
666 outputs[0] = ccv_nnc_tensor_symbol_alias_new(graph, permuted, self->ofs, stride, params, 0);
667 }
668 }
669}
670
671static ccv_cnnp_model_t* _ccv_cnnp_reshape_copy(const ccv_cnnp_model_t* const super, void* const context);
672
673static const ccv_cnnp_model_vtab_t ccv_cnnp_reshape_isa = {
674 .build = _ccv_cnnp_reshape_build,
675 .copy = _ccv_cnnp_reshape_copy,
676};
677
678ccv_cnnp_model_t* ccv_cnnp_reshape(const int format, const int dim[CCV_NNC_MAX_DIM_ALLOC(12)], const int ofs[CCV_NNC_MAX_DIM_ALLOC(12)], const int stride[CCV_NNC_MAX_DIM_ALLOC(12)], const char* const name)
679{
680 ccv_cnnp_model_reshape_t* const model_reshape = (ccv_cnnp_model_reshape_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_reshape_t));
681 model_reshape->super.isa = &ccv_cnnp_reshape_isa;
682 model_reshape->super.input_size = 1;
683 model_reshape->super.outputs = &model_reshape->output;
684 model_reshape->super.output_size = 1;
685 ccv_cnnp_model_copy_name(&model_reshape->super, name);
686 model_reshape->format = format;
687 memcpy(model_reshape->dim, dim, sizeof(model_reshape->dim));
688 memcpy(model_reshape->ofs, ofs, sizeof(model_reshape->ofs));
689 if (stride[0] != 0)
690 memcpy(model_reshape->stride, stride, sizeof(model_reshape->stride));
691 return (ccv_cnnp_model_t*)model_reshape;
692}
693
694static ccv_cnnp_model_t* _ccv_cnnp_reshape_copy(const ccv_cnnp_model_t* const super, void* const context)
695{
696 const ccv_cnnp_model_reshape_t* const self = (const ccv_cnnp_model_reshape_t*)super;
697 return ccv_cnnp_reshape(self->format, self->dim, self->ofs, self->stride, self->super.name);
698}
699
700typedef struct {
701 ccv_cnnp_model_t super;
702 ccv_nnc_tensor_symbol_t output;
703 int type;
704 int begin[CCV_NNC_MAX_DIM_ALLOC(12)];
705 int end[CCV_NNC_MAX_DIM_ALLOC(12)];
706} ccv_cnnp_model_pad_t;
707
708static void _ccv_cnnp_pad_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
709{
710 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 710, __extension__ __PRETTY_FUNCTION__); }))
;
711 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 711, __extension__ __PRETTY_FUNCTION__
); }))
;
712 ccv_cnnp_model_pad_t* const self = (ccv_cnnp_model_pad_t*)super;
713 PRINT(CCV_CLI_VERBOSE, "[cnnp_pad_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_pad_build] -\n"); fflush(stdout); } } while (
0)
;
714 const ccv_nnc_tensor_param_t input_params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
715 const int nd = ccv_nnc_tensor_nd(input_params.dim);
716 ccv_nnc_tensor_param_t params = input_params;
717 int i;
718 for (i = 0 ; i < nd; i++)
719 params.dim[i] += self->begin[i] + self->end[i];
720 const ccv_nnc_tensor_symbol_t padded = ccv_nnc_tensor_symbol_new(graph, params, 0);
721 ccv_nnc_cmd_t pad = CMD_PAD_FORWARD(self->type, (), ())ccv_nnc_cmd(CCV_NNC_PAD_FORWARD, 0, ((ccv_nnc_cmd_param_t){.size
={.dim={}},.pad={.type=self->type,.end={}}}), 0)
;
722 memcpy(pad.info.size.dim, self->begin, sizeof(pad.info.size.dim));
723 memcpy(pad.info.pad.end, self->end, sizeof(pad.info.pad.end));
724 ccv_nnc_graph_exec_symbol_new(graph, pad, TENSOR_SYMBOL_LIST(inputs[0])(const ccv_nnc_tensor_symbol_t []){inputs[0]}, (1 +1 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(padded)(const ccv_nnc_tensor_symbol_t []){padded}, (1 +1 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, "pad");
725 outputs[0] = padded;
726}
727
728static ccv_cnnp_model_t* _ccv_cnnp_pad_copy(const ccv_cnnp_model_t* const super, void* const context);
729
730static const ccv_cnnp_model_vtab_t ccv_cnnp_pad_isa = {
731 .build = _ccv_cnnp_pad_build,
732 .copy = _ccv_cnnp_pad_copy,
733};
734
735ccv_cnnp_model_t* ccv_cnnp_pad(const int type, const int begin[CCV_NNC_MAX_DIM_ALLOC(12)], const int end[CCV_NNC_MAX_DIM_ALLOC(12)], const char* const name)
736{
737 ccv_cnnp_model_pad_t* const model_pad = (ccv_cnnp_model_pad_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_pad_t));
738 model_pad->super.isa = &ccv_cnnp_pad_isa;
739 model_pad->super.input_size = 1;
740 model_pad->super.outputs = &model_pad->output;
741 model_pad->super.output_size = 1;
742 ccv_cnnp_model_copy_name(&model_pad->super, name);
743 model_pad->type = type;
744 memcpy(model_pad->begin, begin, sizeof(model_pad->begin));
745 memcpy(model_pad->end, end, sizeof(model_pad->end));
746 return (ccv_cnnp_model_t*)model_pad;
747}
748
749static ccv_cnnp_model_t* _ccv_cnnp_pad_copy(const ccv_cnnp_model_t* const super, void* const context)
750{
751 const ccv_cnnp_model_pad_t* const self = (const ccv_cnnp_model_pad_t*)super;
752 return ccv_cnnp_pad(self->type, self->begin, self->end, self->super.name);
753}
754
755typedef struct {
756 ccv_cnnp_model_t super;
757 ccv_nnc_tensor_symbol_t output;
758} ccv_cnnp_model_identity_t;
759
760static void _ccv_cnnp_identity_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
761{
762 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 762, __extension__ __PRETTY_FUNCTION__); }))
;
763 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 763, __extension__ __PRETTY_FUNCTION__
); }))
;
764 PRINT(CCV_CLI_VERBOSE, "[cnnp_identity_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_identity_build] -\n"); fflush(stdout); } } while
(0)
;
765 outputs[0] = inputs[0];
766}
767
768static ccv_cnnp_model_t* _ccv_cnnp_identity_copy(const ccv_cnnp_model_t* const super, void* const context);
769
770static const ccv_cnnp_model_vtab_t ccv_cnnp_identity_isa = {
771 .build = _ccv_cnnp_identity_build,
772 .copy = _ccv_cnnp_identity_copy,
773};
774
775ccv_cnnp_model_t* ccv_cnnp_identity(const char* const name)
776{
777 ccv_cnnp_model_identity_t* const model_identity = (ccv_cnnp_model_identity_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_identity_t));
778 model_identity->super.isa = &ccv_cnnp_identity_isa;
779 model_identity->super.input_size = 1;
780 model_identity->super.outputs = &model_identity->output;
781 model_identity->super.output_size = 1;
782 ccv_cnnp_model_copy_name(&model_identity->super, name);
783 return (ccv_cnnp_model_t*)model_identity;
784}
785
786static ccv_cnnp_model_t* _ccv_cnnp_identity_copy(const ccv_cnnp_model_t* const super, void* const context)
787{
788 const ccv_cnnp_model_identity_t* const self = (const ccv_cnnp_model_identity_t*)super;
789 return ccv_cnnp_identity(self->super.name);
790}
791
792typedef struct {
793 ccv_cnnp_model_t super;
794 ccv_nnc_tensor_symbol_t output;
795 int index[CCV_NNC_MAX_DIM_ALLOC(12)];
796} ccv_cnnp_model_permute_t;
797
798static void _ccv_cnnp_permute_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
799{
800 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 800, __extension__ __PRETTY_FUNCTION__); }))
;
801 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 801, __extension__ __PRETTY_FUNCTION__
); }))
;
802 ccv_cnnp_model_permute_t* const self = (ccv_cnnp_model_permute_t*)super;
803 PRINT(CCV_CLI_VERBOSE, "[cnnp_permute_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_permute_build] -\n"); fflush(stdout); } } while
(0)
;
804 ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
805 ccv_nnc_tensor_symbol_t to = ccv_nnc_tensor_symbol_alias_to(graph, inputs[0]);
806 const int nd = ccv_nnc_tensor_nd(params.dim);
807 int input_dim[CCV_NNC_MAX_DIM_ALLOC(12)];
808 memcpy(input_dim, params.dim, sizeof(params.dim));
809 int input_stride[CCV_NNC_MAX_DIM_ALLOC(12)] = {};
810 int output_stride[CCV_NNC_MAX_DIM_ALLOC(12)] = {};
811 if (to.d == CCV_NNC_NO_TENSOR_SYMBOL) // If it is not an alias. Find stride and permute.
812 {
813 ccv_nnc_tensor_get_stride(input_dim, input_stride);
814 int i;
815 for (i = 0; i < nd; i++)
816 {
817 const int idx = self->index[i];
818 assert(idx >= 0 && idx < nd)((void) sizeof ((idx >= 0 && idx < nd) ? 1 : 0)
, __extension__ ({ if (idx >= 0 && idx < nd) ; else
__assert_fail ("idx >= 0 && idx < nd", "ccv_cnnp_model_addons.c"
, 818, __extension__ __PRETTY_FUNCTION__); }))
;
819 params.dim[i] = input_dim[idx];
820 output_stride[i] = input_stride[idx];
821 }
822 outputs[0] = ccv_nnc_tensor_symbol_alias_new(graph, inputs[0], ccv_nnc_no_ofs, output_stride, params, 0);
823 } else {
824 // if it is an alias, we can get the stride from it and use that.
825 int input_ofs[CCV_NNC_MAX_DIM_ALLOC(12)];
826 ccv_nnc_tensor_symbol_alias_params(graph, inputs[0], input_ofs, input_stride);
827 assert(input_stride[0] != 0)((void) sizeof ((input_stride[0] != 0) ? 1 : 0), __extension__
({ if (input_stride[0] != 0) ; else __assert_fail ("input_stride[0] != 0"
, "ccv_cnnp_model_addons.c", 827, __extension__ __PRETTY_FUNCTION__
); }))
;
828 int output_ofs[CCV_NNC_MAX_DIM_ALLOC(12)] = {};
829 int i;
830 for (i = 0; i < nd; i++)
831 {
832 const int idx = self->index[i];
833 assert(idx >= 0 && idx < nd)((void) sizeof ((idx >= 0 && idx < nd) ? 1 : 0)
, __extension__ ({ if (idx >= 0 && idx < nd) ; else
__assert_fail ("idx >= 0 && idx < nd", "ccv_cnnp_model_addons.c"
, 833, __extension__ __PRETTY_FUNCTION__); }))
;
834 params.dim[i] = input_dim[idx];
835 output_stride[i] = input_stride[idx];
836 output_ofs[i] = input_ofs[idx];
837 }
838 outputs[0] = ccv_nnc_tensor_symbol_alias_new(graph, inputs[0], output_ofs, output_stride, params, 0);
839 }
840}
841
842static ccv_cnnp_model_t* _ccv_cnnp_permute_copy(const ccv_cnnp_model_t* const super, void* const context);
843
844static const ccv_cnnp_model_vtab_t ccv_cnnp_permute_isa = {
845 .build = _ccv_cnnp_permute_build,
846 .copy = _ccv_cnnp_permute_copy,
847};
848
849ccv_cnnp_model_t* ccv_cnnp_permute(const int index[CCV_NNC_MAX_DIM_ALLOC(12)], const char* const name)
850{
851 ccv_cnnp_model_permute_t* const model_permute = (ccv_cnnp_model_permute_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_permute_t));
852 model_permute->super.isa = &ccv_cnnp_permute_isa;
853 model_permute->super.input_size = 1;
854 model_permute->super.outputs = &model_permute->output;
855 model_permute->super.output_size = 1;
856 ccv_cnnp_model_copy_name(&model_permute->super, name);
857 memcpy(model_permute->index, index, sizeof(model_permute->index));
858 return (ccv_cnnp_model_t*)model_permute;
859}
860
861static ccv_cnnp_model_t* _ccv_cnnp_permute_copy(const ccv_cnnp_model_t* const super, void* const context)
862{
863 const ccv_cnnp_model_permute_t* const self = (const ccv_cnnp_model_permute_t*)super;
864 return ccv_cnnp_permute(self->index, self->super.name);
865}
866
867typedef struct {
868 ccv_cnnp_model_t super;
869 int index;
870 ccv_nnc_tensor_symbol_t output;
871} ccv_cnnp_model_extract_t;
872
873static void _ccv_cnnp_extract_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
874{
875 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 875, __extension__ __PRETTY_FUNCTION__
); }))
;
876 ccv_cnnp_model_extract_t* const self = (ccv_cnnp_model_extract_t*)super;
877 PRINT(CCV_CLI_VERBOSE, "[cnnp_extract_build] index: %d\n", self->index)do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_extract_build] index: %d\n", self->index)
; fflush(stdout); } } while (0)
;
878 outputs[0] = inputs[self->index];
879}
880
881static ccv_cnnp_model_t* _ccv_cnnp_extract_copy(const ccv_cnnp_model_t* const self, void* const context);
882
883static const ccv_cnnp_model_vtab_t ccv_cnnp_extract_isa = {
884 .build = _ccv_cnnp_extract_build,
885 .copy = _ccv_cnnp_extract_copy,
886};
887
888ccv_cnnp_model_t* ccv_cnnp_extract(const int index, const char* const name)
889{
890 ccv_cnnp_model_extract_t* const model_extract = (ccv_cnnp_model_extract_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_extract_t));
891 model_extract->index = index;
892 model_extract->super.isa = &ccv_cnnp_extract_isa;
893 model_extract->super.input_size = 0;
894 model_extract->super.outputs = &model_extract->output;
895 model_extract->super.output_size = 1;
896 ccv_cnnp_model_copy_name(&model_extract->super, name);
897 return (ccv_cnnp_model_t*)model_extract;
898}
899
900static ccv_cnnp_model_t* _ccv_cnnp_extract_copy(const ccv_cnnp_model_t* const super, void* const context)
901{
902 ccv_cnnp_model_extract_t* const self = (ccv_cnnp_model_extract_t*)super;
903 return ccv_cnnp_extract(self->index, self->super.name);
904}
905
906typedef struct {
907 ccv_cnnp_model_t super;
908 ccv_nnc_tensor_symbol_t output;
909} ccv_cnnp_model_flatten_t;
910
911static void _ccv_cnnp_flatten_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
912{
913 PRINT(CCV_CLI_VERBOSE, "[cnnp_flatten_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_flatten_build] -\n"); fflush(stdout); } } while
(0)
;
914 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 914, __extension__ __PRETTY_FUNCTION__); }))
;
915 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 915, __extension__ __PRETTY_FUNCTION__
); }))
;
916 const ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
917 ccv_nnc_tensor_param_t output_params = params;
918 memset(output_params.dim, 0, sizeof(output_params.dim));
919 output_params.dim[0] = ccv_nnc_tensor_get_n(params);
920 assert(output_params.dim[0] > 0)((void) sizeof ((output_params.dim[0] > 0) ? 1 : 0), __extension__
({ if (output_params.dim[0] > 0) ; else __assert_fail ("output_params.dim[0] > 0"
, "ccv_cnnp_model_addons.c", 920, __extension__ __PRETTY_FUNCTION__
); }))
;
921 output_params.dim[1] = ccv_nnc_tensor_count(params) / output_params.dim[0];
922 int stride[CCV_NNC_MAX_DIM_ALLOC(12)] = {};
923 ccv_nnc_tensor_get_stride(output_params.dim, stride);
924 outputs[0] = ccv_nnc_tensor_symbol_alias_new(graph, inputs[0], DIM_ALLOC()(int [(12)]){}, stride, output_params, 0);
925}
926
927static ccv_cnnp_model_t* _ccv_cnnp_flatten_copy(const ccv_cnnp_model_t* const self, void* const context);
928
929static const ccv_cnnp_model_vtab_t ccv_cnnp_flatten_isa = {
930 .build = _ccv_cnnp_flatten_build,
931 .copy = _ccv_cnnp_flatten_copy,
932};
933
934ccv_cnnp_model_t* ccv_cnnp_flatten(const char* const name)
935{
936 ccv_cnnp_model_flatten_t* const model_flatten = (ccv_cnnp_model_flatten_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_flatten_t));
937 model_flatten->super.isa = &ccv_cnnp_flatten_isa;
938 model_flatten->super.input_size = 1;
939 model_flatten->super.outputs = &model_flatten->output;
940 model_flatten->super.output_size = 1;
941 ccv_cnnp_model_copy_name(&model_flatten->super, name);
942 return (ccv_cnnp_model_t*)model_flatten;
943}
944
945static ccv_cnnp_model_t* _ccv_cnnp_flatten_copy(const ccv_cnnp_model_t* const self, void* const context)
946{
947 return ccv_cnnp_flatten(self->name);
948}
949
950// MARK - Batch Norm Layer
951
952typedef struct {
953 ccv_cnnp_model_t super;
954 ccv_nnc_tensor_symbol_t output;
955 ccv_nnc_tensor_symbol_t bias;
956 ccv_nnc_tensor_symbol_t scale;
957 ccv_nnc_graph_exec_symbol_t batch_norm;
958 ccv_nnc_cmd_param_t params;
959 ccv_array_t* zero_inits;
960 ccv_array_t* retainables;
961} ccv_cnnp_model_batch_norm_t;
962
963static void _ccv_cnnp_batch_norm_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
964{
965 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 965, __extension__ __PRETTY_FUNCTION__); }))
;
966 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 966, __extension__ __PRETTY_FUNCTION__
); }))
;
967 ccv_cnnp_model_batch_norm_t* const self = (ccv_cnnp_model_batch_norm_t*)super;
968 PRINT(CCV_CLI_VERBOSE, "[cnnp_batch_norm_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_batch_norm_build] -\n"); fflush(stdout); } }
while (0)
;
969 const ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
970 const int nd = ccv_nnc_tensor_nd(params.dim);
971 ccv_nnc_tensor_param_t bias_params = params;
972 memset(bias_params.dim, 0, sizeof(bias_params.dim));
973 // If the accuracy is not enough, bump it to 32-bit floating point.
974 if (bias_params.datatype != CCV_32F && bias_params.datatype != CCV_64F)
975 bias_params.datatype = CCV_32F;
976 bias_params.dim[0] = nd > 1 ? ccv_nnc_tensor_get_c(params) : params.dim[0];
977 const ccv_nnc_tensor_symbol_t output = ccv_nnc_tensor_symbol_new(graph, params, 0);
978 // Both scale and bias are shared between if this model is reused.
979 if (!self->scale.graph)
980 self->scale = ccv_nnc_tensor_symbol_new(graph, bias_params, "scale");
981 if (!self->bias.graph)
982 self->bias = ccv_nnc_tensor_symbol_new(graph, bias_params, "bias");
983 const ccv_nnc_tensor_symbol_t scale = ccv_cnnp_model_get_symbol(super, self->scale);
984 const ccv_nnc_tensor_symbol_t bias = ccv_cnnp_model_get_symbol(super, self->bias);
985 const ccv_nnc_tensor_symbol_t mean = ccv_nnc_tensor_symbol_new(graph, bias_params, "mean");
986 const ccv_nnc_tensor_symbol_t var = ccv_nnc_tensor_symbol_new(graph, bias_params, "var");
987 // Otherwise, notice mean, var, saved_mean, saved_inv_std are not reused.
988 if (!self->zero_inits)
989 self->zero_inits = ccv_array_new(sizeof(ccv_nnc_tensor_symbol_t), 0, 0);
990 ccv_array_push(self->zero_inits, &mean);
991 ccv_array_push(self->zero_inits, &var);
992 const ccv_nnc_tensor_symbol_t out_mean = ccv_nnc_tensor_symbol_new(graph, bias_params, "out_mean");
993 const ccv_nnc_tensor_symbol_t out_var = ccv_nnc_tensor_symbol_new(graph, bias_params, "out_var");
994 if (!self->retainables)
995 self->retainables = ccv_array_new(sizeof(ccv_nnc_tensor_symbol_t), 0, 0);
996 ccv_array_push(self->retainables, &out_mean);
997 ccv_array_push(self->retainables, &out_var);
998 const ccv_nnc_tensor_symbol_t saved_mean = ccv_nnc_tensor_symbol_new(graph, bias_params, "saved_mean");
999 const ccv_nnc_tensor_symbol_t saved_inv_std = ccv_nnc_tensor_symbol_new(graph, bias_params, "saved_inv_std");
1000 const int hw = ccv_nnc_tensor_hw(params, ccv_nnc_tensor_nd(params.dim), CCV_NNC_MAX_DIM(2));
1001 ccv_nnc_cmd_param_t batch_norm = self->params;
1002 batch_norm.bnorm.count = hw >= 0 ? CCV_NNC_MAX_DIM(2) + 1 : 1;
1003 int i;
1004 batch_norm.bnorm.axis[0] = (params.format == CCV_TENSOR_FORMAT_CHWN) ? 3 : 0;
1005 if (hw >= 0)
1006 for (i = 0; i < CCV_NNC_MAX_DIM(2); i++)
1007 batch_norm.bnorm.axis[i + 1] = i + hw;
1008 self->params = batch_norm;
1009 self->batch_norm = ccv_nnc_graph_exec_symbol_new(graph, ccv_nnc_cmd(CCV_NNC_BATCH_NORM_FORWARD, 0, batch_norm, 0), TENSOR_SYMBOL_LIST(inputs[0], scale, bias, mean, var)(const ccv_nnc_tensor_symbol_t []){inputs[0], scale, bias, mean
, var}, (1 +1 +1 +1 +1 +1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(output, out_mean, out_var, saved_mean, saved_inv_std)(const ccv_nnc_tensor_symbol_t []){output, out_mean, out_var,
saved_mean, saved_inv_std}, (1 +1 +1 +1 +1 +1 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, "batch_norm");
1010 outputs[0] = output;
1011}
1012
1013static void _ccv_cnnp_batch_norm_init_states(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_cnnp_state_initializer_f initializer, void* const context)
1014{
1015 ccv_cnnp_model_batch_norm_t* const self = (ccv_cnnp_model_batch_norm_t*)super;
1016 if (self->scale.graph)
1017 initializer(context, CMD_RANDOM_UNIFORM_FORWARD(0, 1)ccv_nnc_cmd(CCV_NNC_RANDOM_UNIFORM_FORWARD, 0, (ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.blas={.a={0, 1}}}, 0)
, ccv_nnc_no_hint, 0, 0, self->scale);
1018 if (self->bias.graph)
1019 initializer(context, CMD_SET_FORWARD(0)ccv_nnc_cmd(CCV_NNC_SET_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={0,}}}, 0)
, ccv_nnc_no_hint, 0, 0, self->bias);
1020 int i;
1021 if (self->zero_inits)
1022 for (i = 0; i < self->zero_inits->rnum; i++)
1023 initializer(context, CMD_SET_FORWARD(0)ccv_nnc_cmd(CCV_NNC_SET_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={0,}}}, 0)
, ccv_nnc_no_hint, 0, 0, *(ccv_nnc_tensor_symbol_t*)ccv_array_get(self->zero_inits, i)((void*)(((char*)((self->zero_inits)->data)) + (size_t)
(self->zero_inits)->rsize * (size_t)(i)))
);
1024}
1025
1026static void _ccv_cnnp_batch_norm_add_to_parameter(ccv_cnnp_model_t* const super, const ccv_cnnp_add_to_array_f add_to_array, void* const parameters, const int is_trainable)
1027{
1028 ccv_cnnp_model_batch_norm_t* const self = (ccv_cnnp_model_batch_norm_t*)super;
1029 if (self->scale.graph)
1030 add_to_array(parameters, self->scale, is_trainable);
1031 if (self->bias.graph)
1032 add_to_array(parameters, self->bias, is_trainable);
1033}
1034
1035static void _ccv_cnnp_batch_norm_add_to_output(ccv_cnnp_model_t* const super, const ccv_cnnp_add_to_array_f add_to_array, void* const outputs)
1036{
1037 ccv_cnnp_model_batch_norm_t* const self = (ccv_cnnp_model_batch_norm_t*)super;
1038 int i;
1039 if (self->retainables)
1040 for (i = 0; i < self->retainables->rnum; i++)
1041 {
1042 const ccv_nnc_tensor_symbol_t symbol = *(ccv_nnc_tensor_symbol_t*)ccv_array_get(self->retainables, i)((void*)(((char*)((self->retainables)->data)) + (size_t
)(self->retainables)->rsize * (size_t)(i)))
;
1043 add_to_array(outputs, symbol, 0);
1044 }
1045}
1046
1047static void _ccv_cnnp_batch_norm_set_is_test(ccv_cnnp_model_t* const super, const int is_test, const ccv_cnnp_cmd_updater_f updater, void* const context)
1048{
1049 ccv_cnnp_model_batch_norm_t* const self = (ccv_cnnp_model_batch_norm_t*)super;
1050 if (self->batch_norm.graph)
1051 {
1052 self->params.bnorm.is_test = is_test;
1053 updater(context, self->batch_norm, ccv_nnc_cmd(CCV_NNC_BATCH_NORM_FORWARD, 0, self->params, 0), ccv_nnc_no_hint);
1054 }
1055}
1056
1057static void _ccv_cnnp_batch_norm_deinit(ccv_cnnp_model_t* const super)
1058{
1059 ccv_cnnp_model_batch_norm_t* const self = (ccv_cnnp_model_batch_norm_t*)super;
1060 if (self->zero_inits)
1061 ccv_array_free(self->zero_inits);
1062 if (self->retainables)
1063 ccv_array_free(self->retainables);
1064}
1065
1066static ccv_cnnp_model_t* _ccv_cnnp_batch_norm_copy(const ccv_cnnp_model_t* const super, void* const context);
1067
1068static const ccv_cnnp_model_vtab_t ccv_cnnp_batch_norm_isa = {
1069 .build = _ccv_cnnp_batch_norm_build,
1070 .init_states = _ccv_cnnp_batch_norm_init_states,
1071 .add_to_parameter = _ccv_cnnp_batch_norm_add_to_parameter,
1072 .add_to_output = _ccv_cnnp_batch_norm_add_to_output,
1073 .copy = _ccv_cnnp_batch_norm_copy,
1074 .set_is_test = _ccv_cnnp_batch_norm_set_is_test,
1075 .deinit = _ccv_cnnp_batch_norm_deinit,
1076};
1077
1078ccv_cnnp_model_t* ccv_cnnp_batch_norm(const float momentum, const float epsilon, const int is_trainable, const char* const name)
1079{
1080 ccv_cnnp_model_batch_norm_t* const model_batch_norm = (ccv_cnnp_model_batch_norm_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_batch_norm_t));
1081 model_batch_norm->super.isa = &ccv_cnnp_batch_norm_isa;
1082 model_batch_norm->super.input_size = 1;
1083 model_batch_norm->super.outputs = &model_batch_norm->output;
1084 model_batch_norm->super.output_size = 1;
1085 model_batch_norm->super.is_trainable = is_trainable;
1086 ccv_cnnp_model_copy_name(&model_batch_norm->super, name);
1087 model_batch_norm->scale.d = CCV_NNC_NO_TENSOR_SYMBOL;
1088 model_batch_norm->scale.graph = 0;
1089 model_batch_norm->bias.d = CCV_NNC_NO_TENSOR_SYMBOL;
1090 model_batch_norm->bias.graph = 0;
1091 model_batch_norm->params.bnorm.momentum = momentum;
1092 model_batch_norm->params.bnorm.epsilon = epsilon;
1093 return (ccv_cnnp_model_t*)model_batch_norm;
1094}
1095
1096static ccv_cnnp_model_t* _ccv_cnnp_batch_norm_copy(const ccv_cnnp_model_t* const super, void* const context)
1097{
1098 const ccv_cnnp_model_batch_norm_t* const self = (const ccv_cnnp_model_batch_norm_t*)super;
1099 return ccv_cnnp_batch_norm(self->params.bnorm.momentum, self->params.bnorm.epsilon, self->super.is_trainable, self->super.name);
1100}
1101
1102// MARK - Convolution Layer
1103
1104typedef struct {
1105 ccv_cnnp_model_t super;
1106 ccv_nnc_tensor_symbol_t output;
1107 ccv_nnc_tensor_symbol_t weights;
1108 ccv_nnc_tensor_symbol_t bias;
1109 int groups;
1110 int filters;
1111 int kdim[CCV_NNC_MAX_DIM_ALLOC(12)];
1112 int dilation[CCV_NNC_MAX_DIM_ALLOC(12)];
1113 int no_bias;
1114 int format;
1115 ccv_nnc_hint_t hint;
1116} ccv_cnnp_model_convolution_t;
1117
1118static void _ccv_cnnp_convolution_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
1119{
1120 ccv_cnnp_model_convolution_t* const self = (ccv_cnnp_model_convolution_t*)super;
1121 PRINT(CCV_CLI_VERBOSE, "[cnnp_convolution_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_convolution_build] -\n"); fflush(stdout); } }
while (0)
;
1
Assuming the condition is false
2
Taking false branch
3
Loop condition is false. Exiting loop
1122 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 1122, __extension__ __PRETTY_FUNCTION__); }))
;
4
Assuming 'input_size' is equal to 1
5
Taking true branch
1123 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 1123, __extension__ __PRETTY_FUNCTION__
); }))
;
6
Assuming 'output_size' is equal to 1
7
Taking true branch
1124 const ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
1125 int i;
1126 const int k_nd = ccv_nnc_tensor_nd(self->kdim);
1127 const int nd = k_nd + 2;
1128 ccv_nnc_tensor_param_t weights_params = params;
1129 if (self->format)
8
Assuming field 'format' is 0
9
Taking false branch
1130 weights_params.format = self->format;
1131 ccv_nnc_tensor_set_n(&weights_params, self->filters);
1132 const int a_nd = ccv_nnc_tensor_nd(params.dim);
1133 int c;
10
'c' declared without an initial value
1134 switch (params.format)
11
'Default' branch taken. Execution continues on line 1149
1135 {
1136 case CCV_TENSOR_FORMAT_NHWC:
1137 c = params.dim[a_nd - 1];
1138 break;
1139 case CCV_TENSOR_FORMAT_NCHW:
1140 if (a_nd == k_nd + 1)
1141 c = params.dim[0];
1142 else
1143 c = params.dim[a_nd <= 1 ? 0 : 1];
1144 break;
1145 case CCV_TENSOR_FORMAT_CHWN:
1146 c = params.dim[0];
1147 break;
1148 }
1149 assert(c % self->groups == 0)((void) sizeof ((c % self->groups == 0) ? 1 : 0), __extension__
({ if (c % self->groups == 0) ; else __assert_fail ("c % self->groups == 0"
, "ccv_cnnp_model_addons.c", 1149, __extension__ __PRETTY_FUNCTION__
); }))
;
12
The left operand of '%' is a garbage value
1150 ccv_nnc_tensor_set_c(&weights_params, nd, c / self->groups);
1151 int hw = -1;
1152 if (weights_params.format == CCV_TENSOR_FORMAT_NHWC || weights_params.format == CCV_TENSOR_FORMAT_CHWN)
1153 hw = 1;
1154 else if (weights_params.format == CCV_TENSOR_FORMAT_NCHW)
1155 hw = 2;
1156 assert(hw >= 0)((void) sizeof ((hw >= 0) ? 1 : 0), __extension__ ({ if (hw
>= 0) ; else __assert_fail ("hw >= 0", "ccv_cnnp_model_addons.c"
, 1156, __extension__ __PRETTY_FUNCTION__); }))
;
1157 for (i = 0; i < k_nd; i++)
1158 weights_params.dim[i + hw] = self->kdim[i];
1159 if (!self->weights.graph)
1160 self->weights = ccv_nnc_tensor_symbol_new(graph, weights_params, "weights");
1161 assert(self->weights.graph == graph)((void) sizeof ((self->weights.graph == graph) ? 1 : 0), __extension__
({ if (self->weights.graph == graph) ; else __assert_fail
("self->weights.graph == graph", "ccv_cnnp_model_addons.c"
, 1161, __extension__ __PRETTY_FUNCTION__); }))
;
1162 const ccv_nnc_tensor_symbol_t weights = ccv_cnnp_model_get_symbol(super, self->weights);
1163 ccv_nnc_tensor_param_t bias_params = params;
1164 if (self->format)
1165 bias_params.format = self->format;
1166 memset(bias_params.dim, 0, sizeof(bias_params.dim));
1167 bias_params.dim[0] = self->filters;
1168 ccv_nnc_cmd_t cmd = CMD_CONVOLUTION_FORWARD(self->groups, self->filters)ccv_nnc_cmd(CCV_NNC_CONVOLUTION_FORWARD, 0, ((ccv_nnc_cmd_param_t
){.size={.dim={}},.convolution={.count=self->filters,.groups
=self->groups}}), 0)
;
1169 for (i = 0; i < k_nd; i++)
1170 cmd.info.size.dim[i] = self->kdim[i];
1171 cmd.info.size.dim[k_nd] = c;
1172 memcpy(cmd.info.convolution.dilation, self->dilation, sizeof(self->dilation));
1173 ccv_nnc_tensor_param_t output_params;
1174 // Dilate weight size based on the dilation factor.
1175 for (i = 0; i < k_nd; i++)
1176 weights_params.dim[i + hw] = (self->kdim[i] - 1) * ccv_max(self->dilation[i], 1)({ typeof (self->dilation[i]) _a = (self->dilation[i]);
typeof (1) _b = (1); (_a > _b) ? _a : _b; })
+ 1;
1177 ccv_nnc_hint_tensor_auto(cmd, (ccv_nnc_tensor_param_t []){
1178 params,
1179 weights_params,
1180 bias_params,
1181 }, 3, self->hint, &output_params, 1);
1182 const ccv_nnc_tensor_symbol_t output = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
1183 ccv_nnc_graph_exec_symbol_t convolution;
1184 if (self->no_bias)
1185 convolution = ccv_nnc_graph_exec_symbol_new(graph, cmd, TENSOR_SYMBOL_LIST(inputs[0], weights)(const ccv_nnc_tensor_symbol_t []){inputs[0], weights}, (1 +1
+1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 -1)
, TENSOR_SYMBOL_LIST(output)(const ccv_nnc_tensor_symbol_t []){output}, (1 +1 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, "convolution");
1186 else {
1187 if (!self->bias.graph)
1188 self->bias = ccv_nnc_tensor_symbol_new(graph, bias_params, "bias");
1189 const ccv_nnc_tensor_symbol_t bias = ccv_cnnp_model_get_symbol(super, self->bias);
1190 convolution = ccv_nnc_graph_exec_symbol_new(graph, cmd, TENSOR_SYMBOL_LIST(inputs[0], weights, bias)(const ccv_nnc_tensor_symbol_t []){inputs[0], weights, bias},
(1 +1 +1 +1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(output)(const ccv_nnc_tensor_symbol_t []){output}, (1 +1 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, "convolution");
1191 }
1192 ccv_nnc_graph_exec_symbol_set_hint(graph, convolution, self->hint);
1193 outputs[0] = output;
1194}
1195
1196static void _ccv_cnnp_convolution_init_states(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_cnnp_state_initializer_f initializer, void* const context)
1197{
1198 ccv_cnnp_model_convolution_t* const self = (ccv_cnnp_model_convolution_t*)super;
1199 const ccv_nnc_tensor_param_t weight_params = ccv_nnc_tensor_symbol_params(graph, self->weights);
1200 const int n = ccv_max(ccv_nnc_tensor_get_n(weight_params), 1)({ typeof (ccv_nnc_tensor_get_n(weight_params)) _a = (ccv_nnc_tensor_get_n
(weight_params)); typeof (1) _b = (1); (_a > _b) ? _a : _b
; })
;
1201 const int count = ccv_nnc_tensor_count(weight_params);
1202 const float std = sqrtf(2) / sqrtf(count / n);
1203 const float bound = sqrtf(3) * std;
1204 initializer(context, CMD_RANDOM_UNIFORM_FORWARD(-bound, bound)ccv_nnc_cmd(CCV_NNC_RANDOM_UNIFORM_FORWARD, 0, (ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.blas={.a={-bound, bound}}}, 0)
, ccv_nnc_no_hint, 0, 0, self->weights);
1205 if (self->bias.graph)
1206 initializer(context, CMD_SET_FORWARD(0)ccv_nnc_cmd(CCV_NNC_SET_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={0,}}}, 0)
, ccv_nnc_no_hint, 0, 0, self->bias);
1207}
1208
1209static void _ccv_cnnp_convolution_add_to_parameter(ccv_cnnp_model_t* const super, const ccv_cnnp_add_to_array_f add_to_array, void* const parameters, const int is_trainable)
1210{
1211 ccv_cnnp_model_convolution_t* const self = (ccv_cnnp_model_convolution_t*)super;
1212 add_to_array(parameters, self->weights, is_trainable);
1213 if (self->bias.graph)
1214 add_to_array(parameters, self->bias, is_trainable);
1215}
1216
1217static ccv_cnnp_model_t* _ccv_cnnp_convolution_copy(const ccv_cnnp_model_t* const super, void* const context);
1218
1219static const ccv_cnnp_model_vtab_t ccv_cnnp_convolution_isa = {
1220 .build = _ccv_cnnp_convolution_build,
1221 .init_states = _ccv_cnnp_convolution_init_states,
1222 .add_to_parameter = _ccv_cnnp_convolution_add_to_parameter,
1223 .copy = _ccv_cnnp_convolution_copy,
1224};
1225
1226ccv_cnnp_model_t* ccv_cnnp_convolution(const int groups, const int filters, const int kdim[CCV_NNC_MAX_DIM_ALLOC(12)], const int dilation[CCV_NNC_MAX_DIM_ALLOC(12)], const int no_bias, ccv_nnc_hint_t hint, const int format, const int is_trainable, const char* const name)
1227{
1228 ccv_cnnp_model_convolution_t* const model_convolution = (ccv_cnnp_model_convolution_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_convolution_t));
1229 model_convolution->super.isa = &ccv_cnnp_convolution_isa;
1230 model_convolution->super.input_size = 1;
1231 model_convolution->super.outputs = &model_convolution->output;
1232 model_convolution->super.output_size = 1;
1233 model_convolution->super.is_trainable = is_trainable;
1234 ccv_cnnp_model_copy_name(&model_convolution->super, name);
1235 model_convolution->weights.d = CCV_NNC_NO_TENSOR_SYMBOL;
1236 model_convolution->weights.graph = 0;
1237 model_convolution->bias.d = CCV_NNC_NO_TENSOR_SYMBOL;
1238 model_convolution->bias.graph = 0;
1239 model_convolution->groups = groups;
1240 model_convolution->filters = filters;
1241 memcpy(model_convolution->kdim, kdim, sizeof(model_convolution->kdim));
1242 memcpy(model_convolution->dilation, dilation, sizeof(model_convolution->dilation));
1243 model_convolution->no_bias = no_bias;
1244 model_convolution->hint = hint;
1245 model_convolution->format = format;
1246 return (ccv_cnnp_model_t*)model_convolution;
1247}
1248
1249static ccv_cnnp_model_t* _ccv_cnnp_convolution_copy(const ccv_cnnp_model_t* const super, void* const context)
1250{
1251 ccv_cnnp_model_convolution_t* const self = (ccv_cnnp_model_convolution_t*)super;
1252 return ccv_cnnp_convolution(self->groups, self->filters, self->kdim, self->dilation, self->no_bias, self->hint, self->format, self->super.is_trainable, self->super.name);
1253}
1254
1255// MARK - Convolution Transpose Layer
1256
1257typedef struct {
1258 ccv_cnnp_model_t super;
1259 ccv_nnc_tensor_symbol_t output;
1260 ccv_nnc_tensor_symbol_t weights;
1261 ccv_nnc_tensor_symbol_t bias;
1262 int groups;
1263 int filters;
1264 int kdim[CCV_NNC_MAX_DIM_ALLOC(12)];
1265 int dilation[CCV_NNC_MAX_DIM_ALLOC(12)];
1266 int output_padding;
1267 int no_bias;
1268 int format;
1269 ccv_nnc_hint_t hint;
1270} ccv_cnnp_model_convolution_transpose_t;
1271
1272static void _ccv_cnnp_convolution_transpose_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
1273{
1274 ccv_cnnp_model_convolution_transpose_t* const self = (ccv_cnnp_model_convolution_transpose_t*)super;
1275 PRINT(CCV_CLI_VERBOSE, "[cnnp_convolution_transpose_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_convolution_transpose_build] -\n"); fflush(stdout
); } } while (0)
;
1276 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 1276, __extension__ __PRETTY_FUNCTION__); }))
;
1277 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 1277, __extension__ __PRETTY_FUNCTION__
); }))
;
1278 const ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
1279 int i;
1280 const int nd = CCV_NNC_MAX_DIM(2) + 2;
1281 ccv_nnc_tensor_param_t weights_params = params;
1282 if (self->format)
1283 weights_params.format = self->format;
1284 const int c = ccv_nnc_tensor_get_c(params);
1285 ccv_nnc_tensor_set_n(&weights_params, c);
1286 assert(c % self->groups == 0)((void) sizeof ((c % self->groups == 0) ? 1 : 0), __extension__
({ if (c % self->groups == 0) ; else __assert_fail ("c % self->groups == 0"
, "ccv_cnnp_model_addons.c", 1286, __extension__ __PRETTY_FUNCTION__
); }))
;
1287 ccv_nnc_tensor_set_c(&weights_params, nd, self->filters / self->groups);
1288 const int hw = ccv_nnc_tensor_hw(weights_params, nd, CCV_NNC_MAX_DIM(2));
1289 assert(hw >= 0)((void) sizeof ((hw >= 0) ? 1 : 0), __extension__ ({ if (hw
>= 0) ; else __assert_fail ("hw >= 0", "ccv_cnnp_model_addons.c"
, 1289, __extension__ __PRETTY_FUNCTION__); }))
;
1290 for (i = 0; i < CCV_NNC_MAX_DIM(2); i++)
1291 weights_params.dim[i + hw] = self->kdim[i];
1292 if (!self->weights.graph)
1293 self->weights = ccv_nnc_tensor_symbol_new(graph, weights_params, "weights");
1294 assert(self->weights.graph == graph)((void) sizeof ((self->weights.graph == graph) ? 1 : 0), __extension__
({ if (self->weights.graph == graph) ; else __assert_fail
("self->weights.graph == graph", "ccv_cnnp_model_addons.c"
, 1294, __extension__ __PRETTY_FUNCTION__); }))
;
1295 const ccv_nnc_tensor_symbol_t weights = ccv_cnnp_model_get_symbol(super, self->weights);
1296 ccv_nnc_tensor_param_t bias_params = params;
1297 if (self->format)
1298 bias_params.format = self->format;
1299 memset(bias_params.dim, 0, sizeof(bias_params.dim));
1300 bias_params.dim[0] = self->filters;
1301 ccv_nnc_cmd_t cmd = CMD_CONVOLUTION_TRANSPOSE_FORWARD(self->groups, self->filters, self->output_padding)ccv_nnc_cmd(CCV_NNC_CONVOLUTION_TRANSPOSE_FORWARD, 0, ((ccv_nnc_cmd_param_t
){.size={.dim={}},.convolution_transpose={.count=self->filters
,.groups=self->groups,.output_padding=self->output_padding
}}), 0)
;
1302 for (i = 0; i < CCV_NNC_MAX_DIM(2); i++)
1303 cmd.info.size.dim[i] = self->kdim[i];
1304 cmd.info.size.dim[CCV_NNC_MAX_DIM(2)] = c;
1305 memcpy(cmd.info.convolution_transpose.dilation, self->dilation, sizeof(self->dilation));
1306 ccv_nnc_tensor_param_t output_params;
1307 // Dilate weight size based on the dilation factor.
1308 for (i = 0; i < CCV_NNC_MAX_DIM(2); i++)
1309 weights_params.dim[i + hw] = (self->kdim[i] - 1) * ccv_max(self->dilation[i], 1)({ typeof (self->dilation[i]) _a = (self->dilation[i]);
typeof (1) _b = (1); (_a > _b) ? _a : _b; })
+ 1;
1310 ccv_nnc_hint_tensor_auto(cmd, (ccv_nnc_tensor_param_t []){
1311 params,
1312 weights_params,
1313 bias_params,
1314 }, 3, self->hint, &output_params, 1);
1315 const ccv_nnc_tensor_symbol_t output = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
1316 ccv_nnc_graph_exec_symbol_t convolution_transpose;
1317 if (self->no_bias)
1318 convolution_transpose = ccv_nnc_graph_exec_symbol_new(graph, cmd, TENSOR_SYMBOL_LIST(inputs[0], weights)(const ccv_nnc_tensor_symbol_t []){inputs[0], weights}, (1 +1
+1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 -1)
, TENSOR_SYMBOL_LIST(output)(const ccv_nnc_tensor_symbol_t []){output}, (1 +1 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, "convolution_transpose");
1319 else {
1320 if (!self->bias.graph)
1321 self->bias = ccv_nnc_tensor_symbol_new(graph, bias_params, "bias");
1322 const ccv_nnc_tensor_symbol_t bias = ccv_cnnp_model_get_symbol(super, self->bias);
1323 convolution_transpose = ccv_nnc_graph_exec_symbol_new(graph, cmd, TENSOR_SYMBOL_LIST(inputs[0], weights, bias)(const ccv_nnc_tensor_symbol_t []){inputs[0], weights, bias},
(1 +1 +1 +1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(output)(const ccv_nnc_tensor_symbol_t []){output}, (1 +1 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, "convolution_transpose");
1324 }
1325 ccv_nnc_graph_exec_symbol_set_hint(graph, convolution_transpose, self->hint);
1326 outputs[0] = output;
1327}
1328
1329static void _ccv_cnnp_convolution_transpose_init_states(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_cnnp_state_initializer_f initializer, void* const context)
1330{
1331 ccv_cnnp_model_convolution_transpose_t* const self = (ccv_cnnp_model_convolution_transpose_t*)super;
1332 const ccv_nnc_tensor_param_t weight_params = ccv_nnc_tensor_symbol_params(graph, self->weights);
1333 const int n = ccv_max(ccv_nnc_tensor_get_n(weight_params), 1)({ typeof (ccv_nnc_tensor_get_n(weight_params)) _a = (ccv_nnc_tensor_get_n
(weight_params)); typeof (1) _b = (1); (_a > _b) ? _a : _b
; })
;
1334 const int count = ccv_nnc_tensor_count(weight_params);
1335 const float std = sqrtf(2) / sqrtf(count / n);
1336 const float bound = sqrtf(3) * std;
1337 initializer(context, CMD_RANDOM_UNIFORM_FORWARD(-bound, bound)ccv_nnc_cmd(CCV_NNC_RANDOM_UNIFORM_FORWARD, 0, (ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.blas={.a={-bound, bound}}}, 0)
, ccv_nnc_no_hint, 0, 0, self->weights);
1338 if (self->bias.graph)
1339 initializer(context, CMD_SET_FORWARD(0)ccv_nnc_cmd(CCV_NNC_SET_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={0,}}}, 0)
, ccv_nnc_no_hint, 0, 0, self->bias);
1340}
1341
1342static void _ccv_cnnp_convolution_transpose_add_to_parameter(ccv_cnnp_model_t* const super, const ccv_cnnp_add_to_array_f add_to_array, void* const parameters, const int is_trainable)
1343{
1344 ccv_cnnp_model_convolution_transpose_t* const self = (ccv_cnnp_model_convolution_transpose_t*)super;
1345 add_to_array(parameters, self->weights, is_trainable);
1346 if (self->bias.graph)
1347 add_to_array(parameters, self->bias, is_trainable);
1348}
1349
1350static ccv_cnnp_model_t* _ccv_cnnp_convolution_transpose_copy(const ccv_cnnp_model_t* const super, void* const context);
1351
1352static const ccv_cnnp_model_vtab_t ccv_cnnp_convolution_transpose_isa = {
1353 .build = _ccv_cnnp_convolution_transpose_build,
1354 .init_states = _ccv_cnnp_convolution_transpose_init_states,
1355 .add_to_parameter = _ccv_cnnp_convolution_transpose_add_to_parameter,
1356 .copy = _ccv_cnnp_convolution_transpose_copy,
1357};
1358
1359ccv_cnnp_model_t* ccv_cnnp_convolution_transpose(const int groups, const int filters, const int kdim[CCV_NNC_MAX_DIM_ALLOC(12)], const int dilation[CCV_NNC_MAX_DIM_ALLOC(12)], const int output_padding, const int no_bias, ccv_nnc_hint_t hint, const int format, const int is_trainable, const char* const name)
1360{
1361 ccv_cnnp_model_convolution_transpose_t* const model_convolution_transpose = (ccv_cnnp_model_convolution_transpose_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_convolution_transpose_t));
1362 model_convolution_transpose->super.isa = &ccv_cnnp_convolution_transpose_isa;
1363 model_convolution_transpose->super.input_size = 1;
1364 model_convolution_transpose->super.outputs = &model_convolution_transpose->output;
1365 model_convolution_transpose->super.output_size = 1;
1366 model_convolution_transpose->super.is_trainable = is_trainable;
1367 ccv_cnnp_model_copy_name(&model_convolution_transpose->super, name);
1368 model_convolution_transpose->weights.d = CCV_NNC_NO_TENSOR_SYMBOL;
1369 model_convolution_transpose->weights.graph = 0;
1370 model_convolution_transpose->bias.d = CCV_NNC_NO_TENSOR_SYMBOL;
1371 model_convolution_transpose->bias.graph = 0;
1372 model_convolution_transpose->groups = groups;
1373 model_convolution_transpose->filters = filters;
1374 memcpy(model_convolution_transpose->kdim, kdim, sizeof(model_convolution_transpose->kdim));
1375 memcpy(model_convolution_transpose->dilation, dilation, sizeof(model_convolution_transpose->dilation));
1376 model_convolution_transpose->output_padding = output_padding;
1377 model_convolution_transpose->no_bias = no_bias;
1378 model_convolution_transpose->hint = hint;
1379 model_convolution_transpose->format = format;
1380 return (ccv_cnnp_model_t*)model_convolution_transpose;
1381}
1382
1383static ccv_cnnp_model_t* _ccv_cnnp_convolution_transpose_copy(const ccv_cnnp_model_t* const super, void* const context)
1384{
1385 ccv_cnnp_model_convolution_transpose_t* const self = (ccv_cnnp_model_convolution_transpose_t*)super;
1386 return ccv_cnnp_convolution_transpose(self->groups, self->filters, self->kdim, self->dilation, self->output_padding, self->no_bias, self->hint, self->format, self->super.is_trainable, self->super.name);
1387}
1388
1389// MARK - Dense Layer
1390
1391typedef struct {
1392 ccv_cnnp_model_t super;
1393 ccv_nnc_tensor_symbol_t output;
1394 ccv_nnc_tensor_symbol_t weights;
1395 ccv_nnc_tensor_symbol_t bias;
1396 int count;
1397 int no_bias;
1398 int flags;
1399} ccv_cnnp_model_dense_t;
1400
1401static void _ccv_cnnp_dense_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
1402{
1403 ccv_cnnp_model_dense_t* const self = (ccv_cnnp_model_dense_t*)super;
1404 PRINT(CCV_CLI_VERBOSE, "[cnnp_dense_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_dense_build] -\n"); fflush(stdout); } } while
(0)
;
1405 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 1405, __extension__ __PRETTY_FUNCTION__); }))
;
1406 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 1406, __extension__ __PRETTY_FUNCTION__
); }))
;
1407 const ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
1408 ccv_nnc_tensor_param_t weights_params = params;
1409 memset(weights_params.dim, 0, sizeof(weights_params.dim));
1410 if (params.dim[0] != 0)
1411 {
1412 weights_params.dim[0] = self->count;
1413 weights_params.dim[1] = params.dim[ccv_nnc_tensor_nd(params.dim) - 1];
1414 }
1415 if (!self->weights.graph)
1416 self->weights = ccv_nnc_tensor_symbol_new(graph, weights_params, "weights");
1417 assert(self->weights.graph == graph)((void) sizeof ((self->weights.graph == graph) ? 1 : 0), __extension__
({ if (self->weights.graph == graph) ; else __assert_fail
("self->weights.graph == graph", "ccv_cnnp_model_addons.c"
, 1417, __extension__ __PRETTY_FUNCTION__); }))
;
1418 const ccv_nnc_tensor_symbol_t weights = ccv_cnnp_model_get_symbol(super, self->weights);
1419 ccv_nnc_tensor_param_t bias_params = params;
1420 memset(bias_params.dim, 0, sizeof(bias_params.dim));
1421 bias_params.dim[0] = self->count;
1422 ccv_nnc_cmd_t cmd = {0};
1423 cmd.cmd = CCV_NNC_GEMM_FORWARD;
1424 cmd.info.blas.a[0] = 1;
1425 cmd.info.blas.a[1] = 1;
1426 cmd.info.blas.transpose_b[0] = 0;
1427 cmd.info.blas.transpose_b[1] = 1;
1428 cmd.info.blas.flags = self->flags;
1429 ccv_nnc_tensor_param_t output_params;
1430 ccv_nnc_hint_tensor_auto(cmd, (ccv_nnc_tensor_param_t []){
1431 params,
1432 weights_params,
1433 bias_params,
1434 }, 3, ccv_nnc_no_hint, &output_params, 1);
1435 const ccv_nnc_tensor_symbol_t output = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
1436 if (self->no_bias)
1437 ccv_nnc_graph_exec_symbol_new(graph, cmd, TENSOR_SYMBOL_LIST(inputs[0], weights)(const ccv_nnc_tensor_symbol_t []){inputs[0], weights}, (1 +1
+1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 -1)
, TENSOR_SYMBOL_LIST(output)(const ccv_nnc_tensor_symbol_t []){output}, (1 +1 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, "dense");
1438 else {
1439 if (!self->bias.graph)
1440 self->bias = ccv_nnc_tensor_symbol_new(graph, bias_params, "bias");
1441 const ccv_nnc_tensor_symbol_t bias = ccv_cnnp_model_get_symbol(super, self->bias);
1442 ccv_nnc_graph_exec_symbol_new(graph, cmd, TENSOR_SYMBOL_LIST(inputs[0], weights, bias)(const ccv_nnc_tensor_symbol_t []){inputs[0], weights, bias},
(1 +1 +1 +1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(output)(const ccv_nnc_tensor_symbol_t []){output}, (1 +1 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, "dense");
1443 }
1444 outputs[0] = output;
1445}
1446
1447static void _ccv_cnnp_dense_init_states(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_cnnp_state_initializer_f initializer, void* const context)
1448{
1449 ccv_cnnp_model_dense_t* const self = (ccv_cnnp_model_dense_t*)super;
1450 const ccv_nnc_tensor_param_t weight_params = ccv_nnc_tensor_symbol_params(graph, self->weights);
1451 const int c = weight_params.dim[1];
1452 const float std = sqrtf(2) / sqrtf(c);
1453 const float bound = sqrtf(3) * std;
1454 initializer(context, CMD_RANDOM_UNIFORM_FORWARD(-bound, bound)ccv_nnc_cmd(CCV_NNC_RANDOM_UNIFORM_FORWARD, 0, (ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.blas={.a={-bound, bound}}}, 0)
, ccv_nnc_no_hint, 0, 0, self->weights);
1455 if (self->bias.graph)
1456 initializer(context, CMD_SET_FORWARD(0)ccv_nnc_cmd(CCV_NNC_SET_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={0,}}}, 0)
, ccv_nnc_no_hint, 0, 0, self->bias);
1457}
1458
1459static void _ccv_cnnp_dense_add_to_parameter(ccv_cnnp_model_t* const super, const ccv_cnnp_add_to_array_f add_to_array, void* const parameters, const int is_trainable)
1460{
1461 ccv_cnnp_model_dense_t* const self = (ccv_cnnp_model_dense_t*)super;
1462 add_to_array(parameters, self->weights, is_trainable);
1463 if (self->bias.graph)
1464 add_to_array(parameters, self->bias, is_trainable);
1465}
1466
1467static ccv_cnnp_model_t* _ccv_cnnp_dense_copy(const ccv_cnnp_model_t* const super, void* const context);
1468
1469static const ccv_cnnp_model_vtab_t ccv_cnnp_dense_isa = {
1470 .build = _ccv_cnnp_dense_build,
1471 .init_states = _ccv_cnnp_dense_init_states,
1472 .add_to_parameter = _ccv_cnnp_dense_add_to_parameter,
1473 .copy = _ccv_cnnp_dense_copy,
1474};
1475
1476ccv_cnnp_model_t* ccv_cnnp_dense(const int count, const int no_bias, const int flags, const int is_trainable, const char* const name)
1477{
1478 ccv_cnnp_model_dense_t* const model_dense = (ccv_cnnp_model_dense_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_dense_t));
1479 model_dense->super.isa = &ccv_cnnp_dense_isa;
1480 model_dense->super.input_size = 1;
1481 model_dense->super.outputs = &model_dense->output;
1482 model_dense->super.output_size = 1;
1483 model_dense->super.is_trainable = is_trainable;
1484 ccv_cnnp_model_copy_name(&model_dense->super, name);
1485 model_dense->weights.d = CCV_NNC_NO_TENSOR_SYMBOL;
1486 model_dense->weights.graph = 0;
1487 model_dense->bias.d = CCV_NNC_NO_TENSOR_SYMBOL;
1488 model_dense->bias.graph = 0;
1489 model_dense->count = count;
1490 model_dense->no_bias = no_bias;
1491 model_dense->flags = flags;
1492 return (ccv_cnnp_model_t*)model_dense;
1493}
1494
1495static ccv_cnnp_model_t* _ccv_cnnp_dense_copy(const ccv_cnnp_model_t* const super, void* const context)
1496{
1497 const ccv_cnnp_model_dense_t* const self = (const ccv_cnnp_model_dense_t*)super;
1498 return ccv_cnnp_dense(self->count, self->no_bias, self->flags, self->super.is_trainable, self->super.name);
1499}
1500
1501// MARK - Pool Layers
1502
1503typedef struct {
1504 ccv_cnnp_model_t super;
1505 ccv_nnc_tensor_symbol_t output;
1506 int kdim[CCV_NNC_MAX_DIM_ALLOC(12)];
1507 ccv_nnc_hint_t hint;
1508} ccv_cnnp_model_pool_t;
1509
1510static void _ccv_cnnp_max_pool_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
1511{
1512 ccv_cnnp_model_pool_t* const self = (ccv_cnnp_model_pool_t*)super;
1513 PRINT(CCV_CLI_VERBOSE, "[cnnp_max_pool_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_max_pool_build] -\n"); fflush(stdout); } } while
(0)
;
1514 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 1514, __extension__ __PRETTY_FUNCTION__); }))
;
1515 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 1515, __extension__ __PRETTY_FUNCTION__
); }))
;
1516 const ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
1517 const int hw = ccv_nnc_tensor_hw(params, ccv_nnc_tensor_nd(params.dim), CCV_NNC_MAX_DIM(2));
1518 ccv_nnc_cmd_t cmd;
1519 if (hw >= 0 && self->kdim[0] == 0 && self->kdim[1] == 0)
1520 cmd = CMD_MAX_POOL_FORWARD(params.dim[hw], params.dim[hw + 1])ccv_nnc_cmd(CCV_NNC_MAX_POOL_FORWARD, 0, ((ccv_nnc_cmd_param_t
){.size={.dim={params.dim[hw], params.dim[hw + 1],1}}}), 0)
;
1521 else
1522 cmd = CMD_MAX_POOL_FORWARD(self->kdim[0], self->kdim[1])ccv_nnc_cmd(CCV_NNC_MAX_POOL_FORWARD, 0, ((ccv_nnc_cmd_param_t
){.size={.dim={self->kdim[0], self->kdim[1],1}}}), 0)
;
1523 ccv_nnc_tensor_param_t output_params;
1524 ccv_nnc_hint_tensor_auto(cmd, &params, 1, self->hint, &output_params, 1);
1525 const ccv_nnc_tensor_symbol_t pool_output = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
1526 const ccv_nnc_graph_exec_symbol_t exec = ccv_nnc_graph_exec_symbol_new(graph, cmd, TENSOR_SYMBOL_LIST(inputs[0])(const ccv_nnc_tensor_symbol_t []){inputs[0]}, (1 +1 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(pool_output)(const ccv_nnc_tensor_symbol_t []){pool_output}, (1 +1 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, "max_pool");
1527 ccv_nnc_graph_exec_symbol_set_hint(graph, exec, self->hint);
1528 outputs[0] = pool_output;
1529}
1530
1531static ccv_cnnp_model_t* _ccv_cnnp_max_pool_copy(const ccv_cnnp_model_t* const super, void* const context);
1532
1533static const ccv_cnnp_model_vtab_t ccv_cnnp_max_pool_isa = {
1534 .build = _ccv_cnnp_max_pool_build,
1535 .copy = _ccv_cnnp_max_pool_copy,
1536};
1537
1538ccv_cnnp_model_t* ccv_cnnp_max_pool(const int kdim[CCV_NNC_MAX_DIM_ALLOC(12)], const ccv_nnc_hint_t hint, const char* const name)
1539{
1540 ccv_cnnp_model_pool_t* const model_pool = (ccv_cnnp_model_pool_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_pool_t));
1541 model_pool->super.isa = &ccv_cnnp_max_pool_isa;
1542 model_pool->super.input_size = 1;
1543 model_pool->super.outputs = &model_pool->output;
1544 model_pool->super.output_size = 1;
1545 ccv_cnnp_model_copy_name(&model_pool->super, name);
1546 memcpy(model_pool->kdim, kdim, sizeof(model_pool->kdim));
1547 model_pool->hint = hint;
1548 return (ccv_cnnp_model_t*)model_pool;
1549}
1550
1551static ccv_cnnp_model_t* _ccv_cnnp_max_pool_copy(const ccv_cnnp_model_t* const super, void* const context)
1552{
1553 const ccv_cnnp_model_pool_t* const self = (const ccv_cnnp_model_pool_t*)super;
1554 return ccv_cnnp_max_pool(self->kdim, self->hint, self->super.name);
1555}
1556
1557static void _ccv_cnnp_average_pool_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
1558{
1559 ccv_cnnp_model_pool_t* const self = (ccv_cnnp_model_pool_t*)super;
1560 PRINT(CCV_CLI_VERBOSE, "[cnnp_average_pool_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_average_pool_build] -\n"); fflush(stdout); }
} while (0)
;
1561 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 1561, __extension__ __PRETTY_FUNCTION__); }))
;
1562 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 1562, __extension__ __PRETTY_FUNCTION__
); }))
;
1563 const ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
1564 const int hw = ccv_nnc_tensor_hw(params, ccv_nnc_tensor_nd(params.dim), CCV_NNC_MAX_DIM(2));
1565 ccv_nnc_cmd_t cmd;
1566 if (hw >= 0 && self->kdim[0] == 0 && self->kdim[1] == 0)
1567 cmd = CMD_AVERAGE_POOL_FORWARD(params.dim[hw], params.dim[hw + 1])ccv_nnc_cmd(CCV_NNC_AVERAGE_POOL_FORWARD, 0, ((ccv_nnc_cmd_param_t
){.size={.dim={params.dim[hw], params.dim[hw + 1],1}}}), 0)
;
1568 else
1569 cmd = CMD_AVERAGE_POOL_FORWARD(self->kdim[0], self->kdim[1])ccv_nnc_cmd(CCV_NNC_AVERAGE_POOL_FORWARD, 0, ((ccv_nnc_cmd_param_t
){.size={.dim={self->kdim[0], self->kdim[1],1}}}), 0)
;
1570 ccv_nnc_tensor_param_t output_params;
1571 ccv_nnc_hint_tensor_auto(cmd, &params, 1, self->hint, &output_params, 1);
1572 const ccv_nnc_tensor_symbol_t pool_output = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
1573 const ccv_nnc_graph_exec_symbol_t exec = ccv_nnc_graph_exec_symbol_new(graph, cmd, TENSOR_SYMBOL_LIST(inputs[0])(const ccv_nnc_tensor_symbol_t []){inputs[0]}, (1 +1 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(pool_output)(const ccv_nnc_tensor_symbol_t []){pool_output}, (1 +1 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, "average_pool");
1574 ccv_nnc_graph_exec_symbol_set_hint(graph, exec, self->hint);
1575 outputs[0] = pool_output;
1576}
1577
1578static ccv_cnnp_model_t* _ccv_cnnp_average_pool_copy(const ccv_cnnp_model_t* const super, void* const context);
1579
1580static const ccv_cnnp_model_vtab_t ccv_cnnp_average_pool_isa = {
1581 .build = _ccv_cnnp_average_pool_build,
1582 .copy = _ccv_cnnp_average_pool_copy,
1583};
1584
1585ccv_cnnp_model_t* ccv_cnnp_average_pool(const int kdim[CCV_NNC_MAX_DIM_ALLOC(12)], const ccv_nnc_hint_t hint, const char* const name)
1586{
1587 ccv_cnnp_model_pool_t* const model_pool = (ccv_cnnp_model_pool_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_pool_t));
1588 model_pool->super.isa = &ccv_cnnp_average_pool_isa;
1589 model_pool->super.input_size = 1;
1590 model_pool->super.outputs = &model_pool->output;
1591 model_pool->super.output_size = 1;
1592 ccv_cnnp_model_copy_name(&model_pool->super, name);
1593 memcpy(model_pool->kdim, kdim, sizeof(model_pool->kdim));
1594 model_pool->hint = hint;
1595 return (ccv_cnnp_model_t*)model_pool;
1596}
1597
1598static ccv_cnnp_model_t* _ccv_cnnp_average_pool_copy(const ccv_cnnp_model_t* const super, void* const context)
1599{
1600 const ccv_cnnp_model_pool_t* const self = (const ccv_cnnp_model_pool_t*)super;
1601 return ccv_cnnp_average_pool(self->kdim, self->hint, self->super.name);
1602}
1603
1604// MARK - RELU Layer
1605
1606typedef struct {
1607 ccv_cnnp_model_t super;
1608 ccv_nnc_tensor_symbol_t output;
1609} ccv_cnnp_model_relu_t;
1610
1611static void _ccv_cnnp_relu_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
1612{
1613 PRINT(CCV_CLI_VERBOSE, "[cnnp_relu_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_relu_build] -\n"); fflush(stdout); } } while
(0)
;
1614 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 1614, __extension__ __PRETTY_FUNCTION__); }))
;
1615 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 1615, __extension__ __PRETTY_FUNCTION__
); }))
;
1616 ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
1617 ccv_nnc_tensor_param_t output_params;
1618 const ccv_nnc_cmd_t relu = CMD_RELU_FORWARD()ccv_nnc_cmd(CCV_NNC_RELU_FORWARD, 0, ccv_nnc_cmd_auto, 0);
1619 ccv_nnc_hint_tensor_auto(relu, (ccv_nnc_tensor_param_t []){
1620 params,
1621 }, 1, ccv_nnc_no_hint, &output_params, 1);
1622 const ccv_nnc_tensor_symbol_t relu_output = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
1623 ccv_nnc_graph_exec_symbol_new(graph, relu, TENSOR_SYMBOL_LIST(inputs[0])(const ccv_nnc_tensor_symbol_t []){inputs[0]}, (1 +1 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(relu_output)(const ccv_nnc_tensor_symbol_t []){relu_output}, (1 +1 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, "relu");
1624 outputs[0] = relu_output;
1625}
1626
1627static ccv_cnnp_model_t* _ccv_cnnp_relu_copy(const ccv_cnnp_model_t* const self, void* const context);
1628
1629static const ccv_cnnp_model_vtab_t ccv_cnnp_relu_isa = {
1630 .build = _ccv_cnnp_relu_build,
1631 .copy = _ccv_cnnp_relu_copy,
1632};
1633
1634ccv_cnnp_model_t* ccv_cnnp_relu(const char* const name)
1635{
1636 ccv_cnnp_model_relu_t* const model_relu = (ccv_cnnp_model_relu_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_relu_t));
1637 model_relu->super.isa = &ccv_cnnp_relu_isa;
1638 model_relu->super.input_size = 1;
1639 model_relu->super.outputs = &model_relu->output;
1640 model_relu->super.output_size = 1;
1641 ccv_cnnp_model_copy_name(&model_relu->super, name);
1642 return (ccv_cnnp_model_t*)model_relu;
1643}
1644
1645static ccv_cnnp_model_t* _ccv_cnnp_relu_copy(const ccv_cnnp_model_t* const self, void* const context)
1646{
1647 return ccv_cnnp_relu(self->name);
1648}
1649
1650// MARK - Sigmoid Layer
1651
1652typedef struct {
1653 ccv_cnnp_model_t super;
1654 ccv_nnc_tensor_symbol_t output;
1655} ccv_cnnp_model_sigmoid_t;
1656
1657static void _ccv_cnnp_sigmoid_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
1658{
1659 PRINT(CCV_CLI_VERBOSE, "[cnnp_sigmoid_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_sigmoid_build] -\n"); fflush(stdout); } } while
(0)
;
1660 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 1660, __extension__ __PRETTY_FUNCTION__); }))
;
1661 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 1661, __extension__ __PRETTY_FUNCTION__
); }))
;
1662 ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
1663 ccv_nnc_tensor_param_t output_params;
1664 const ccv_nnc_cmd_t sigmoid = CMD_SIGMOID_FORWARD()ccv_nnc_cmd(CCV_NNC_SIGMOID_FORWARD, 0, ccv_nnc_cmd_auto, 0);
1665 ccv_nnc_hint_tensor_auto(sigmoid, (ccv_nnc_tensor_param_t []){
1666 params,
1667 }, 1, ccv_nnc_no_hint, &output_params, 1);
1668 const ccv_nnc_tensor_symbol_t sigmoid_output = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
1669 ccv_nnc_graph_exec_symbol_new(graph, sigmoid, TENSOR_SYMBOL_LIST(inputs[0])(const ccv_nnc_tensor_symbol_t []){inputs[0]}, (1 +1 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(sigmoid_output)(const ccv_nnc_tensor_symbol_t []){sigmoid_output}, (1 +1 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1
)
, "sigmoid");
1670 outputs[0] = sigmoid_output;
1671}
1672
1673static ccv_cnnp_model_t* _ccv_cnnp_sigmoid_copy(const ccv_cnnp_model_t* const self, void* const context);
1674
1675static const ccv_cnnp_model_vtab_t ccv_cnnp_sigmoid_isa = {
1676 .build = _ccv_cnnp_sigmoid_build,
1677 .copy = _ccv_cnnp_sigmoid_copy,
1678};
1679
1680ccv_cnnp_model_t* ccv_cnnp_sigmoid(const char* const name)
1681{
1682 ccv_cnnp_model_sigmoid_t* const model_sigmoid = (ccv_cnnp_model_sigmoid_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_sigmoid_t));
1683 model_sigmoid->super.isa = &ccv_cnnp_sigmoid_isa;
1684 model_sigmoid->super.input_size = 1;
1685 model_sigmoid->super.outputs = &model_sigmoid->output;
1686 model_sigmoid->super.output_size = 1;
1687 ccv_cnnp_model_copy_name(&model_sigmoid->super, name);
1688 return (ccv_cnnp_model_t*)model_sigmoid;
1689}
1690
1691static ccv_cnnp_model_t* _ccv_cnnp_sigmoid_copy(const ccv_cnnp_model_t* const self, void* const context)
1692{
1693 return ccv_cnnp_sigmoid(self->name);
1694}
1695
1696// MARK - Tanh Layer
1697
1698typedef struct {
1699 ccv_cnnp_model_t super;
1700 ccv_nnc_tensor_symbol_t output;
1701} ccv_cnnp_model_tanh_t;
1702
1703static void _ccv_cnnp_tanh_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
1704{
1705 PRINT(CCV_CLI_VERBOSE, "[cnnp_tanh_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_tanh_build] -\n"); fflush(stdout); } } while
(0)
;
1706 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 1706, __extension__ __PRETTY_FUNCTION__); }))
;
1707 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 1707, __extension__ __PRETTY_FUNCTION__
); }))
;
1708 ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
1709 ccv_nnc_tensor_param_t output_params;
1710 const ccv_nnc_cmd_t tanh = CMD_TANH_FORWARD()ccv_nnc_cmd(CCV_NNC_TANH_FORWARD, 0, ccv_nnc_cmd_auto, 0);
1711 ccv_nnc_hint_tensor_auto(tanh, (ccv_nnc_tensor_param_t []){
1712 params,
1713 }, 1, ccv_nnc_no_hint, &output_params, 1);
1714 const ccv_nnc_tensor_symbol_t tanh_output = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
1715 ccv_nnc_graph_exec_symbol_new(graph, tanh, TENSOR_SYMBOL_LIST(inputs[0])(const ccv_nnc_tensor_symbol_t []){inputs[0]}, (1 +1 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(tanh_output)(const ccv_nnc_tensor_symbol_t []){tanh_output}, (1 +1 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, "tanh");
1716 outputs[0] = tanh_output;
1717}
1718
1719static ccv_cnnp_model_t* _ccv_cnnp_tanh_copy(const ccv_cnnp_model_t* const self, void* const context);
1720
1721static const ccv_cnnp_model_vtab_t ccv_cnnp_tanh_isa = {
1722 .build = _ccv_cnnp_tanh_build,
1723 .copy = _ccv_cnnp_tanh_copy,
1724};
1725
1726ccv_cnnp_model_t* ccv_cnnp_tanh(const char* const name)
1727{
1728 ccv_cnnp_model_tanh_t* const model_tanh = (ccv_cnnp_model_tanh_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_tanh_t));
1729 model_tanh->super.isa = &ccv_cnnp_tanh_isa;
1730 model_tanh->super.input_size = 1;
1731 model_tanh->super.outputs = &model_tanh->output;
1732 model_tanh->super.output_size = 1;
1733 ccv_cnnp_model_copy_name(&model_tanh->super, name);
1734 return (ccv_cnnp_model_t*)model_tanh;
1735}
1736
1737static ccv_cnnp_model_t* _ccv_cnnp_tanh_copy(const ccv_cnnp_model_t* const self, void* const context)
1738{
1739 return ccv_cnnp_tanh(self->name);
1740}
1741
1742// MARK - Exp Layer
1743
1744typedef struct {
1745 ccv_cnnp_model_t super;
1746 ccv_nnc_tensor_symbol_t output;
1747} ccv_cnnp_model_exp_t;
1748
1749static void _ccv_cnnp_exp_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
1750{
1751 PRINT(CCV_CLI_VERBOSE, "[cnnp_exp_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_exp_build] -\n"); fflush(stdout); } } while (
0)
;
1752 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 1752, __extension__ __PRETTY_FUNCTION__); }))
;
1753 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 1753, __extension__ __PRETTY_FUNCTION__
); }))
;
1754 ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
1755 ccv_nnc_tensor_param_t output_params;
1756 const ccv_nnc_cmd_t exp = CMD_EWEXP_FORWARD()ccv_nnc_cmd(CCV_NNC_EWEXP_FORWARD, 0, ccv_nnc_cmd_auto, 0);
1757 ccv_nnc_hint_tensor_auto(exp, (ccv_nnc_tensor_param_t []){
1758 params,
1759 }, 1, ccv_nnc_no_hint, &output_params, 1);
1760 const ccv_nnc_tensor_symbol_t exp_output = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
1761 ccv_nnc_graph_exec_symbol_new(graph, exp, TENSOR_SYMBOL_LIST(inputs[0])(const ccv_nnc_tensor_symbol_t []){inputs[0]}, (1 +1 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(exp_output)(const ccv_nnc_tensor_symbol_t []){exp_output}, (1 +1 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, "exp");
1762 outputs[0] = exp_output;
1763}
1764
1765static ccv_cnnp_model_t* _ccv_cnnp_exp_copy(const ccv_cnnp_model_t* const self, void* const context);
1766
1767static const ccv_cnnp_model_vtab_t ccv_cnnp_exp_isa = {
1768 .build = _ccv_cnnp_exp_build,
1769 .copy = _ccv_cnnp_exp_copy,
1770};
1771
1772ccv_cnnp_model_t* ccv_cnnp_exp(const char* const name)
1773{
1774 ccv_cnnp_model_exp_t* const model_exp = (ccv_cnnp_model_exp_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_exp_t));
1775 model_exp->super.isa = &ccv_cnnp_exp_isa;
1776 model_exp->super.input_size = 1;
1777 model_exp->super.outputs = &model_exp->output;
1778 model_exp->super.output_size = 1;
1779 ccv_cnnp_model_copy_name(&model_exp->super, name);
1780 return (ccv_cnnp_model_t*)model_exp;
1781}
1782
1783static ccv_cnnp_model_t* _ccv_cnnp_exp_copy(const ccv_cnnp_model_t* const self, void* const context)
1784{
1785 return ccv_cnnp_exp(self->name);
1786}
1787
1788// MARK - Softplus Layer
1789
1790typedef struct {
1791 ccv_cnnp_model_t super;
1792 ccv_nnc_tensor_symbol_t output;
1793} ccv_cnnp_model_softplus_t;
1794
1795static void _ccv_cnnp_softplus_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
1796{
1797 PRINT(CCV_CLI_VERBOSE, "[cnnp_softplus_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_softplus_build] -\n"); fflush(stdout); } } while
(0)
;
1798 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 1798, __extension__ __PRETTY_FUNCTION__); }))
;
1799 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 1799, __extension__ __PRETTY_FUNCTION__
); }))
;
1800 ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
1801 ccv_nnc_tensor_param_t output_params;
1802 const ccv_nnc_cmd_t softplus = CMD_EWSOFTPLUS_FORWARD()ccv_nnc_cmd(CCV_NNC_EWSOFTPLUS_FORWARD, 0, ccv_nnc_cmd_auto, 0
)
;
1803 ccv_nnc_hint_tensor_auto(softplus, (ccv_nnc_tensor_param_t []){
1804 params,
1805 }, 1, ccv_nnc_no_hint, &output_params, 1);
1806 const ccv_nnc_tensor_symbol_t softplus_output = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
1807 ccv_nnc_graph_exec_symbol_new(graph, softplus, TENSOR_SYMBOL_LIST(inputs[0])(const ccv_nnc_tensor_symbol_t []){inputs[0]}, (1 +1 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(softplus_output)(const ccv_nnc_tensor_symbol_t []){softplus_output}, (1 +1 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -
1)
, "softplus");
1808 outputs[0] = softplus_output;
1809}
1810
1811static ccv_cnnp_model_t* _ccv_cnnp_softplus_copy(const ccv_cnnp_model_t* const self, void* const context);
1812
1813static const ccv_cnnp_model_vtab_t ccv_cnnp_softplus_isa = {
1814 .build = _ccv_cnnp_softplus_build,
1815 .copy = _ccv_cnnp_softplus_copy,
1816};
1817
1818ccv_cnnp_model_t* ccv_cnnp_softplus(const char* const name)
1819{
1820 ccv_cnnp_model_softplus_t* const model_softplus = (ccv_cnnp_model_softplus_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_softplus_t));
1821 model_softplus->super.isa = &ccv_cnnp_softplus_isa;
1822 model_softplus->super.input_size = 1;
1823 model_softplus->super.outputs = &model_softplus->output;
1824 model_softplus->super.output_size = 1;
1825 ccv_cnnp_model_copy_name(&model_softplus->super, name);
1826 return (ccv_cnnp_model_t*)model_softplus;
1827}
1828
1829static ccv_cnnp_model_t* _ccv_cnnp_softplus_copy(const ccv_cnnp_model_t* const self, void* const context)
1830{
1831 return ccv_cnnp_softplus(self->name);
1832}
1833
1834// MARK - Swish Layer
1835
1836typedef struct {
1837 ccv_cnnp_model_t super;
1838 ccv_nnc_tensor_symbol_t output;
1839 float beta;
1840} ccv_cnnp_model_swish_t;
1841
1842static void _ccv_cnnp_swish_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
1843{
1844 PRINT(CCV_CLI_VERBOSE, "[cnnp_swish_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_swish_build] -\n"); fflush(stdout); } } while
(0)
;
1845 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 1845, __extension__ __PRETTY_FUNCTION__); }))
;
1846 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 1846, __extension__ __PRETTY_FUNCTION__
); }))
;
1847 ccv_cnnp_model_swish_t* const self = (ccv_cnnp_model_swish_t*)super;
1848 ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
1849 ccv_nnc_tensor_param_t output_params;
1850 const ccv_nnc_cmd_t swish = CMD_SWISH_FORWARD(self->beta)ccv_nnc_cmd(CCV_NNC_SWISH_FORWARD, 0, ((ccv_nnc_cmd_param_t){
.size={.dim={1,1,1}},.swish={.beta=self->beta}}), 0)
;
1851 ccv_nnc_hint_tensor_auto(swish, (ccv_nnc_tensor_param_t []){
1852 params,
1853 }, 1, ccv_nnc_no_hint, &output_params, 1);
1854 const ccv_nnc_tensor_symbol_t swish_output = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
1855 ccv_nnc_graph_exec_symbol_new(graph, swish, TENSOR_SYMBOL_LIST(inputs[0])(const ccv_nnc_tensor_symbol_t []){inputs[0]}, (1 +1 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(swish_output)(const ccv_nnc_tensor_symbol_t []){swish_output}, (1 +1 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, "swish");
1856 outputs[0] = swish_output;
1857}
1858
1859static ccv_cnnp_model_t* _ccv_cnnp_swish_copy(const ccv_cnnp_model_t* const self, void* const context);
1860
1861static const ccv_cnnp_model_vtab_t ccv_cnnp_swish_isa = {
1862 .build = _ccv_cnnp_swish_build,
1863 .copy = _ccv_cnnp_swish_copy,
1864};
1865
1866ccv_cnnp_model_t* ccv_cnnp_swish(const float beta, const char* const name)
1867{
1868 ccv_cnnp_model_swish_t* const model_swish = (ccv_cnnp_model_swish_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_swish_t));
1869 model_swish->super.isa = &ccv_cnnp_swish_isa;
1870 model_swish->super.input_size = 1;
1871 model_swish->super.outputs = &model_swish->output;
1872 model_swish->super.output_size = 1;
1873 model_swish->beta = beta;
1874 ccv_cnnp_model_copy_name(&model_swish->super, name);
1875 return (ccv_cnnp_model_t*)model_swish;
1876}
1877
1878static ccv_cnnp_model_t* _ccv_cnnp_swish_copy(const ccv_cnnp_model_t* const self, void* const context)
1879{
1880 const ccv_cnnp_model_swish_t* const swish = (const ccv_cnnp_model_swish_t*)self;
1881 return ccv_cnnp_swish(swish->beta, self->name);
1882}
1883
1884// MARK - Swish Mul Layer
1885
1886typedef struct {
1887 ccv_cnnp_model_t super;
1888 ccv_nnc_tensor_symbol_t output;
1889 float beta;
1890 float scale;
1891} ccv_cnnp_model_swish_mul_t;
1892
1893static void _ccv_cnnp_swish_mul_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
1894{
1895 PRINT(CCV_CLI_VERBOSE, "[cnnp_swish_mul_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_swish_mul_build] -\n"); fflush(stdout); } } while
(0)
;
1896 assert(input_size == 2)((void) sizeof ((input_size == 2) ? 1 : 0), __extension__ ({ if
(input_size == 2) ; else __assert_fail ("input_size == 2", "ccv_cnnp_model_addons.c"
, 1896, __extension__ __PRETTY_FUNCTION__); }))
;
1897 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 1897, __extension__ __PRETTY_FUNCTION__
); }))
;
1898 const ccv_cnnp_model_swish_mul_t* const self = (const ccv_cnnp_model_swish_mul_t*)super;
1899 ccv_nnc_tensor_param_t input_params[2];
1900 int i;
1901 for (i = 0; i < 2; i++)
1902 input_params[i] = ccv_nnc_tensor_symbol_params(graph, inputs[i]);
1903 ccv_nnc_tensor_param_t output_params;
1904 const ccv_nnc_cmd_t swish_mul = CMD_SWISH_MUL_FORWARD(self->beta, self->scale)ccv_nnc_cmd(CCV_NNC_SWISH_MUL_FORWARD, 0, ((ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.swish_mul={.beta=self->beta,.scale
=self->scale}}), 0)
;
1905 ccv_nnc_hint_tensor_auto(swish_mul, input_params, 2, ccv_nnc_no_hint, &output_params, 1);
1906 outputs[0] = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
1907 ccv_nnc_graph_exec_symbol_new(graph, swish_mul, inputs, input_size, outputs, output_size, "swish_mul");
1908}
1909
1910static ccv_cnnp_model_t* _ccv_cnnp_swish_mul_copy(const ccv_cnnp_model_t* const self, void* const context);
1911
1912static const ccv_cnnp_model_vtab_t ccv_cnnp_swish_mul_isa = {
1913 .build = _ccv_cnnp_swish_mul_build,
1914 .copy = _ccv_cnnp_swish_mul_copy,
1915};
1916
1917ccv_cnnp_model_t* ccv_cnnp_swish_mul(const float beta, const float scale, const char* const name)
1918{
1919 ccv_cnnp_model_swish_mul_t* const model_swish_mul = (ccv_cnnp_model_swish_mul_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_swish_mul_t));
1920 model_swish_mul->super.isa = &ccv_cnnp_swish_mul_isa;
1921 model_swish_mul->super.input_size = 2;
1922 model_swish_mul->super.outputs = &model_swish_mul->output;
1923 model_swish_mul->super.output_size = 1;
1924 model_swish_mul->beta = beta;
1925 model_swish_mul->scale = scale;
1926 ccv_cnnp_model_copy_name(&model_swish_mul->super, name);
1927 return (ccv_cnnp_model_t*)model_swish_mul;
1928}
1929
1930static ccv_cnnp_model_t* _ccv_cnnp_swish_mul_copy(const ccv_cnnp_model_t* const super, void* const context)
1931{
1932 const ccv_cnnp_model_swish_mul_t* const self = (const ccv_cnnp_model_swish_mul_t*)super;
1933 return ccv_cnnp_swish_mul(self->beta, self->scale, self->super.name);
1934}
1935
1936// MARK - GELU Layer
1937
1938typedef struct {
1939 ccv_cnnp_model_t super;
1940 ccv_nnc_tensor_symbol_t output;
1941 int tanh;
1942} ccv_cnnp_model_gelu_t;
1943
1944static void _ccv_cnnp_gelu_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
1945{
1946 PRINT(CCV_CLI_VERBOSE, "[cnnp_gelu_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_gelu_build] -\n"); fflush(stdout); } } while
(0)
;
1947 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 1947, __extension__ __PRETTY_FUNCTION__); }))
;
1948 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 1948, __extension__ __PRETTY_FUNCTION__
); }))
;
1949 ccv_cnnp_model_gelu_t* const self = (ccv_cnnp_model_gelu_t*)super;
1950 ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
1951 ccv_nnc_tensor_param_t output_params;
1952 const ccv_nnc_cmd_t gelu = CMD_GELU_FORWARD(self->tanh)ccv_nnc_cmd(CCV_NNC_GELU_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.gelu={.tanh=self->tanh}}, 0)
;
1953 ccv_nnc_hint_tensor_auto(gelu, (ccv_nnc_tensor_param_t []){
1954 params,
1955 }, 1, ccv_nnc_no_hint, &output_params, 1);
1956 const ccv_nnc_tensor_symbol_t gelu_output = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
1957 ccv_nnc_graph_exec_symbol_new(graph, gelu, TENSOR_SYMBOL_LIST(inputs[0])(const ccv_nnc_tensor_symbol_t []){inputs[0]}, (1 +1 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(gelu_output)(const ccv_nnc_tensor_symbol_t []){gelu_output}, (1 +1 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, "gelu");
1958 outputs[0] = gelu_output;
1959}
1960
1961static ccv_cnnp_model_t* _ccv_cnnp_gelu_copy(const ccv_cnnp_model_t* const self, void* const context);
1962
1963static const ccv_cnnp_model_vtab_t ccv_cnnp_gelu_isa = {
1964 .build = _ccv_cnnp_gelu_build,
1965 .copy = _ccv_cnnp_gelu_copy,
1966};
1967
1968ccv_cnnp_model_t* ccv_cnnp_gelu(const int tanh, const char* const name)
1969{
1970 ccv_cnnp_model_gelu_t* const model_gelu = (ccv_cnnp_model_gelu_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_gelu_t));
1971 model_gelu->super.isa = &ccv_cnnp_gelu_isa;
1972 model_gelu->super.input_size = 1;
1973 model_gelu->super.outputs = &model_gelu->output;
1974 model_gelu->super.output_size = 1;
1975 model_gelu->tanh = tanh;
1976 ccv_cnnp_model_copy_name(&model_gelu->super, name);
1977 return (ccv_cnnp_model_t*)model_gelu;
1978}
1979
1980static ccv_cnnp_model_t* _ccv_cnnp_gelu_copy(const ccv_cnnp_model_t* const super, void* const context)
1981{
1982 ccv_cnnp_model_gelu_t* const self = (ccv_cnnp_model_gelu_t*)super;
1983 return ccv_cnnp_gelu(self->tanh, self->super.name);
1984}
1985
1986// MARK - Leaky ReLU Layer
1987
1988typedef struct {
1989 ccv_cnnp_model_t super;
1990 ccv_nnc_tensor_symbol_t output;
1991 float negative_slope;
1992} ccv_cnnp_model_leaky_relu_t;
1993
1994static void _ccv_cnnp_leaky_relu_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
1995{
1996 PRINT(CCV_CLI_VERBOSE, "[cnnp_leaky_relu_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_leaky_relu_build] -\n"); fflush(stdout); } }
while (0)
;
1997 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 1997, __extension__ __PRETTY_FUNCTION__); }))
;
1998 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 1998, __extension__ __PRETTY_FUNCTION__
); }))
;
1999 ccv_cnnp_model_leaky_relu_t* const self = (ccv_cnnp_model_leaky_relu_t*)super;
2000 ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
2001 ccv_nnc_tensor_param_t output_params;
2002 const ccv_nnc_cmd_t leaky_relu = CMD_LEAKY_RELU_FORWARD(self->negative_slope)ccv_nnc_cmd(CCV_NNC_LEAKY_RELU_FORWARD, 0, (ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.leaky_relu={.negative_slope=self->
negative_slope}}, 0)
;
2003 ccv_nnc_hint_tensor_auto(leaky_relu, (ccv_nnc_tensor_param_t []){
2004 params,
2005 }, 1, ccv_nnc_no_hint, &output_params, 1);
2006 const ccv_nnc_tensor_symbol_t leaky_relu_output = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
2007 ccv_nnc_graph_exec_symbol_new(graph, leaky_relu, TENSOR_SYMBOL_LIST(inputs[0])(const ccv_nnc_tensor_symbol_t []){inputs[0]}, (1 +1 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(leaky_relu_output)(const ccv_nnc_tensor_symbol_t []){leaky_relu_output}, (1 +1 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
-1)
, "leaky_relu");
2008 outputs[0] = leaky_relu_output;
2009}
2010
2011static ccv_cnnp_model_t* _ccv_cnnp_leaky_relu_copy(const ccv_cnnp_model_t* const self, void* const context);
2012
2013static const ccv_cnnp_model_vtab_t ccv_cnnp_leaky_relu_isa = {
2014 .build = _ccv_cnnp_leaky_relu_build,
2015 .copy = _ccv_cnnp_leaky_relu_copy,
2016};
2017
2018ccv_cnnp_model_t* ccv_cnnp_leaky_relu(const float negative_slope, const char* const name)
2019{
2020 ccv_cnnp_model_leaky_relu_t* const model_leaky_relu = (ccv_cnnp_model_leaky_relu_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_leaky_relu_t));
2021 model_leaky_relu->super.isa = &ccv_cnnp_leaky_relu_isa;
2022 model_leaky_relu->super.input_size = 1;
2023 model_leaky_relu->super.outputs = &model_leaky_relu->output;
2024 model_leaky_relu->super.output_size = 1;
2025 model_leaky_relu->negative_slope = negative_slope;
2026 ccv_cnnp_model_copy_name(&model_leaky_relu->super, name);
2027 return (ccv_cnnp_model_t*)model_leaky_relu;
2028}
2029
2030static ccv_cnnp_model_t* _ccv_cnnp_leaky_relu_copy(const ccv_cnnp_model_t* const super, void* const context)
2031{
2032 ccv_cnnp_model_leaky_relu_t* const self = (ccv_cnnp_model_leaky_relu_t*)super;
2033 return ccv_cnnp_leaky_relu(self->negative_slope, self->super.name);
2034}
2035
2036// MARK - Softmax Layer
2037
2038typedef struct {
2039 ccv_cnnp_model_t super;
2040 ccv_nnc_tensor_symbol_t output;
2041} ccv_cnnp_model_softmax_t;
2042
2043static void _ccv_cnnp_softmax_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
2044{
2045 PRINT(CCV_CLI_VERBOSE, "[cnnp_softmax_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_softmax_build] -\n"); fflush(stdout); } } while
(0)
;
2046 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 2046, __extension__ __PRETTY_FUNCTION__); }))
;
2047 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 2047, __extension__ __PRETTY_FUNCTION__
); }))
;
2048 ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
2049 ccv_nnc_tensor_param_t output_params;
2050 const ccv_nnc_cmd_t softmax = CMD_SOFTMAX_FORWARD()ccv_nnc_cmd(CCV_NNC_SOFTMAX_FORWARD, 0, ccv_nnc_cmd_auto, 0);
2051 ccv_nnc_hint_tensor_auto(softmax, (ccv_nnc_tensor_param_t []){
2052 params,
2053 }, 1, ccv_nnc_no_hint, &output_params, 1);
2054 const ccv_nnc_tensor_symbol_t softmax_output = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
2055 ccv_nnc_graph_exec_symbol_new(graph, softmax, TENSOR_SYMBOL_LIST(inputs[0])(const ccv_nnc_tensor_symbol_t []){inputs[0]}, (1 +1 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(softmax_output)(const ccv_nnc_tensor_symbol_t []){softmax_output}, (1 +1 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1
)
, "softmax");
2056 outputs[0] = softmax_output;
2057}
2058
2059static ccv_cnnp_model_t* _ccv_cnnp_softmax_copy(const ccv_cnnp_model_t* const self, void* const context);
2060
2061static const ccv_cnnp_model_vtab_t ccv_cnnp_softmax_isa = {
2062 .build = _ccv_cnnp_softmax_build,
2063 .copy = _ccv_cnnp_softmax_copy,
2064};
2065
2066ccv_cnnp_model_t* ccv_cnnp_softmax(const char* const name)
2067{
2068 ccv_cnnp_model_softmax_t* const model_softmax = (ccv_cnnp_model_softmax_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_softmax_t));
2069 model_softmax->super.isa = &ccv_cnnp_softmax_isa;
2070 model_softmax->super.input_size = 1;
2071 model_softmax->super.outputs = &model_softmax->output;
2072 model_softmax->super.output_size = 1;
2073 ccv_cnnp_model_copy_name(&model_softmax->super, name);
2074 return (ccv_cnnp_model_t*)model_softmax;
2075}
2076
2077static ccv_cnnp_model_t* _ccv_cnnp_softmax_copy(const ccv_cnnp_model_t* const self, void* const context)
2078{
2079 return ccv_cnnp_softmax(self->name);
2080}
2081
2082// MARK - Add Layer
2083
2084typedef struct {
2085 ccv_cnnp_model_t super;
2086 float p;
2087 float q;
2088 ccv_nnc_tensor_symbol_t output;
2089} ccv_cnnp_model_add_t;
2090
2091static void _ccv_cnnp_add_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
2092{
2093 PRINT(CCV_CLI_VERBOSE, "[cnnp_add_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_add_build] -\n"); fflush(stdout); } } while (
0)
;
2094 const ccv_cnnp_model_add_t* const self = (const ccv_cnnp_model_add_t*)super;
2095 assert(input_size == 2)((void) sizeof ((input_size == 2) ? 1 : 0), __extension__ ({ if
(input_size == 2) ; else __assert_fail ("input_size == 2", "ccv_cnnp_model_addons.c"
, 2095, __extension__ __PRETTY_FUNCTION__); }))
;
2096 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 2096, __extension__ __PRETTY_FUNCTION__
); }))
;
2097 ccv_nnc_tensor_param_t input_params[2];
2098 int i;
2099 for (i = 0; i < 2; i++)
2100 input_params[i] = ccv_nnc_tensor_symbol_params(graph, inputs[i]);
2101 ccv_nnc_tensor_param_t output_params;
2102 const ccv_nnc_cmd_t add = CMD_ADD_FORWARD(self->p, self->q)ccv_nnc_cmd(CCV_NNC_ADD_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={self->p, self->q}}}, 0)
;
2103 ccv_nnc_hint_tensor_auto(add, input_params, 2, ccv_nnc_no_hint, &output_params, 1);
2104 outputs[0] = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
2105 ccv_nnc_graph_exec_symbol_new(graph, add, inputs, input_size, outputs, output_size, "add");
2106}
2107
2108static ccv_cnnp_model_t* _ccv_cnnp_add_copy(const ccv_cnnp_model_t* const self, void* const context);
2109
2110static const ccv_cnnp_model_vtab_t ccv_cnnp_add_isa = {
2111 .build = _ccv_cnnp_add_build,
2112 .copy = _ccv_cnnp_add_copy,
2113};
2114
2115ccv_cnnp_model_t* ccv_cnnp_add(const float p, const float q, const char* const name)
2116{
2117 ccv_cnnp_model_add_t* const model_add = (ccv_cnnp_model_add_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_add_t));
2118 model_add->super.isa = &ccv_cnnp_add_isa;
2119 model_add->super.input_size = 2;
2120 model_add->super.outputs = &model_add->output;
2121 model_add->super.output_size = 1;
2122 model_add->p = p;
2123 model_add->q = q;
2124 ccv_cnnp_model_copy_name(&model_add->super, name);
2125 return (ccv_cnnp_model_t*)model_add;
2126}
2127
2128static ccv_cnnp_model_t* _ccv_cnnp_add_copy(const ccv_cnnp_model_t* const super, void* const context)
2129{
2130 const ccv_cnnp_model_add_t* const self = (const ccv_cnnp_model_add_t*)super;
2131 return ccv_cnnp_add(self->p, self->q, self->super.name);
2132}
2133
2134// MARK - Mul Layer
2135
2136typedef struct {
2137 ccv_cnnp_model_t super;
2138 ccv_nnc_tensor_symbol_t output;
2139 float p;
2140} ccv_cnnp_model_mul_t;
2141
2142static void _ccv_cnnp_mul_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
2143{
2144 PRINT(CCV_CLI_VERBOSE, "[cnnp_mul_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_mul_build] -\n"); fflush(stdout); } } while (
0)
;
2145 const ccv_cnnp_model_mul_t* const self = (const ccv_cnnp_model_mul_t*)super;
2146 assert(input_size == 2)((void) sizeof ((input_size == 2) ? 1 : 0), __extension__ ({ if
(input_size == 2) ; else __assert_fail ("input_size == 2", "ccv_cnnp_model_addons.c"
, 2146, __extension__ __PRETTY_FUNCTION__); }))
;
2147 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 2147, __extension__ __PRETTY_FUNCTION__
); }))
;
2148 ccv_nnc_tensor_param_t input_params[2];
2149 int i;
2150 for (i = 0; i < 2; i++)
2151 input_params[i] = ccv_nnc_tensor_symbol_params(graph, inputs[i]);
2152 ccv_nnc_tensor_param_t output_params;
2153 const ccv_nnc_cmd_t mul = CMD_MUL_FORWARD(self->p)ccv_nnc_cmd(CCV_NNC_MUL_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={self->p,}}}, 0)
;
2154 ccv_nnc_hint_tensor_auto(mul, input_params, 2, ccv_nnc_no_hint, &output_params, 1);
2155 outputs[0] = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
2156 ccv_nnc_graph_exec_symbol_new(graph, mul, inputs, input_size, outputs, output_size, "mul");
2157}
2158
2159static ccv_cnnp_model_t* _ccv_cnnp_mul_copy(const ccv_cnnp_model_t* const self, void* const context);
2160
2161static const ccv_cnnp_model_vtab_t ccv_cnnp_mul_isa = {
2162 .build = _ccv_cnnp_mul_build,
2163 .copy = _ccv_cnnp_mul_copy,
2164};
2165
2166ccv_cnnp_model_t* ccv_cnnp_mul(const float p, const char* const name)
2167{
2168 ccv_cnnp_model_mul_t* const model_mul = (ccv_cnnp_model_mul_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_mul_t));
2169 model_mul->super.isa = &ccv_cnnp_mul_isa;
2170 model_mul->super.input_size = 2;
2171 model_mul->super.outputs = &model_mul->output;
2172 model_mul->super.output_size = 1;
2173 model_mul->p = p;
2174 ccv_cnnp_model_copy_name(&model_mul->super, name);
2175 return (ccv_cnnp_model_t*)model_mul;
2176}
2177
2178static ccv_cnnp_model_t* _ccv_cnnp_mul_copy(const ccv_cnnp_model_t* const super, void* const context)
2179{
2180 const ccv_cnnp_model_mul_t* const self = (const ccv_cnnp_model_mul_t*)super;
2181 return ccv_cnnp_mul(self->p, self->super.name);
2182}
2183
2184// MARK - Scalar Mul Layer
2185
2186typedef struct {
2187 ccv_cnnp_model_t super;
2188 ccv_nnc_tensor_symbol_t output;
2189 float a;
2190} ccv_cnnp_model_scalar_mul_t;
2191
2192static void _ccv_cnnp_scalar_mul_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
2193{
2194 PRINT(CCV_CLI_VERBOSE, "[cnnp_scalar_mul_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_scalar_mul_build] -\n"); fflush(stdout); } }
while (0)
;
2195 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 2195, __extension__ __PRETTY_FUNCTION__); }))
;
2196 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 2196, __extension__ __PRETTY_FUNCTION__
); }))
;
2197 ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
2198 ccv_nnc_tensor_param_t output_params;
2199 ccv_cnnp_model_scalar_mul_t* const self = (ccv_cnnp_model_scalar_mul_t*)super;
2200 const ccv_nnc_cmd_t scalar_mul = CMD_SCALAR_MUL_FORWARD(self->a)ccv_nnc_cmd(CCV_NNC_SCALAR_MUL_FORWARD, 0, (ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.blas={.a={self->a,}}}, 0)
;
2201 ccv_nnc_hint_tensor_auto(scalar_mul, (ccv_nnc_tensor_param_t []){
2202 params,
2203 }, 1, ccv_nnc_no_hint, &output_params, 1);
2204 const ccv_nnc_tensor_symbol_t scalar_mul_output = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
2205 ccv_nnc_graph_exec_symbol_new(graph, scalar_mul, TENSOR_SYMBOL_LIST(inputs[0])(const ccv_nnc_tensor_symbol_t []){inputs[0]}, (1 +1 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(scalar_mul_output)(const ccv_nnc_tensor_symbol_t []){scalar_mul_output}, (1 +1 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
-1)
, "scalar_mul");
2206 outputs[0] = scalar_mul_output;
2207}
2208
2209static ccv_cnnp_model_t* _ccv_cnnp_scalar_mul_copy(const ccv_cnnp_model_t* const super, void* const context);
2210
2211static const ccv_cnnp_model_vtab_t ccv_cnnp_scalar_mul_isa = {
2212 .build = _ccv_cnnp_scalar_mul_build,
2213 .copy = _ccv_cnnp_scalar_mul_copy,
2214};
2215
2216ccv_cnnp_model_t* ccv_cnnp_scalar_mul(const float a, const char* const name)
2217{
2218 ccv_cnnp_model_scalar_mul_t* const model_scalar_mul = (ccv_cnnp_model_scalar_mul_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_scalar_mul_t));
2219 model_scalar_mul->super.isa = &ccv_cnnp_scalar_mul_isa;
2220 model_scalar_mul->super.input_size = 1;
2221 model_scalar_mul->super.outputs = &model_scalar_mul->output;
2222 model_scalar_mul->super.output_size = 1;
2223 model_scalar_mul->a = a;
2224 ccv_cnnp_model_copy_name(&model_scalar_mul->super, name);
2225 return (ccv_cnnp_model_t*)model_scalar_mul;
2226}
2227
2228static ccv_cnnp_model_t* _ccv_cnnp_scalar_mul_copy(const ccv_cnnp_model_t* const super, void* const context)
2229{
2230 const ccv_cnnp_model_scalar_mul_t* const self = (const ccv_cnnp_model_scalar_mul_t*)super;
2231 return ccv_cnnp_scalar_mul(self->a, self->super.name);
2232}
2233
2234// MARK - Div Layer
2235
2236typedef struct {
2237 ccv_cnnp_model_t super;
2238 ccv_nnc_tensor_symbol_t output;
2239 int reciprocal;
2240} ccv_cnnp_model_div_t;
2241
2242static void _ccv_cnnp_div_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
2243{
2244 const ccv_cnnp_model_div_t* const self = (const ccv_cnnp_model_div_t*)super;
2245 PRINT(CCV_CLI_VERBOSE, "[cnnp_div_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_div_build] -\n"); fflush(stdout); } } while (
0)
;
2246 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 2246, __extension__ __PRETTY_FUNCTION__
); }))
;
2247 ccv_nnc_tensor_param_t input_params[2];
2248 int i;
2249 ccv_nnc_tensor_param_t output_params;
2250 const ccv_nnc_cmd_t div = CMD_EWDIV_FORWARD()ccv_nnc_cmd(CCV_NNC_EWDIV_FORWARD, 0, ccv_nnc_cmd_auto, 0);
2251 if (self->reciprocal)
2252 {
2253 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 2253, __extension__ __PRETTY_FUNCTION__); }))
;
2254 input_params[0] = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
2255 input_params[1] = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
2256 ccv_nnc_hint_tensor_auto(div, input_params, 2, ccv_nnc_no_hint, &output_params, 1);
2257 outputs[0] = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
2258 ccv_nnc_graph_exec_symbol_new(graph, div, TENSOR_SYMBOL_LIST(NO_TENSOR_SYMBOL, inputs[0])(const ccv_nnc_tensor_symbol_t []){(const ccv_nnc_tensor_symbol_t
){.d = CCV_NNC_NO_TENSOR_SYMBOL}, inputs[0]}, (1 +1 +1 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, outputs, output_size, "div");
2259 } else {
2260 assert(input_size == 2)((void) sizeof ((input_size == 2) ? 1 : 0), __extension__ ({ if
(input_size == 2) ; else __assert_fail ("input_size == 2", "ccv_cnnp_model_addons.c"
, 2260, __extension__ __PRETTY_FUNCTION__); }))
;
2261 for (i = 0; i < 2; i++)
2262 input_params[i] = ccv_nnc_tensor_symbol_params(graph, inputs[i]);
2263 ccv_nnc_hint_tensor_auto(div, input_params, input_size, ccv_nnc_no_hint, &output_params, 1);
2264 outputs[0] = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
2265 ccv_nnc_graph_exec_symbol_new(graph, div, inputs, input_size, outputs, output_size, "div");
2266 }
2267}
2268
2269static ccv_cnnp_model_t* _ccv_cnnp_div_copy(const ccv_cnnp_model_t* const self, void* const context);
2270
2271static const ccv_cnnp_model_vtab_t ccv_cnnp_div_isa = {
2272 .build = _ccv_cnnp_div_build,
2273 .copy = _ccv_cnnp_div_copy,
2274};
2275
2276ccv_cnnp_model_t* ccv_cnnp_div(const int reciprocal, const char* const name)
2277{
2278 ccv_cnnp_model_div_t* const model_div = (ccv_cnnp_model_div_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_div_t));
2279 model_div->super.isa = &ccv_cnnp_div_isa;
2280 model_div->super.input_size = reciprocal ? 1 : 2;
2281 model_div->super.outputs = &model_div->output;
2282 model_div->super.output_size = 1;
2283 model_div->reciprocal = reciprocal;
2284 ccv_cnnp_model_copy_name(&model_div->super, name);
2285 return (ccv_cnnp_model_t*)model_div;
2286}
2287
2288static ccv_cnnp_model_t* _ccv_cnnp_div_copy(const ccv_cnnp_model_t* const super, void* const context)
2289{
2290 const ccv_cnnp_model_div_t* const self = (const ccv_cnnp_model_div_t*)super;
2291 return ccv_cnnp_div(self->reciprocal, self->super.name);
2292}
2293
2294// MARK - Sqrt Layer
2295
2296typedef struct {
2297 ccv_cnnp_model_t super;
2298 ccv_nnc_tensor_symbol_t output;
2299} ccv_cnnp_model_sqrt_t;
2300
2301static void _ccv_cnnp_sqrt_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
2302{
2303 PRINT(CCV_CLI_VERBOSE, "[cnnp_sqrt_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_sqrt_build] -\n"); fflush(stdout); } } while
(0)
;
2304 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 2304, __extension__ __PRETTY_FUNCTION__
); }))
;
2305 ccv_nnc_tensor_param_t input_params[1];
2306 ccv_nnc_tensor_param_t output_params;
2307 const ccv_nnc_cmd_t sqrt = CMD_EWSQRT_FORWARD()ccv_nnc_cmd(CCV_NNC_EWSQRT_FORWARD, 0, ccv_nnc_cmd_auto, 0);
2308 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 2308, __extension__ __PRETTY_FUNCTION__); }))
;
2309 input_params[0] = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
2310 ccv_nnc_hint_tensor_auto(sqrt, input_params, 1, ccv_nnc_no_hint, &output_params, 1);
2311 outputs[0] = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
2312 ccv_nnc_graph_exec_symbol_new(graph, sqrt, inputs, 1, outputs, output_size, "sqrt");
2313}
2314
2315static ccv_cnnp_model_t* _ccv_cnnp_sqrt_copy(const ccv_cnnp_model_t* const self, void* const context);
2316
2317static const ccv_cnnp_model_vtab_t ccv_cnnp_sqrt_isa = {
2318 .build = _ccv_cnnp_sqrt_build,
2319 .copy = _ccv_cnnp_sqrt_copy,
2320};
2321
2322ccv_cnnp_model_t* ccv_cnnp_sqrt(const char* const name)
2323{
2324 ccv_cnnp_model_sqrt_t* const model_sqrt = (ccv_cnnp_model_sqrt_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_sqrt_t));
2325 model_sqrt->super.isa = &ccv_cnnp_sqrt_isa;
2326 model_sqrt->super.input_size = 1;
2327 model_sqrt->super.outputs = &model_sqrt->output;
2328 model_sqrt->super.output_size = 1;
2329 ccv_cnnp_model_copy_name(&model_sqrt->super, name);
2330 return (ccv_cnnp_model_t*)model_sqrt;
2331}
2332
2333static ccv_cnnp_model_t* _ccv_cnnp_sqrt_copy(const ccv_cnnp_model_t* const super, void* const context)
2334{
2335 const ccv_cnnp_model_sqrt_t* const self = (const ccv_cnnp_model_sqrt_t*)super;
2336 return ccv_cnnp_sqrt(self->super.name);
2337}
2338
2339// MARK - Log Layer
2340
2341typedef struct {
2342 ccv_cnnp_model_t super;
2343 ccv_nnc_tensor_symbol_t output;
2344} ccv_cnnp_model_log_t;
2345
2346static void _ccv_cnnp_log_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
2347{
2348 PRINT(CCV_CLI_VERBOSE, "[cnnp_log_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_log_build] -\n"); fflush(stdout); } } while (
0)
;
2349 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 2349, __extension__ __PRETTY_FUNCTION__
); }))
;
2350 ccv_nnc_tensor_param_t input_params[1];
2351 ccv_nnc_tensor_param_t output_params;
2352 const ccv_nnc_cmd_t log = CMD_EWLOG_FORWARD()ccv_nnc_cmd(CCV_NNC_EWLOG_FORWARD, 0, ccv_nnc_cmd_auto, 0);
2353 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 2353, __extension__ __PRETTY_FUNCTION__); }))
;
2354 input_params[0] = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
2355 ccv_nnc_hint_tensor_auto(log, input_params, 1, ccv_nnc_no_hint, &output_params, 1);
2356 outputs[0] = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
2357 ccv_nnc_graph_exec_symbol_new(graph, log, inputs, 1, outputs, output_size, "log");
2358}
2359
2360static ccv_cnnp_model_t* _ccv_cnnp_log_copy(const ccv_cnnp_model_t* const self, void* const context);
2361
2362static const ccv_cnnp_model_vtab_t ccv_cnnp_log_isa = {
2363 .build = _ccv_cnnp_log_build,
2364 .copy = _ccv_cnnp_log_copy,
2365};
2366
2367ccv_cnnp_model_t* ccv_cnnp_log(const char* const name)
2368{
2369 ccv_cnnp_model_log_t* const model_log = (ccv_cnnp_model_log_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_log_t));
2370 model_log->super.isa = &ccv_cnnp_log_isa;
2371 model_log->super.input_size = 1;
2372 model_log->super.outputs = &model_log->output;
2373 model_log->super.output_size = 1;
2374 ccv_cnnp_model_copy_name(&model_log->super, name);
2375 return (ccv_cnnp_model_t*)model_log;
2376}
2377
2378static ccv_cnnp_model_t* _ccv_cnnp_log_copy(const ccv_cnnp_model_t* const super, void* const context)
2379{
2380 return ccv_cnnp_log(super->name);
2381}
2382
2383// MARK - Pow Layer
2384
2385typedef struct {
2386 ccv_cnnp_model_t super;
2387 ccv_nnc_tensor_symbol_t output;
2388 ccv_nnc_cmd_param_t params;
2389} ccv_cnnp_model_pow_t;
2390
2391static void _ccv_cnnp_pow_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
2392{
2393 ccv_cnnp_model_pow_t* const self = (ccv_cnnp_model_pow_t*)super;
2394 PRINT(CCV_CLI_VERBOSE, "[cnnp_pow_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_pow_build] -\n"); fflush(stdout); } } while (
0)
;
2395 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 2395, __extension__ __PRETTY_FUNCTION__); }))
;
2396 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 2396, __extension__ __PRETTY_FUNCTION__
); }))
;
2397 ccv_nnc_tensor_param_t input_params[1];
2398 input_params[0] = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
2399 ccv_nnc_tensor_param_t output_params;
2400 const ccv_nnc_cmd_t pow = ccv_nnc_cmd(CCV_NNC_EWPOW_FORWARD, 0, self->params, 0);
2401 ccv_nnc_hint_tensor_auto(pow, input_params, 1, ccv_nnc_no_hint, &output_params, 1);
2402 outputs[0] = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
2403 ccv_nnc_graph_exec_symbol_new(graph, pow, inputs, input_size, outputs, output_size, "pow");
2404}
2405
2406static ccv_cnnp_model_t* _ccv_cnnp_pow_copy(const ccv_cnnp_model_t* const self, void* const context);
2407
2408static const ccv_cnnp_model_vtab_t ccv_cnnp_pow_isa = {
2409 .build = _ccv_cnnp_pow_build,
2410 .copy = _ccv_cnnp_pow_copy,
2411};
2412
2413ccv_cnnp_model_t* ccv_cnnp_pow(const float exponent, const char* const name)
2414{
2415 ccv_cnnp_model_pow_t* const model_pow = (ccv_cnnp_model_pow_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_pow_t));
2416 model_pow->super.isa = &ccv_cnnp_pow_isa;
2417 model_pow->super.input_size = 1;
2418 model_pow->super.outputs = &model_pow->output;
2419 model_pow->super.output_size = 1;
2420 model_pow->params = (ccv_nnc_cmd_param_t){
2421 .size = {
2422 .dim = { 1, 1, 1 }
2423 },
2424 .pow = {
2425 .exponent = exponent,
2426 },
2427 };
2428 ccv_cnnp_model_copy_name(&model_pow->super, name);
2429 return (ccv_cnnp_model_t*)model_pow;
2430}
2431
2432static ccv_cnnp_model_t* _ccv_cnnp_pow_copy(const ccv_cnnp_model_t* const super, void* const context)
2433{
2434 const ccv_cnnp_model_pow_t* const self = (const ccv_cnnp_model_pow_t*)super;
2435 return ccv_cnnp_pow(self->params.pow.exponent, super->name);
2436}
2437
2438// MARK - Sin Layer
2439
2440typedef struct {
2441 ccv_cnnp_model_t super;
2442 ccv_nnc_tensor_symbol_t output;
2443} ccv_cnnp_model_sin_t;
2444
2445static void _ccv_cnnp_sin_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
2446{
2447 PRINT(CCV_CLI_VERBOSE, "[cnnp_sin_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_sin_build] -\n"); fflush(stdout); } } while (
0)
;
2448 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 2448, __extension__ __PRETTY_FUNCTION__
); }))
;
2449 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 2449, __extension__ __PRETTY_FUNCTION__); }))
;
2450 ccv_nnc_tensor_param_t input_params[1];
2451 ccv_nnc_tensor_param_t output_params;
2452 const ccv_nnc_cmd_t sin = CMD_EWSIN_FORWARD()ccv_nnc_cmd(CCV_NNC_EWSIN_FORWARD, 0, ccv_nnc_cmd_auto, 0);
2453 input_params[0] = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
2454 ccv_nnc_hint_tensor_auto(sin, input_params, 1, ccv_nnc_no_hint, &output_params, 1);
2455 outputs[0] = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
2456 ccv_nnc_graph_exec_symbol_new(graph, sin, inputs, 1, outputs, output_size, "sin");
2457}
2458
2459static ccv_cnnp_model_t* _ccv_cnnp_sin_copy(const ccv_cnnp_model_t* const self, void* const context);
2460
2461static const ccv_cnnp_model_vtab_t ccv_cnnp_sin_isa = {
2462 .build = _ccv_cnnp_sin_build,
2463 .copy = _ccv_cnnp_sin_copy,
2464};
2465
2466ccv_cnnp_model_t* ccv_cnnp_sin(const char* const name)
2467{
2468 ccv_cnnp_model_sin_t* const model_sin = (ccv_cnnp_model_sin_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_sin_t));
2469 model_sin->super.isa = &ccv_cnnp_sin_isa;
2470 model_sin->super.input_size = 1;
2471 model_sin->super.outputs = &model_sin->output;
2472 model_sin->super.output_size = 1;
2473 ccv_cnnp_model_copy_name(&model_sin->super, name);
2474 return (ccv_cnnp_model_t*)model_sin;
2475}
2476
2477static ccv_cnnp_model_t* _ccv_cnnp_sin_copy(const ccv_cnnp_model_t* const super, void* const context)
2478{
2479 return ccv_cnnp_sin(super->name);
2480}
2481
2482// MARK - Cos Layer
2483
2484typedef struct {
2485 ccv_cnnp_model_t super;
2486 ccv_nnc_tensor_symbol_t output;
2487} ccv_cnnp_model_cos_t;
2488
2489static void _ccv_cnnp_cos_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
2490{
2491 PRINT(CCV_CLI_VERBOSE, "[cnnp_cos_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_cos_build] -\n"); fflush(stdout); } } while (
0)
;
2492 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 2492, __extension__ __PRETTY_FUNCTION__
); }))
;
2493 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 2493, __extension__ __PRETTY_FUNCTION__); }))
;
2494 ccv_nnc_tensor_param_t input_params[1];
2495 ccv_nnc_tensor_param_t output_params;
2496 const ccv_nnc_cmd_t cos = CMD_EWCOS_FORWARD()ccv_nnc_cmd(CCV_NNC_EWCOS_FORWARD, 0, ccv_nnc_cmd_auto, 0);
2497 input_params[0] = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
2498 ccv_nnc_hint_tensor_auto(cos, input_params, 1, ccv_nnc_no_hint, &output_params, 1);
2499 outputs[0] = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
2500 ccv_nnc_graph_exec_symbol_new(graph, cos, inputs, 1, outputs, output_size, "cos");
2501}
2502
2503static ccv_cnnp_model_t* _ccv_cnnp_cos_copy(const ccv_cnnp_model_t* const self, void* const context);
2504
2505static const ccv_cnnp_model_vtab_t ccv_cnnp_cos_isa = {
2506 .build = _ccv_cnnp_cos_build,
2507 .copy = _ccv_cnnp_cos_copy,
2508};
2509
2510ccv_cnnp_model_t* ccv_cnnp_cos(const char* const name)
2511{
2512 ccv_cnnp_model_cos_t* const model_cos = (ccv_cnnp_model_cos_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_cos_t));
2513 model_cos->super.isa = &ccv_cnnp_cos_isa;
2514 model_cos->super.input_size = 1;
2515 model_cos->super.outputs = &model_cos->output;
2516 model_cos->super.output_size = 1;
2517 ccv_cnnp_model_copy_name(&model_cos->super, name);
2518 return (ccv_cnnp_model_t*)model_cos;
2519}
2520
2521static ccv_cnnp_model_t* _ccv_cnnp_cos_copy(const ccv_cnnp_model_t* const super, void* const context)
2522{
2523 return ccv_cnnp_cos(super->name);
2524}
2525
2526// MARK - Rotate Half Layer
2527
2528typedef struct {
2529 ccv_cnnp_model_t super;
2530 ccv_nnc_tensor_symbol_t output;
2531} ccv_cnnp_model_rotate_half_t;
2532
2533static void _ccv_cnnp_rotate_half_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
2534{
2535 PRINT(CCV_CLI_VERBOSE, "[cnnp_rotate_half_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_rotate_half_build] -\n"); fflush(stdout); } }
while (0)
;
2536 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 2536, __extension__ __PRETTY_FUNCTION__); }))
;
2537 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 2537, __extension__ __PRETTY_FUNCTION__
); }))
;
2538 ccv_nnc_tensor_param_t input_params[1];
2539 ccv_nnc_tensor_param_t output_params;
2540 const ccv_nnc_cmd_t rotate_half = CMD_ROTATE_HALF_FORWARD()ccv_nnc_cmd(CCV_NNC_ROTATE_HALF_FORWARD, 0, (ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}}}, 0)
;
2541 input_params[0] = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
2542 ccv_nnc_hint_tensor_auto(rotate_half, input_params, 1, ccv_nnc_no_hint, &output_params, 1);
2543 outputs[0] = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
2544 ccv_nnc_graph_exec_symbol_new(graph, rotate_half, inputs, 1, outputs, output_size, "rotate_half");
2545}
2546
2547static ccv_cnnp_model_t* _ccv_cnnp_rotate_half_copy(const ccv_cnnp_model_t* const self, void* const context);
2548
2549static const ccv_cnnp_model_vtab_t ccv_cnnp_rotate_half_isa = {
2550 .build = _ccv_cnnp_rotate_half_build,
2551 .copy = _ccv_cnnp_rotate_half_copy,
2552};
2553
2554ccv_cnnp_model_t* ccv_cnnp_rotate_half(const char* const name)
2555{
2556 ccv_cnnp_model_rotate_half_t* const model_rotate_half = (ccv_cnnp_model_rotate_half_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_rotate_half_t));
2557 model_rotate_half->super.isa = &ccv_cnnp_rotate_half_isa;
2558 model_rotate_half->super.input_size = 1;
2559 model_rotate_half->super.outputs = &model_rotate_half->output;
2560 model_rotate_half->super.output_size = 1;
2561 ccv_cnnp_model_copy_name(&model_rotate_half->super, name);
2562 return (ccv_cnnp_model_t*)model_rotate_half;
2563}
2564
2565static ccv_cnnp_model_t* _ccv_cnnp_rotate_half_copy(const ccv_cnnp_model_t* const super, void* const context)
2566{
2567 return ccv_cnnp_rotate_half(super->name);
2568}
2569
2570// MARK - Walsh-Hadamard Transform Layer
2571
2572typedef struct {
2573 ccv_cnnp_model_t super;
2574 ccv_nnc_tensor_symbol_t output;
2575 float scale;
2576} ccv_cnnp_model_walsh_hadamard_transform_t;
2577
2578static void _ccv_cnnp_walsh_hadamard_transform_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
2579{
2580 PRINT(CCV_CLI_VERBOSE, "[cnnp_walsh_hadamard_transform_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_walsh_hadamard_transform_build] -\n"); fflush
(stdout); } } while (0)
;
2581 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 2581, __extension__ __PRETTY_FUNCTION__); }))
;
2582 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 2582, __extension__ __PRETTY_FUNCTION__
); }))
;
2583 const ccv_cnnp_model_walsh_hadamard_transform_t* const self = (const ccv_cnnp_model_walsh_hadamard_transform_t*)super;
2584 ccv_nnc_tensor_param_t input_params[1];
2585 ccv_nnc_tensor_param_t output_params;
2586 const ccv_nnc_cmd_t walsh_hadamard_transform = CMD_WALSH_HADAMARD_TRANSFORM_FORWARD(self->scale)ccv_nnc_cmd(CCV_NNC_WALSH_HADAMARD_TRANSFORM_FORWARD, 0, ((ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.walsh_hadamard_transform={.scale=(self
->scale)}}), 0)
;
2587 input_params[0] = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
2588 ccv_nnc_hint_tensor_auto(walsh_hadamard_transform, input_params, 1, ccv_nnc_no_hint, &output_params, 1);
2589 outputs[0] = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
2590 ccv_nnc_graph_exec_symbol_new(graph, walsh_hadamard_transform, inputs, 1, outputs, output_size, "walsh_hadamard_transform");
2591}
2592
2593static ccv_cnnp_model_t* _ccv_cnnp_walsh_hadamard_transform_copy(const ccv_cnnp_model_t* const self, void* const context);
2594
2595static const ccv_cnnp_model_vtab_t ccv_cnnp_walsh_hadamard_transform_isa = {
2596 .build = _ccv_cnnp_walsh_hadamard_transform_build,
2597 .copy = _ccv_cnnp_walsh_hadamard_transform_copy,
2598};
2599
2600ccv_cnnp_model_t* ccv_cnnp_walsh_hadamard_transform(const float scale, const char* const name)
2601{
2602 ccv_cnnp_model_walsh_hadamard_transform_t* const model_walsh_hadamard_transform = (ccv_cnnp_model_walsh_hadamard_transform_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_walsh_hadamard_transform_t));
2603 model_walsh_hadamard_transform->super.isa = &ccv_cnnp_walsh_hadamard_transform_isa;
2604 model_walsh_hadamard_transform->super.input_size = 1;
2605 model_walsh_hadamard_transform->super.outputs = &model_walsh_hadamard_transform->output;
2606 model_walsh_hadamard_transform->super.output_size = 1;
2607 model_walsh_hadamard_transform->scale = scale;
2608 ccv_cnnp_model_copy_name(&model_walsh_hadamard_transform->super, name);
2609 return (ccv_cnnp_model_t*)model_walsh_hadamard_transform;
2610}
2611
2612static ccv_cnnp_model_t* _ccv_cnnp_walsh_hadamard_transform_copy(const ccv_cnnp_model_t* const super, void* const context)
2613{
2614 const ccv_cnnp_model_walsh_hadamard_transform_t* const self = (const ccv_cnnp_model_walsh_hadamard_transform_t*)super;
2615 return ccv_cnnp_walsh_hadamard_transform(self->scale, self->super.name);
2616}
2617
2618// MARK - Gated Delta Layer
2619
2620typedef struct {
2621 ccv_cnnp_model_t super;
2622 ccv_nnc_tensor_symbol_t outputs[2];
2623 int log_decay;
2624} ccv_cnnp_model_gated_delta_t;
2625
2626static void _ccv_cnnp_gated_delta_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
2627{
2628 PRINT(CCV_CLI_VERBOSE, "[cnnp_gated_delta_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_gated_delta_build] -\n"); fflush(stdout); } }
while (0)
;
2629 ccv_cnnp_model_gated_delta_t* const self = (ccv_cnnp_model_gated_delta_t*)super;
2630 assert(input_size == 6)((void) sizeof ((input_size == 6) ? 1 : 0), __extension__ ({ if
(input_size == 6) ; else __assert_fail ("input_size == 6", "ccv_cnnp_model_addons.c"
, 2630, __extension__ __PRETTY_FUNCTION__); }))
;
2631 assert(output_size == 2)((void) sizeof ((output_size == 2) ? 1 : 0), __extension__ ({
if (output_size == 2) ; else __assert_fail ("output_size == 2"
, "ccv_cnnp_model_addons.c", 2631, __extension__ __PRETTY_FUNCTION__
); }))
;
2632 ccv_nnc_tensor_param_t input_params[6];
2633 int i;
2634 for (i = 0; i < 6; i++)
2635 input_params[i] = ccv_nnc_tensor_symbol_params(graph, inputs[i]);
2636 ccv_nnc_tensor_param_t output_params[2];
2637 const ccv_nnc_cmd_t gated_delta = CMD_GATED_DELTA_FORWARD(self->log_decay)ccv_nnc_cmd(CCV_NNC_GATED_DELTA_FORWARD, 0, ((ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.gated_delta={.log_decay=(self->log_decay
)}}), 0)
;
2638 ccv_nnc_hint_tensor_auto(gated_delta, input_params, 6, ccv_nnc_no_hint, output_params, 2);
2639 for (i = 0; i < 2; i++)
2640 outputs[i] = ccv_nnc_tensor_symbol_new(graph, output_params[i], 0);
2641 ccv_nnc_graph_exec_symbol_new(graph, gated_delta, inputs, input_size, outputs, output_size, "gated_delta");
2642}
2643
2644static ccv_cnnp_model_t* _ccv_cnnp_gated_delta_copy(const ccv_cnnp_model_t* const self, void* const context);
2645
2646static const ccv_cnnp_model_vtab_t ccv_cnnp_gated_delta_isa = {
2647 .build = _ccv_cnnp_gated_delta_build,
2648 .copy = _ccv_cnnp_gated_delta_copy,
2649};
2650
2651ccv_cnnp_model_t* ccv_cnnp_gated_delta(const int log_decay, const char* const name)
2652{
2653 ccv_cnnp_model_gated_delta_t* const model_gated_delta = (ccv_cnnp_model_gated_delta_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_gated_delta_t));
2654 model_gated_delta->super.isa = &ccv_cnnp_gated_delta_isa;
2655 model_gated_delta->super.input_size = 6;
2656 model_gated_delta->super.outputs = model_gated_delta->outputs;
2657 model_gated_delta->super.output_size = 2;
2658 model_gated_delta->log_decay = log_decay;
2659 ccv_cnnp_model_copy_name(&model_gated_delta->super, name);
2660 return (ccv_cnnp_model_t*)model_gated_delta;
2661}
2662
2663static ccv_cnnp_model_t* _ccv_cnnp_gated_delta_copy(const ccv_cnnp_model_t* const super, void* const context)
2664{
2665 const ccv_cnnp_model_gated_delta_t* const self = (const ccv_cnnp_model_gated_delta_t*)super;
2666 return ccv_cnnp_gated_delta(self->log_decay, super->name);
2667}
2668
2669// MARK - Cmul Layer
2670
2671typedef struct {
2672 ccv_cnnp_model_t super;
2673 ccv_nnc_tensor_symbol_t output;
2674} ccv_cnnp_model_cmul_t;
2675
2676static void _ccv_cnnp_cmul_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
2677{
2678 PRINT(CCV_CLI_VERBOSE, "[cnnp_cmul_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_cmul_build] -\n"); fflush(stdout); } } while
(0)
;
2679 assert(input_size == 2)((void) sizeof ((input_size == 2) ? 1 : 0), __extension__ ({ if
(input_size == 2) ; else __assert_fail ("input_size == 2", "ccv_cnnp_model_addons.c"
, 2679, __extension__ __PRETTY_FUNCTION__); }))
;
2680 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 2680, __extension__ __PRETTY_FUNCTION__
); }))
;
2681 ccv_nnc_tensor_param_t input_params[2];
2682 int i;
2683 for (i = 0; i < 2; i++)
2684 input_params[i] = ccv_nnc_tensor_symbol_params(graph, inputs[i]);
2685 ccv_nnc_tensor_param_t output_params;
2686 const ccv_nnc_cmd_t mul = CMD_CMUL_FORWARD()ccv_nnc_cmd(CCV_NNC_CMUL_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}}}, 0)
;
2687 ccv_nnc_hint_tensor_auto(mul, input_params, 2, ccv_nnc_no_hint, &output_params, 1);
2688 outputs[0] = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
2689 ccv_nnc_graph_exec_symbol_new(graph, mul, inputs, input_size, outputs, output_size, "cmul");
2690}
2691
2692static ccv_cnnp_model_t* _ccv_cnnp_cmul_copy(const ccv_cnnp_model_t* const self, void* const context);
2693
2694static const ccv_cnnp_model_vtab_t ccv_cnnp_cmul_isa = {
2695 .build = _ccv_cnnp_cmul_build,
2696 .copy = _ccv_cnnp_cmul_copy,
2697};
2698
2699ccv_cnnp_model_t* ccv_cnnp_cmul(const char* const name)
2700{
2701 ccv_cnnp_model_cmul_t* const model_cmul = (ccv_cnnp_model_cmul_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_cmul_t));
2702 model_cmul->super.isa = &ccv_cnnp_cmul_isa;
2703 model_cmul->super.input_size = 2;
2704 model_cmul->super.outputs = &model_cmul->output;
2705 model_cmul->super.output_size = 1;
2706 ccv_cnnp_model_copy_name(&model_cmul->super, name);
2707 return (ccv_cnnp_model_t*)model_cmul;
2708}
2709
2710static ccv_cnnp_model_t* _ccv_cnnp_cmul_copy(const ccv_cnnp_model_t* const super, void* const context)
2711{
2712 return ccv_cnnp_cmul(super->name);
2713}
2714
2715// MARK - Transpose Layer
2716
2717typedef struct {
2718 ccv_cnnp_model_t super;
2719 ccv_nnc_tensor_symbol_t output;
2720 int transpose[2];
2721} ccv_cnnp_model_transpose_t;
2722
2723static void _ccv_cnnp_transpose_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
2724{
2725 ccv_cnnp_model_transpose_t* const self = (ccv_cnnp_model_transpose_t*)super;
2726 PRINT(CCV_CLI_VERBOSE, "[cnnp_transpose_build] (%d, %d)\n", self->transpose[0], self->transpose[1])do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_transpose_build] (%d, %d)\n", self->transpose
[0], self->transpose[1]); fflush(stdout); } } while (0)
;
2727 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 2727, __extension__ __PRETTY_FUNCTION__); }))
;
2728 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 2728, __extension__ __PRETTY_FUNCTION__
); }))
;
2729 if (self->transpose[0] == self->transpose[1])
2730 {
2731 outputs[0] = inputs[0];
2732 return;
2733 }
2734 ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
2735 ccv_nnc_tensor_param_t output_params;
2736 const ccv_nnc_cmd_t transpose = CMD_TRANSPOSE_FORWARD(self->transpose[0], self->transpose[1])ccv_nnc_cmd(CCV_NNC_TRANSPOSE_FORWARD, 0, ((ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.transpose={.axis={self->transpose[
0], self->transpose[1]}}}), 0)
;
2737 ccv_nnc_hint_tensor_auto(transpose, (ccv_nnc_tensor_param_t []){
2738 params,
2739 }, 1, ccv_nnc_no_hint, &output_params, 1);
2740 const ccv_nnc_tensor_symbol_t transpose_output = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
2741 ccv_nnc_graph_exec_symbol_new(graph, transpose, TENSOR_SYMBOL_LIST(inputs[0])(const ccv_nnc_tensor_symbol_t []){inputs[0]}, (1 +1 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(transpose_output)(const ccv_nnc_tensor_symbol_t []){transpose_output}, (1 +1 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
-1)
, "transpose");
2742 outputs[0] = transpose_output;
2743}
2744
2745static ccv_cnnp_model_t* _ccv_cnnp_transpose_copy(const ccv_cnnp_model_t* const super, void* const context);
2746
2747static const ccv_cnnp_model_vtab_t ccv_cnnp_transpose_isa = {
2748 .build = _ccv_cnnp_transpose_build,
2749 .copy = _ccv_cnnp_transpose_copy,
2750};
2751
2752ccv_cnnp_model_t* ccv_cnnp_transpose(const int axis_a, const int axis_b, const char* const name)
2753{
2754 ccv_cnnp_model_transpose_t* const model_transpose = (ccv_cnnp_model_transpose_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_transpose_t));
2755 model_transpose->super.isa = &ccv_cnnp_transpose_isa;
2756 model_transpose->super.input_size = 1;
2757 model_transpose->super.outputs = &model_transpose->output;
2758 model_transpose->super.output_size = 1;
2759 model_transpose->transpose[0] = axis_a;
2760 model_transpose->transpose[1] = axis_b;
2761 ccv_cnnp_model_copy_name(&model_transpose->super, name);
2762 return (ccv_cnnp_model_t*)model_transpose;
2763}
2764
2765static ccv_cnnp_model_t* _ccv_cnnp_transpose_copy(const ccv_cnnp_model_t* const super, void* const context)
2766{
2767 const ccv_cnnp_model_transpose_t* const self = (const ccv_cnnp_model_transpose_t*)super;
2768 return ccv_cnnp_transpose(self->transpose[0], self->transpose[1], self->super.name);
2769}
2770
2771// MARK - Layer Norm Layer
2772
2773typedef struct {
2774 ccv_cnnp_model_t super;
2775 ccv_nnc_tensor_symbol_t output;
2776 ccv_nnc_tensor_symbol_t bias;
2777 ccv_nnc_tensor_symbol_t scale;
2778 ccv_nnc_cmd_param_t params;
2779} ccv_cnnp_model_layer_norm_t;
2780
2781static void _ccv_cnnp_layer_norm_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
2782{
2783 PRINT(CCV_CLI_VERBOSE, "[cnnp_layer_norm_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_layer_norm_build] -\n"); fflush(stdout); } }
while (0)
;
2784 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 2784, __extension__ __PRETTY_FUNCTION__); }))
;
2785 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 2785, __extension__ __PRETTY_FUNCTION__
); }))
;
2786 ccv_cnnp_model_layer_norm_t* const self = (ccv_cnnp_model_layer_norm_t*)super;
2787 const ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
2788 ccv_nnc_tensor_param_t bias_params = params;
2789 const int nd = ccv_nnc_tensor_nd(params.dim);
2790 int i;
2791 for (i = 0; i < nd; i++)
2792 bias_params.dim[i] = 1;
2793 for (i = 0; i < self->params.lnorm.count; i++)
2794 bias_params.dim[self->params.lnorm.axis[i]] = params.dim[self->params.lnorm.axis[i]];
2795 if (self->params.lnorm.elementwise_affine)
2796 {
2797 // Both scale and bias are shared between if this model is reused.
2798 if (!self->scale.graph)
2799 self->scale = ccv_nnc_tensor_symbol_new(graph, bias_params, "scale");
2800 if (!self->bias.graph)
2801 self->bias = ccv_nnc_tensor_symbol_new(graph, bias_params, "bias");
2802 }
2803 const ccv_nnc_tensor_symbol_t scale = self->params.lnorm.elementwise_affine ? ccv_cnnp_model_get_symbol(super, self->scale) : NO_TENSOR_SYMBOL(const ccv_nnc_tensor_symbol_t){.d = CCV_NNC_NO_TENSOR_SYMBOL
}
;
2804 const ccv_nnc_tensor_symbol_t bias = self->params.lnorm.elementwise_affine ? ccv_cnnp_model_get_symbol(super, self->bias) : NO_TENSOR_SYMBOL(const ccv_nnc_tensor_symbol_t){.d = CCV_NNC_NO_TENSOR_SYMBOL
}
;
2805 const ccv_nnc_cmd_t layer_norm = ccv_nnc_cmd(CCV_NNC_LAYER_NORM_FORWARD, 0, self->params, 0);
2806 ccv_nnc_tensor_param_t output_params[3];
2807 if (self->params.lnorm.elementwise_affine)
2808 ccv_nnc_hint_tensor_auto(layer_norm, (ccv_nnc_tensor_param_t []){
2809 params,
2810 bias_params,
2811 bias_params,
2812 }, 3, ccv_nnc_no_hint, output_params, 3);
2813 else
2814 ccv_nnc_hint_tensor_auto(layer_norm, (ccv_nnc_tensor_param_t []){
2815 params,
2816 }, 1, ccv_nnc_no_hint, output_params, 3);
2817 const ccv_nnc_tensor_symbol_t output = ccv_nnc_tensor_symbol_new(graph, output_params[0], 0);
2818 const ccv_nnc_tensor_symbol_t saved_mean = ccv_nnc_tensor_symbol_new(graph, output_params[1], "saved_mean");
2819 const ccv_nnc_tensor_symbol_t saved_inv_std = ccv_nnc_tensor_symbol_new(graph, output_params[2], "saved_inv_std");
2820 if (self->params.lnorm.elementwise_affine)
2821 ccv_nnc_graph_exec_symbol_new(graph, layer_norm, TENSOR_SYMBOL_LIST(inputs[0], scale, bias)(const ccv_nnc_tensor_symbol_t []){inputs[0], scale, bias}, (
1 +1 +1 +1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 -1)
, TENSOR_SYMBOL_LIST(output, saved_mean, saved_inv_std)(const ccv_nnc_tensor_symbol_t []){output, saved_mean, saved_inv_std
}, (1 +1 +1 +1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 -1)
, "layer_norm");
2822 else
2823 ccv_nnc_graph_exec_symbol_new(graph, layer_norm, TENSOR_SYMBOL_LIST(inputs[0])(const ccv_nnc_tensor_symbol_t []){inputs[0]}, (1 +1 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(output, saved_mean, saved_inv_std)(const ccv_nnc_tensor_symbol_t []){output, saved_mean, saved_inv_std
}, (1 +1 +1 +1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 -1)
, "layer_norm");
2824 outputs[0] = output;
2825}
2826
2827static void _ccv_cnnp_layer_norm_init_states(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_cnnp_state_initializer_f initializer, void* const context)
2828{
2829 ccv_cnnp_model_layer_norm_t* const self = (ccv_cnnp_model_layer_norm_t*)super;
2830 if (self->scale.graph)
2831 initializer(context, CMD_SET_FORWARD(1)ccv_nnc_cmd(CCV_NNC_SET_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={1,}}}, 0)
, ccv_nnc_no_hint, 0, 0, self->scale);
2832 if (self->bias.graph)
2833 initializer(context, CMD_SET_FORWARD(0)ccv_nnc_cmd(CCV_NNC_SET_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={0,}}}, 0)
, ccv_nnc_no_hint, 0, 0, self->bias);
2834}
2835
2836static void _ccv_cnnp_layer_norm_add_to_parameter(ccv_cnnp_model_t* const super, const ccv_cnnp_add_to_array_f add_to_array, void* const parameters, const int is_trainable)
2837{
2838 ccv_cnnp_model_layer_norm_t* const self = (ccv_cnnp_model_layer_norm_t*)super;
2839 if (self->scale.graph)
2840 add_to_array(parameters, self->scale, is_trainable);
2841 if (self->bias.graph)
2842 add_to_array(parameters, self->bias, is_trainable);
2843}
2844
2845static ccv_cnnp_model_t* _ccv_cnnp_layer_norm_copy(const ccv_cnnp_model_t* const super, void* const context);
2846
2847static const ccv_cnnp_model_vtab_t ccv_cnnp_layer_norm_isa = {
2848 .build = _ccv_cnnp_layer_norm_build,
2849 .init_states = _ccv_cnnp_layer_norm_init_states,
2850 .add_to_parameter = _ccv_cnnp_layer_norm_add_to_parameter,
2851 .copy = _ccv_cnnp_layer_norm_copy,
2852};
2853
2854ccv_cnnp_model_t* ccv_cnnp_layer_norm(const float epsilon, const int axis[CCV_NNC_MAX_DIM_ALLOC(12)], const int axis_count, const int elementwise_affine, const float scale, const int is_trainable, const char* const name)
2855{
2856 ccv_cnnp_model_layer_norm_t* const model_layer_norm = (ccv_cnnp_model_layer_norm_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_layer_norm_t));
2857 model_layer_norm->super.isa = &ccv_cnnp_layer_norm_isa;
2858 model_layer_norm->super.input_size = 1;
2859 model_layer_norm->super.outputs = &model_layer_norm->output;
2860 model_layer_norm->super.output_size = 1;
2861 model_layer_norm->super.is_trainable = is_trainable;
2862 ccv_cnnp_model_copy_name(&model_layer_norm->super, name);
2863 model_layer_norm->scale.d = CCV_NNC_NO_TENSOR_SYMBOL;
2864 model_layer_norm->scale.graph = 0;
2865 model_layer_norm->bias.d = CCV_NNC_NO_TENSOR_SYMBOL;
2866 model_layer_norm->bias.graph = 0;
2867 model_layer_norm->params.lnorm.epsilon = epsilon;
2868 model_layer_norm->params.lnorm.scale = scale;
2869 model_layer_norm->params.lnorm.count = axis_count;
2870 model_layer_norm->params.lnorm.elementwise_affine = elementwise_affine;
2871 memcpy(model_layer_norm->params.lnorm.axis, axis, sizeof(int) * axis_count);
2872 return (ccv_cnnp_model_t*)model_layer_norm;
2873}
2874
2875static ccv_cnnp_model_t* _ccv_cnnp_layer_norm_copy(const ccv_cnnp_model_t* const super, void* const context)
2876{
2877 const ccv_cnnp_model_layer_norm_t* const self = (const ccv_cnnp_model_layer_norm_t*)super;
2878 return ccv_cnnp_layer_norm(self->params.lnorm.epsilon, self->params.lnorm.axis, self->params.lnorm.count, self->params.lnorm.elementwise_affine, self->params.lnorm.scale, self->super.is_trainable, self->super.name);
2879}
2880
2881// MARK - Group Norm Layer
2882
2883typedef struct {
2884 ccv_cnnp_model_t super;
2885 ccv_nnc_tensor_symbol_t output;
2886 ccv_nnc_tensor_symbol_t bias;
2887 ccv_nnc_tensor_symbol_t scale;
2888 ccv_nnc_cmd_param_t params;
2889} ccv_cnnp_model_group_norm_t;
2890
2891static void _ccv_cnnp_group_norm_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
2892{
2893 PRINT(CCV_CLI_VERBOSE, "[cnnp_group_norm_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_group_norm_build] -\n"); fflush(stdout); } }
while (0)
;
2894 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 2894, __extension__ __PRETTY_FUNCTION__); }))
;
2895 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 2895, __extension__ __PRETTY_FUNCTION__
); }))
;
2896 ccv_cnnp_model_group_norm_t* const self = (ccv_cnnp_model_group_norm_t*)super;
2897 const ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
2898 ccv_nnc_tensor_param_t bias_params = params;
2899 const int nd = ccv_nnc_tensor_nd(params.dim);
2900 int i;
2901 for (i = 0; i < nd; i++)
2902 bias_params.dim[i] = 1;
2903 bias_params.dim[self->params.gnorm.group_axis] = params.dim[self->params.gnorm.group_axis];
2904 if (self->params.gnorm.elementwise_affine)
2905 {
2906 // Both scale and bias are shared between if this model is reused.
2907 if (!self->scale.graph)
2908 self->scale = ccv_nnc_tensor_symbol_new(graph, bias_params, "scale");
2909 if (!self->bias.graph)
2910 self->bias = ccv_nnc_tensor_symbol_new(graph, bias_params, "bias");
2911 }
2912 const ccv_nnc_tensor_symbol_t scale = self->params.gnorm.elementwise_affine ? ccv_cnnp_model_get_symbol(super, self->scale) : NO_TENSOR_SYMBOL(const ccv_nnc_tensor_symbol_t){.d = CCV_NNC_NO_TENSOR_SYMBOL
}
;
2913 const ccv_nnc_tensor_symbol_t bias = self->params.gnorm.elementwise_affine ? ccv_cnnp_model_get_symbol(super, self->bias) : NO_TENSOR_SYMBOL(const ccv_nnc_tensor_symbol_t){.d = CCV_NNC_NO_TENSOR_SYMBOL
}
;
2914 const ccv_nnc_cmd_t group_norm = ccv_nnc_cmd(CCV_NNC_GROUP_NORM_FORWARD, 0, self->params, 0);
2915 ccv_nnc_tensor_param_t output_params[3];
2916 if (self->params.gnorm.elementwise_affine)
2917 ccv_nnc_hint_tensor_auto(group_norm, (ccv_nnc_tensor_param_t []){
2918 params,
2919 bias_params,
2920 bias_params,
2921 }, 3, ccv_nnc_no_hint, output_params, 3);
2922 else
2923 ccv_nnc_hint_tensor_auto(group_norm, (ccv_nnc_tensor_param_t []){
2924 params,
2925 }, 1, ccv_nnc_no_hint, output_params, 3);
2926 const ccv_nnc_tensor_symbol_t output = ccv_nnc_tensor_symbol_new(graph, output_params[0], 0);
2927 const ccv_nnc_tensor_symbol_t saved_mean = ccv_nnc_tensor_symbol_new(graph, output_params[1], "saved_mean");
2928 const ccv_nnc_tensor_symbol_t saved_inv_std = ccv_nnc_tensor_symbol_new(graph, output_params[2], "saved_inv_std");
2929 if (self->params.gnorm.elementwise_affine)
2930 ccv_nnc_graph_exec_symbol_new(graph, group_norm, TENSOR_SYMBOL_LIST(inputs[0], scale, bias)(const ccv_nnc_tensor_symbol_t []){inputs[0], scale, bias}, (
1 +1 +1 +1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 -1)
, TENSOR_SYMBOL_LIST(output, saved_mean, saved_inv_std)(const ccv_nnc_tensor_symbol_t []){output, saved_mean, saved_inv_std
}, (1 +1 +1 +1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 -1)
, "group_norm");
2931 else
2932 ccv_nnc_graph_exec_symbol_new(graph, group_norm, TENSOR_SYMBOL_LIST(inputs[0])(const ccv_nnc_tensor_symbol_t []){inputs[0]}, (1 +1 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(output, saved_mean, saved_inv_std)(const ccv_nnc_tensor_symbol_t []){output, saved_mean, saved_inv_std
}, (1 +1 +1 +1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 -1)
, "group_norm");
2933 outputs[0] = output;
2934}
2935
2936static void _ccv_cnnp_group_norm_init_states(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_cnnp_state_initializer_f initializer, void* const context)
2937{
2938 ccv_cnnp_model_group_norm_t* const self = (ccv_cnnp_model_group_norm_t*)super;
2939 if (self->scale.graph)
2940 initializer(context, CMD_SET_FORWARD(1)ccv_nnc_cmd(CCV_NNC_SET_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={1,}}}, 0)
, ccv_nnc_no_hint, 0, 0, self->scale);
2941 if (self->bias.graph)
2942 initializer(context, CMD_SET_FORWARD(0)ccv_nnc_cmd(CCV_NNC_SET_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={0,}}}, 0)
, ccv_nnc_no_hint, 0, 0, self->bias);
2943}
2944
2945static void _ccv_cnnp_group_norm_add_to_parameter(ccv_cnnp_model_t* const super, const ccv_cnnp_add_to_array_f add_to_array, void* const parameters, const int is_trainable)
2946{
2947 ccv_cnnp_model_group_norm_t* const self = (ccv_cnnp_model_group_norm_t*)super;
2948 if (self->scale.graph)
2949 add_to_array(parameters, self->scale, is_trainable);
2950 if (self->bias.graph)
2951 add_to_array(parameters, self->bias, is_trainable);
2952}
2953
2954static ccv_cnnp_model_t* _ccv_cnnp_group_norm_copy(const ccv_cnnp_model_t* const super, void* const context);
2955
2956static const ccv_cnnp_model_vtab_t ccv_cnnp_group_norm_isa = {
2957 .build = _ccv_cnnp_group_norm_build,
2958 .init_states = _ccv_cnnp_group_norm_init_states,
2959 .add_to_parameter = _ccv_cnnp_group_norm_add_to_parameter,
2960 .copy = _ccv_cnnp_group_norm_copy,
2961};
2962
2963ccv_cnnp_model_t* ccv_cnnp_group_norm(const int group_axis, const int groups, const float epsilon, const int reduce_axis[CCV_NNC_MAX_DIM_ALLOC(12)], const int axis_count, const int elementwise_affine, const int is_trainable, const char* const name)
2964{
2965 ccv_cnnp_model_group_norm_t* const model_group_norm = (ccv_cnnp_model_group_norm_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_group_norm_t));
2966 model_group_norm->super.isa = &ccv_cnnp_group_norm_isa;
2967 model_group_norm->super.input_size = 1;
2968 model_group_norm->super.outputs = &model_group_norm->output;
2969 model_group_norm->super.output_size = 1;
2970 model_group_norm->super.is_trainable = is_trainable;
2971 ccv_cnnp_model_copy_name(&model_group_norm->super, name);
2972 model_group_norm->scale.d = CCV_NNC_NO_TENSOR_SYMBOL;
2973 model_group_norm->scale.graph = 0;
2974 model_group_norm->bias.d = CCV_NNC_NO_TENSOR_SYMBOL;
2975 model_group_norm->bias.graph = 0;
2976 model_group_norm->params.gnorm.group_axis = group_axis;
2977 model_group_norm->params.gnorm.groups = groups;
2978 model_group_norm->params.gnorm.epsilon = epsilon;
2979 model_group_norm->params.gnorm.reduce_count = axis_count;
2980 model_group_norm->params.gnorm.elementwise_affine = elementwise_affine;
2981 memcpy(model_group_norm->params.gnorm.reduce_axis, reduce_axis, sizeof(int) * axis_count);
2982 return (ccv_cnnp_model_t*)model_group_norm;
2983}
2984
2985static ccv_cnnp_model_t* _ccv_cnnp_group_norm_copy(const ccv_cnnp_model_t* const super, void* const context)
2986{
2987 const ccv_cnnp_model_group_norm_t* const self = (const ccv_cnnp_model_group_norm_t*)super;
2988 return ccv_cnnp_group_norm(self->params.gnorm.group_axis, self->params.gnorm.groups, self->params.gnorm.epsilon, self->params.gnorm.reduce_axis, self->params.gnorm.reduce_count, self->params.gnorm.elementwise_affine, self->super.is_trainable, self->super.name);
2989}
2990
2991// MARK - RMSNorm Layer
2992
2993typedef struct {
2994 ccv_cnnp_model_t super;
2995 ccv_nnc_tensor_symbol_t output;
2996 ccv_nnc_tensor_symbol_t scale;
2997 ccv_nnc_cmd_param_t params;
2998} ccv_cnnp_model_rmsnorm_t;
2999
3000static void _ccv_cnnp_rmsnorm_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
3001{
3002 PRINT(CCV_CLI_VERBOSE, "[cnnp_rmsnorm_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_rmsnorm_build] -\n"); fflush(stdout); } } while
(0)
;
3003 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 3003, __extension__ __PRETTY_FUNCTION__); }))
;
3004 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 3004, __extension__ __PRETTY_FUNCTION__
); }))
;
3005 ccv_cnnp_model_rmsnorm_t* const self = (ccv_cnnp_model_rmsnorm_t*)super;
3006 const ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
3007 ccv_nnc_tensor_param_t scale_params = params;
3008 const int nd = ccv_nnc_tensor_nd(params.dim);
3009 int i;
3010 for (i = 0; i < nd; i++)
3011 scale_params.dim[i] = 1;
3012 for (i = 0; i < self->params.rmsnorm.count; i++)
3013 scale_params.dim[self->params.rmsnorm.axis[i]] = params.dim[self->params.rmsnorm.axis[i]];
3014 // Both scale and bias are shared between if this model is reused.
3015 if (self->params.rmsnorm.elementwise_affine)
3016 {
3017 if (!self->scale.graph)
3018 self->scale = ccv_nnc_tensor_symbol_new(graph, scale_params, "scale");
3019 }
3020 const ccv_nnc_tensor_symbol_t scale = self->params.rmsnorm.elementwise_affine ? ccv_cnnp_model_get_symbol(super, self->scale) : NO_TENSOR_SYMBOL(const ccv_nnc_tensor_symbol_t){.d = CCV_NNC_NO_TENSOR_SYMBOL
}
;
3021 const ccv_nnc_cmd_t rmsnorm = ccv_nnc_cmd(CCV_NNC_RMSNORM_FORWARD, 0, self->params, 0);
3022 ccv_nnc_tensor_param_t output_params[2];
3023 if (self->params.rmsnorm.elementwise_affine)
3024 ccv_nnc_hint_tensor_auto(rmsnorm, (ccv_nnc_tensor_param_t []){
3025 params,
3026 scale_params,
3027 }, 2, ccv_nnc_no_hint, output_params, 2);
3028 else
3029 ccv_nnc_hint_tensor_auto(rmsnorm, (ccv_nnc_tensor_param_t []){
3030 params,
3031 }, 1, ccv_nnc_no_hint, output_params, 2);
3032 const ccv_nnc_tensor_symbol_t output = ccv_nnc_tensor_symbol_new(graph, output_params[0], 0);
3033 const ccv_nnc_tensor_symbol_t saved_inv_std = ccv_nnc_tensor_symbol_new(graph, output_params[1], "saved_inv_std");
3034 if (self->params.rmsnorm.elementwise_affine)
3035 ccv_nnc_graph_exec_symbol_new(graph, rmsnorm, TENSOR_SYMBOL_LIST(inputs[0], scale)(const ccv_nnc_tensor_symbol_t []){inputs[0], scale}, (1 +1 +
1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
-1)
, TENSOR_SYMBOL_LIST(output, saved_inv_std)(const ccv_nnc_tensor_symbol_t []){output, saved_inv_std}, (1
+1 +1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 -1)
, "rmsnorm");
3036 else
3037 ccv_nnc_graph_exec_symbol_new(graph, rmsnorm, TENSOR_SYMBOL_LIST(inputs[0])(const ccv_nnc_tensor_symbol_t []){inputs[0]}, (1 +1 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(output, saved_inv_std)(const ccv_nnc_tensor_symbol_t []){output, saved_inv_std}, (1
+1 +1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 -1)
, "rmsnorm");
3038 outputs[0] = output;
3039}
3040
3041static void _ccv_cnnp_rmsnorm_init_states(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_cnnp_state_initializer_f initializer, void* const context)
3042{
3043 ccv_cnnp_model_rmsnorm_t* const self = (ccv_cnnp_model_rmsnorm_t*)super;
3044 if (self->scale.graph)
3045 initializer(context, CMD_SET_FORWARD(1)ccv_nnc_cmd(CCV_NNC_SET_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={1,}}}, 0)
, ccv_nnc_no_hint, 0, 0, self->scale);
3046}
3047
3048static void _ccv_cnnp_rmsnorm_add_to_parameter(ccv_cnnp_model_t* const super, const ccv_cnnp_add_to_array_f add_to_array, void* const parameters, const int is_trainable)
3049{
3050 ccv_cnnp_model_rmsnorm_t* const self = (ccv_cnnp_model_rmsnorm_t*)super;
3051 if (self->scale.graph)
3052 add_to_array(parameters, self->scale, is_trainable);
3053}
3054
3055static ccv_cnnp_model_t* _ccv_cnnp_rmsnorm_copy(const ccv_cnnp_model_t* const super, void* const context);
3056
3057static const ccv_cnnp_model_vtab_t ccv_cnnp_rmsnorm_isa = {
3058 .build = _ccv_cnnp_rmsnorm_build,
3059 .init_states = _ccv_cnnp_rmsnorm_init_states,
3060 .add_to_parameter = _ccv_cnnp_rmsnorm_add_to_parameter,
3061 .copy = _ccv_cnnp_rmsnorm_copy,
3062};
3063
3064ccv_cnnp_model_t* ccv_cnnp_rmsnorm(const float epsilon, const int axis[CCV_NNC_MAX_DIM_ALLOC(12)], const int axis_count, const int elementwise_affine, const float scale, const int is_trainable, const char* const name)
3065{
3066 ccv_cnnp_model_rmsnorm_t* const model_rmsnorm = (ccv_cnnp_model_rmsnorm_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_rmsnorm_t));
3067 model_rmsnorm->super.isa = &ccv_cnnp_rmsnorm_isa;
3068 model_rmsnorm->super.input_size = 1;
3069 model_rmsnorm->super.outputs = &model_rmsnorm->output;
3070 model_rmsnorm->super.output_size = 1;
3071 model_rmsnorm->super.is_trainable = is_trainable;
3072 ccv_cnnp_model_copy_name(&model_rmsnorm->super, name);
3073 model_rmsnorm->scale.d = CCV_NNC_NO_TENSOR_SYMBOL;
3074 model_rmsnorm->scale.graph = 0;
3075 model_rmsnorm->params.rmsnorm.epsilon = epsilon;
3076 model_rmsnorm->params.rmsnorm.scale = scale;
3077 model_rmsnorm->params.rmsnorm.count = axis_count;
3078 model_rmsnorm->params.rmsnorm.elementwise_affine = elementwise_affine;
3079 memcpy(model_rmsnorm->params.lnorm.axis, axis, sizeof(int) * axis_count);
3080 return (ccv_cnnp_model_t*)model_rmsnorm;
3081}
3082
3083static ccv_cnnp_model_t* _ccv_cnnp_rmsnorm_copy(const ccv_cnnp_model_t* const super, void* const context)
3084{
3085 const ccv_cnnp_model_rmsnorm_t* const self = (const ccv_cnnp_model_rmsnorm_t*)super;
3086 return ccv_cnnp_rmsnorm(self->params.rmsnorm.epsilon, self->params.rmsnorm.axis, self->params.rmsnorm.count, self->params.rmsnorm.elementwise_affine, self->params.rmsnorm.scale, self->super.is_trainable, self->super.name);
3087}
3088
3089// MARK - RMSNorm Gated Layer
3090
3091typedef struct {
3092 ccv_cnnp_model_t super;
3093 ccv_nnc_tensor_symbol_t output;
3094 ccv_nnc_tensor_symbol_t scale;
3095 ccv_nnc_cmd_param_t params;
3096} ccv_cnnp_model_rmsnorm_gated_t;
3097
3098static void _ccv_cnnp_rmsnorm_gated_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
3099{
3100 PRINT(CCV_CLI_VERBOSE, "[cnnp_rmsnorm_gated_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_rmsnorm_gated_build] -\n"); fflush(stdout); }
} while (0)
;
3101 assert(input_size == 2)((void) sizeof ((input_size == 2) ? 1 : 0), __extension__ ({ if
(input_size == 2) ; else __assert_fail ("input_size == 2", "ccv_cnnp_model_addons.c"
, 3101, __extension__ __PRETTY_FUNCTION__); }))
;
3102 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 3102, __extension__ __PRETTY_FUNCTION__
); }))
;
3103 ccv_cnnp_model_rmsnorm_gated_t* const self = (ccv_cnnp_model_rmsnorm_gated_t*)super;
3104 const ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
3105 const ccv_nnc_tensor_param_t gate_params = ccv_nnc_tensor_symbol_params(graph, inputs[1]);
3106 ccv_nnc_tensor_param_t scale_params = params;
3107 const int nd = ccv_nnc_tensor_nd(params.dim);
3108 int i;
3109 for (i = 0; i < nd; i++)
3110 scale_params.dim[i] = 1;
3111 for (i = 0; i < self->params.rmsnorm_gated.count; i++)
3112 scale_params.dim[self->params.rmsnorm_gated.axis[i]] = params.dim[self->params.rmsnorm_gated.axis[i]];
3113 if (self->params.rmsnorm_gated.elementwise_affine)
3114 {
3115 if (!self->scale.graph)
3116 self->scale = ccv_nnc_tensor_symbol_new(graph, scale_params, "scale");
3117 }
3118 const ccv_nnc_tensor_symbol_t scale = self->params.rmsnorm_gated.elementwise_affine ? ccv_cnnp_model_get_symbol(super, self->scale) : NO_TENSOR_SYMBOL(const ccv_nnc_tensor_symbol_t){.d = CCV_NNC_NO_TENSOR_SYMBOL
}
;
3119 const ccv_nnc_cmd_t rmsnorm_gated = ccv_nnc_cmd(CCV_NNC_RMSNORM_GATED_FORWARD, 0, self->params, 0);
3120 ccv_nnc_tensor_param_t output_params;
3121 if (self->params.rmsnorm_gated.elementwise_affine)
3122 ccv_nnc_hint_tensor_auto(rmsnorm_gated, (ccv_nnc_tensor_param_t []){
3123 params,
3124 gate_params,
3125 scale_params,
3126 }, 3, ccv_nnc_no_hint, &output_params, 1);
3127 else
3128 ccv_nnc_hint_tensor_auto(rmsnorm_gated, (ccv_nnc_tensor_param_t []){
3129 params,
3130 gate_params,
3131 }, 2, ccv_nnc_no_hint, &output_params, 1);
3132 outputs[0] = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
3133 if (self->params.rmsnorm_gated.elementwise_affine)
3134 ccv_nnc_graph_exec_symbol_new(graph, rmsnorm_gated, TENSOR_SYMBOL_LIST(inputs[0], inputs[1], scale)(const ccv_nnc_tensor_symbol_t []){inputs[0], inputs[1], scale
}, (1 +1 +1 +1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 -1)
, outputs, output_size, "rmsnorm_gated");
3135 else
3136 ccv_nnc_graph_exec_symbol_new(graph, rmsnorm_gated, inputs, input_size, outputs, output_size, "rmsnorm_gated");
3137}
3138
3139static void _ccv_cnnp_rmsnorm_gated_init_states(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_cnnp_state_initializer_f initializer, void* const context)
3140{
3141 ccv_cnnp_model_rmsnorm_gated_t* const self = (ccv_cnnp_model_rmsnorm_gated_t*)super;
3142 if (self->scale.graph)
3143 initializer(context, CMD_SET_FORWARD(1)ccv_nnc_cmd(CCV_NNC_SET_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={1,}}}, 0)
, ccv_nnc_no_hint, 0, 0, self->scale);
3144}
3145
3146static void _ccv_cnnp_rmsnorm_gated_add_to_parameter(ccv_cnnp_model_t* const super, const ccv_cnnp_add_to_array_f add_to_array, void* const parameters, const int is_trainable)
3147{
3148 ccv_cnnp_model_rmsnorm_gated_t* const self = (ccv_cnnp_model_rmsnorm_gated_t*)super;
3149 if (self->scale.graph)
3150 add_to_array(parameters, self->scale, is_trainable);
3151}
3152
3153static ccv_cnnp_model_t* _ccv_cnnp_rmsnorm_gated_copy(const ccv_cnnp_model_t* const super, void* const context);
3154
3155static const ccv_cnnp_model_vtab_t ccv_cnnp_rmsnorm_gated_isa = {
3156 .build = _ccv_cnnp_rmsnorm_gated_build,
3157 .init_states = _ccv_cnnp_rmsnorm_gated_init_states,
3158 .add_to_parameter = _ccv_cnnp_rmsnorm_gated_add_to_parameter,
3159 .copy = _ccv_cnnp_rmsnorm_gated_copy,
3160};
3161
3162ccv_cnnp_model_t* ccv_cnnp_rmsnorm_gated(const float epsilon, const int axis[CCV_NNC_MAX_DIM_ALLOC(12)], const int axis_count, const int elementwise_affine, const int is_trainable, const char* const name)
3163{
3164 ccv_cnnp_model_rmsnorm_gated_t* const model_rmsnorm_gated = (ccv_cnnp_model_rmsnorm_gated_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_rmsnorm_gated_t));
3165 model_rmsnorm_gated->super.isa = &ccv_cnnp_rmsnorm_gated_isa;
3166 model_rmsnorm_gated->super.input_size = 2;
3167 model_rmsnorm_gated->super.outputs = &model_rmsnorm_gated->output;
3168 model_rmsnorm_gated->super.output_size = 1;
3169 model_rmsnorm_gated->super.is_trainable = is_trainable;
3170 ccv_cnnp_model_copy_name(&model_rmsnorm_gated->super, name);
3171 model_rmsnorm_gated->scale.d = CCV_NNC_NO_TENSOR_SYMBOL;
3172 model_rmsnorm_gated->scale.graph = 0;
3173 model_rmsnorm_gated->params.rmsnorm_gated.epsilon = epsilon;
3174 model_rmsnorm_gated->params.rmsnorm_gated.count = axis_count;
3175 model_rmsnorm_gated->params.rmsnorm_gated.elementwise_affine = elementwise_affine;
3176 memcpy(model_rmsnorm_gated->params.rmsnorm_gated.axis, axis, sizeof(int) * axis_count);
3177 return (ccv_cnnp_model_t*)model_rmsnorm_gated;
3178}
3179
3180static ccv_cnnp_model_t* _ccv_cnnp_rmsnorm_gated_copy(const ccv_cnnp_model_t* const super, void* const context)
3181{
3182 const ccv_cnnp_model_rmsnorm_gated_t* const self = (const ccv_cnnp_model_rmsnorm_gated_t*)super;
3183 return ccv_cnnp_rmsnorm_gated(self->params.rmsnorm_gated.epsilon, self->params.rmsnorm_gated.axis, self->params.rmsnorm_gated.count, self->params.rmsnorm_gated.elementwise_affine, self->super.is_trainable, self->super.name);
3184}
3185
3186// MARK - Batched Matrix Mul Layer
3187
3188typedef struct {
3189 ccv_cnnp_model_t super;
3190 ccv_nnc_tensor_symbol_t output;
3191 int transpose_a[2];
3192 int transpose_b[2];
3193 int flags;
3194} ccv_cnnp_model_matmul_t;
3195
3196static void _ccv_cnnp_matmul_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
3197{
3198 PRINT(CCV_CLI_VERBOSE, "[cnnp_matmul_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_matmul_build] -\n"); fflush(stdout); } } while
(0)
;
3199 assert(input_size == 2)((void) sizeof ((input_size == 2) ? 1 : 0), __extension__ ({ if
(input_size == 2) ; else __assert_fail ("input_size == 2", "ccv_cnnp_model_addons.c"
, 3199, __extension__ __PRETTY_FUNCTION__); }))
;
3200 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 3200, __extension__ __PRETTY_FUNCTION__
); }))
;
3201 ccv_cnnp_model_matmul_t* const self = (ccv_cnnp_model_matmul_t*)super;
3202 ccv_nnc_tensor_param_t a_params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
3203 ccv_nnc_tensor_param_t b_params = ccv_nnc_tensor_symbol_params(graph, inputs[1]);
3204 ccv_nnc_tensor_param_t output_params;
3205 ccv_nnc_cmd_t matmul = CMD_GEMM_FORWARD(self->transpose_a, self->transpose_b)ccv_nnc_cmd(CCV_NNC_GEMM_FORWARD, 0, ((ccv_nnc_cmd_param_t){.
size={.dim={1,1,1}},.blas={.a={1,1},.transpose_a={self->transpose_a
[0],self->transpose_a[1]},.transpose_b={self->transpose_b
[0],self->transpose_b[1]},}}), 0)
;
3206 matmul.info.blas.flags = self->flags;
3207 ccv_nnc_hint_tensor_auto(matmul, (ccv_nnc_tensor_param_t []){
3208 a_params,
3209 b_params,
3210 }, 2, ccv_nnc_no_hint, &output_params, 1);
3211 const ccv_nnc_tensor_symbol_t matmul_output = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
3212 ccv_nnc_graph_exec_symbol_new(graph, matmul, inputs, input_size, TENSOR_SYMBOL_LIST(matmul_output)(const ccv_nnc_tensor_symbol_t []){matmul_output}, (1 +1 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1
)
, "matmul");
3213 outputs[0] = matmul_output;
3214}
3215
3216static ccv_cnnp_model_t* _ccv_cnnp_matmul_copy(const ccv_cnnp_model_t* const super, void* const context);
3217
3218static const ccv_cnnp_model_vtab_t ccv_cnnp_matmul_isa = {
3219 .build = _ccv_cnnp_matmul_build,
3220 .copy = _ccv_cnnp_matmul_copy,
3221};
3222
3223ccv_cnnp_model_t* ccv_cnnp_matmul(const int transpose_a[2], const int transpose_b[2], const int flags, const char* const name)
3224{
3225 ccv_cnnp_model_matmul_t* const model_matmul = (ccv_cnnp_model_matmul_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_matmul_t));
3226 model_matmul->super.isa = &ccv_cnnp_matmul_isa;
3227 model_matmul->super.input_size = 2;
3228 model_matmul->super.outputs = &model_matmul->output;
3229 model_matmul->super.output_size = 1;
3230 model_matmul->transpose_a[0] = transpose_a[0];
3231 model_matmul->transpose_a[1] = transpose_a[1];
3232 model_matmul->transpose_b[0] = transpose_b[0];
3233 model_matmul->transpose_b[1] = transpose_b[1];
3234 model_matmul->flags = flags;
3235 ccv_cnnp_model_copy_name(&model_matmul->super, name);
3236 return (ccv_cnnp_model_t*)model_matmul;
3237}
3238
3239static ccv_cnnp_model_t* _ccv_cnnp_matmul_copy(const ccv_cnnp_model_t* const super, void* const context)
3240{
3241 const ccv_cnnp_model_matmul_t* const self = (const ccv_cnnp_model_matmul_t*)super;
3242 return ccv_cnnp_matmul(self->transpose_a, self->transpose_b, self->flags, self->super.name);
3243}
3244
3245// MARK - Dropout Layer
3246
3247typedef struct {
3248 ccv_cnnp_model_t super;
3249 ccv_nnc_tensor_symbol_t output;
3250 ccv_nnc_graph_exec_symbol_t dropout;
3251 float p;
3252 int entirety;
3253} ccv_cnnp_model_dropout_t;
3254
3255static void _ccv_cnnp_dropout_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
3256{
3257 PRINT(CCV_CLI_VERBOSE, "[cnnp_dropout_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_dropout_build] -\n"); fflush(stdout); } } while
(0)
;
3258 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 3258, __extension__ __PRETTY_FUNCTION__); }))
;
3259 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 3259, __extension__ __PRETTY_FUNCTION__
); }))
;
3260 ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
3261 ccv_nnc_tensor_param_t output_params[2];
3262 ccv_cnnp_model_dropout_t* const self = (ccv_cnnp_model_dropout_t*)super;
3263 const ccv_nnc_cmd_t dropout = CMD_DROPOUT_FORWARD(self->p, self->entirety)ccv_nnc_cmd(CCV_NNC_DROPOUT_FORWARD, 0, ((ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.dropout={.p=self->p,.entirety=self
->entirety}}), 0)
;
3264 ccv_nnc_hint_tensor_auto(dropout, (ccv_nnc_tensor_param_t []){
3265 params,
3266 }, 1, ccv_nnc_no_hint, output_params, 2);
3267 const ccv_nnc_tensor_symbol_t dropout_output = ccv_nnc_tensor_symbol_new(graph, output_params[0], 0);
3268 const ccv_nnc_tensor_symbol_t mask = ccv_nnc_tensor_symbol_new(graph, output_params[1], "mask");
3269 self->dropout = ccv_nnc_graph_exec_symbol_new(graph, dropout, TENSOR_SYMBOL_LIST(inputs[0])(const ccv_nnc_tensor_symbol_t []){inputs[0]}, (1 +1 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(dropout_output, mask)(const ccv_nnc_tensor_symbol_t []){dropout_output, mask}, (1 +
1 +1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 -1)
, "dropout");
3270 outputs[0] = dropout_output;
3271}
3272
3273static void _ccv_cnnp_dropout_set_is_test(ccv_cnnp_model_t* const super, const int is_test, const ccv_cnnp_cmd_updater_f updater, void* const context)
3274{
3275 ccv_cnnp_model_dropout_t* const self = (ccv_cnnp_model_dropout_t*)super;
3276 if (self->dropout.graph)
3277 {
3278 if (is_test)
3279 // During test, the dropout is not applied. Data transfer is perfect because if these are the same tensor, it will skip.
3280 updater(context, self->dropout, CMD_DATA_TRANSFER_FORWARD()ccv_nnc_cmd(CCV_NNC_DATA_TRANSFER_FORWARD, 0, ccv_nnc_cmd_auto
, 0)
, ccv_nnc_no_hint);
3281 else
3282 updater(context, self->dropout, CMD_DROPOUT_FORWARD(self->p, self->entirety)ccv_nnc_cmd(CCV_NNC_DROPOUT_FORWARD, 0, ((ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.dropout={.p=self->p,.entirety=self
->entirety}}), 0)
, ccv_nnc_no_hint);
3283 }
3284}
3285
3286static ccv_cnnp_model_t* _ccv_cnnp_dropout_copy(const ccv_cnnp_model_t* const super, void* const context);
3287
3288static const ccv_cnnp_model_vtab_t ccv_cnnp_dropout_isa = {
3289 .build = _ccv_cnnp_dropout_build,
3290 .set_is_test = _ccv_cnnp_dropout_set_is_test,
3291 .copy = _ccv_cnnp_dropout_copy,
3292};
3293
3294ccv_cnnp_model_t* ccv_cnnp_dropout(const float p, const int entirety, const char* const name)
3295{
3296 ccv_cnnp_model_dropout_t* const model_dropout = (ccv_cnnp_model_dropout_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_dropout_t));
3297 model_dropout->super.isa = &ccv_cnnp_dropout_isa;
3298 model_dropout->super.input_size = 1;
3299 model_dropout->super.outputs = &model_dropout->output;
3300 model_dropout->super.output_size = 1;
3301 model_dropout->p = p;
3302 model_dropout->entirety = entirety;
3303 ccv_cnnp_model_copy_name(&model_dropout->super, name);
3304 return (ccv_cnnp_model_t*)model_dropout;
3305}
3306
3307static ccv_cnnp_model_t* _ccv_cnnp_dropout_copy(const ccv_cnnp_model_t* const super, void* const context)
3308{
3309 const ccv_cnnp_model_dropout_t* const self = (const ccv_cnnp_model_dropout_t*)super;
3310 return ccv_cnnp_dropout(self->p, self->entirety, self->super.name);
3311}
3312
3313// MARK - Masked Fill Layer
3314
3315typedef struct {
3316 ccv_cnnp_model_t super;
3317 ccv_nnc_tensor_symbol_t output;
3318 float eq;
3319 float fill;
3320} ccv_cnnp_model_masked_fill_t;
3321
3322static void _ccv_cnnp_masked_fill_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
3323{
3324 PRINT(CCV_CLI_VERBOSE, "[cnnp_masked_fill_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_masked_fill_build] -\n"); fflush(stdout); } }
while (0)
;
3325 assert(input_size == 2)((void) sizeof ((input_size == 2) ? 1 : 0), __extension__ ({ if
(input_size == 2) ; else __assert_fail ("input_size == 2", "ccv_cnnp_model_addons.c"
, 3325, __extension__ __PRETTY_FUNCTION__); }))
;
3326 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 3326, __extension__ __PRETTY_FUNCTION__
); }))
;
3327 ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
3328 ccv_cnnp_model_masked_fill_t* const self = (ccv_cnnp_model_masked_fill_t*)super;
3329 const ccv_nnc_tensor_symbol_t masked_fill_output = ccv_nnc_tensor_symbol_new(graph, params, 0);
3330 ccv_nnc_graph_exec_symbol_new(graph, CMD_MASKED_FILL_FORWARD(self->eq, self->fill)ccv_nnc_cmd(CCV_NNC_MASKED_FILL_FORWARD, 0, (ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.blas={.a={self->eq, self->fill}
}}, 0)
, TENSOR_SYMBOL_LIST(inputs[0], inputs[1])(const ccv_nnc_tensor_symbol_t []){inputs[0], inputs[1]}, (1 +
1 +1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 -1)
, TENSOR_SYMBOL_LIST(masked_fill_output)(const ccv_nnc_tensor_symbol_t []){masked_fill_output}, (1 +1
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 -1)
, "masked_fill");
3331 outputs[0] = masked_fill_output;
3332}
3333
3334static ccv_cnnp_model_t* _ccv_cnnp_masked_fill_copy(const ccv_cnnp_model_t* const super, void* const context);
3335
3336static const ccv_cnnp_model_vtab_t ccv_cnnp_masked_fill_isa = {
3337 .build = _ccv_cnnp_masked_fill_build,
3338 .copy = _ccv_cnnp_masked_fill_copy,
3339};
3340
3341ccv_cnnp_model_t* ccv_cnnp_masked_fill(const float eq, const float fill, const char* const name)
3342{
3343 ccv_cnnp_model_masked_fill_t* const model_masked_fill = (ccv_cnnp_model_masked_fill_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_masked_fill_t));
3344 model_masked_fill->super.isa = &ccv_cnnp_masked_fill_isa;
3345 model_masked_fill->super.input_size = 2;
3346 model_masked_fill->super.outputs = &model_masked_fill->output;
3347 model_masked_fill->super.output_size = 1;
3348 model_masked_fill->eq = eq;
3349 model_masked_fill->fill = fill;
3350 ccv_cnnp_model_copy_name(&model_masked_fill->super, name);
3351 return (ccv_cnnp_model_t*)model_masked_fill;
3352}
3353
3354static ccv_cnnp_model_t* _ccv_cnnp_masked_fill_copy(const ccv_cnnp_model_t* const super, void* const context)
3355{
3356 const ccv_cnnp_model_masked_fill_t* const self = (const ccv_cnnp_model_masked_fill_t*)super;
3357 return ccv_cnnp_masked_fill(self->eq, self->fill, self->super.name);
3358}
3359
3360// MARK - Index Select Layer
3361
3362typedef struct {
3363 ccv_cnnp_model_t super;
3364 ccv_nnc_tensor_symbol_t output;
3365} ccv_cnnp_model_index_select_t;
3366
3367static void _ccv_cnnp_index_select_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
3368{
3369 PRINT(CCV_CLI_VERBOSE, "[cnnp_index_select_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_index_select_build] -\n"); fflush(stdout); }
} while (0)
;
3370 assert(input_size == 2)((void) sizeof ((input_size == 2) ? 1 : 0), __extension__ ({ if
(input_size == 2) ; else __assert_fail ("input_size == 2", "ccv_cnnp_model_addons.c"
, 3370, __extension__ __PRETTY_FUNCTION__); }))
;
3371 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 3371, __extension__ __PRETTY_FUNCTION__
); }))
;
3372 const ccv_nnc_tensor_param_t vocab_params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
3373 const ccv_nnc_tensor_param_t index_params = ccv_nnc_tensor_symbol_params(graph, inputs[1]);
3374 ccv_nnc_tensor_param_t output_params;
3375 const ccv_nnc_cmd_t index_select = CMD_INDEX_SELECT_FORWARD()ccv_nnc_cmd(CCV_NNC_INDEX_SELECT_FORWARD, 0, ccv_nnc_cmd_auto
, 0)
;
3376 ccv_nnc_hint_tensor_auto(index_select, (ccv_nnc_tensor_param_t []){
3377 vocab_params,
3378 index_params,
3379 }, 2, ccv_nnc_no_hint, &output_params, 1);
3380 const ccv_nnc_tensor_symbol_t output = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
3381 ccv_nnc_graph_exec_symbol_new(graph, index_select, TENSOR_SYMBOL_LIST(inputs[0], inputs[1])(const ccv_nnc_tensor_symbol_t []){inputs[0], inputs[1]}, (1 +
1 +1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 -1)
, TENSOR_SYMBOL_LIST(output)(const ccv_nnc_tensor_symbol_t []){output}, (1 +1 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, "index_select");
3382 outputs[0] = output;
3383}
3384
3385static ccv_cnnp_model_t* _ccv_cnnp_index_select_copy(const ccv_cnnp_model_t* const super, void* const context);
3386
3387static const ccv_cnnp_model_vtab_t ccv_cnnp_index_select_isa = {
3388 .build = _ccv_cnnp_index_select_build,
3389 .copy = _ccv_cnnp_index_select_copy,
3390};
3391
3392ccv_cnnp_model_t* ccv_cnnp_index_select(const char* const name)
3393{
3394 ccv_cnnp_model_index_select_t* const model_index_select = (ccv_cnnp_model_index_select_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_index_select_t));
3395 model_index_select->super.isa = &ccv_cnnp_index_select_isa;
3396 model_index_select->super.input_size = 2;
3397 model_index_select->super.outputs = &model_index_select->output;
3398 model_index_select->super.output_size = 1;
3399 ccv_cnnp_model_copy_name(&model_index_select->super, name);
3400 return (ccv_cnnp_model_t*)model_index_select;
3401}
3402
3403static ccv_cnnp_model_t* _ccv_cnnp_index_select_copy(const ccv_cnnp_model_t* const super, void* const context)
3404{
3405 ccv_cnnp_model_index_select_t* const self = (ccv_cnnp_model_index_select_t*)super;
3406 return ccv_cnnp_index_select(self->super.name);
3407}
3408
3409// MARK - Embedding Layer
3410
3411typedef struct {
3412 ccv_cnnp_model_t super;
3413 ccv_nnc_tensor_symbol_t output;
3414 ccv_nnc_tensor_symbol_t vocab;
3415 int datatype;
3416 int vocab_size;
3417 int embed_size;
3418} ccv_cnnp_model_embedding_t;
3419
3420static void _ccv_cnnp_embedding_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
3421{
3422 ccv_cnnp_model_embedding_t* const self = (ccv_cnnp_model_embedding_t*)super;
3423 PRINT(CCV_CLI_VERBOSE, "[cnnp_embedding_build] vocab_size: %d, embed_size: %d\n", self->vocab_size, self->embed_size)do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_embedding_build] vocab_size: %d, embed_size: %d\n"
, self->vocab_size, self->embed_size); fflush(stdout); }
} while (0)
;
3424 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 3424, __extension__ __PRETTY_FUNCTION__); }))
;
3425 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 3425, __extension__ __PRETTY_FUNCTION__
); }))
;
3426 const ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
3427 ccv_nnc_tensor_param_t vocab_params = params;
3428 memset(vocab_params.dim, 0, sizeof(vocab_params.dim));
3429 vocab_params.datatype = self->datatype;
3430 vocab_params.dim[0] = self->vocab_size;
3431 vocab_params.dim[1] = self->embed_size;
3432 if (!self->vocab.graph)
3433 self->vocab = ccv_nnc_tensor_symbol_new(graph, vocab_params, "vocab");
3434 assert(self->vocab.graph == graph)((void) sizeof ((self->vocab.graph == graph) ? 1 : 0), __extension__
({ if (self->vocab.graph == graph) ; else __assert_fail (
"self->vocab.graph == graph", "ccv_cnnp_model_addons.c", 3434
, __extension__ __PRETTY_FUNCTION__); }))
;
3435 const ccv_nnc_tensor_symbol_t vocab = ccv_cnnp_model_get_symbol(super, self->vocab);
3436 ccv_nnc_tensor_param_t output_params;
3437 const ccv_nnc_cmd_t embedding = CMD_INDEX_SELECT_FORWARD()ccv_nnc_cmd(CCV_NNC_INDEX_SELECT_FORWARD, 0, ccv_nnc_cmd_auto
, 0)
;
3438 ccv_nnc_hint_tensor_auto(embedding, (ccv_nnc_tensor_param_t []){
3439 vocab_params,
3440 params,
3441 }, 2, ccv_nnc_no_hint, &output_params, 1);
3442 const ccv_nnc_tensor_symbol_t output = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
3443 ccv_nnc_graph_exec_symbol_new(graph, embedding, TENSOR_SYMBOL_LIST(vocab, inputs[0])(const ccv_nnc_tensor_symbol_t []){vocab, inputs[0]}, (1 +1 +
1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
-1)
, TENSOR_SYMBOL_LIST(output)(const ccv_nnc_tensor_symbol_t []){output}, (1 +1 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, "embedding");
3444 outputs[0] = output;
3445}
3446
3447static void _ccv_cnnp_embedding_init_states(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_cnnp_state_initializer_f initializer, void* const context)
3448{
3449 ccv_cnnp_model_embedding_t* const self = (ccv_cnnp_model_embedding_t*)super;
3450 const float std = sqrtf(2) / sqrtf(self->vocab_size + self->embed_size);
3451 const float bound = sqrtf(3) * std;
3452 initializer(context, CMD_RANDOM_UNIFORM_FORWARD(-bound, bound)ccv_nnc_cmd(CCV_NNC_RANDOM_UNIFORM_FORWARD, 0, (ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.blas={.a={-bound, bound}}}, 0)
, ccv_nnc_no_hint, 0, 0, self->vocab);
3453}
3454
3455static void _ccv_cnnp_embedding_add_to_parameter(ccv_cnnp_model_t* const super, const ccv_cnnp_add_to_array_f add_to_array, void* const parameters, const int is_trainable)
3456{
3457 ccv_cnnp_model_embedding_t* const self = (ccv_cnnp_model_embedding_t*)super;
3458 add_to_array(parameters, self->vocab, is_trainable);
3459}
3460
3461static ccv_cnnp_model_t* _ccv_cnnp_embedding_copy(const ccv_cnnp_model_t* const super, void* const context);
3462
3463static const ccv_cnnp_model_vtab_t ccv_cnnp_embedding_isa = {
3464 .build = _ccv_cnnp_embedding_build,
3465 .init_states = _ccv_cnnp_embedding_init_states,
3466 .add_to_parameter = _ccv_cnnp_embedding_add_to_parameter,
3467 .copy = _ccv_cnnp_embedding_copy,
3468};
3469
3470ccv_cnnp_model_t* ccv_cnnp_embedding(const int datatype, const int vocab_size, const int embed_size, const int is_trainable, const char* const name)
3471{
3472 ccv_cnnp_model_embedding_t* const model_embedding = (ccv_cnnp_model_embedding_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_embedding_t));
3473 model_embedding->super.isa = &ccv_cnnp_embedding_isa;
3474 model_embedding->super.input_size = 1;
3475 model_embedding->super.outputs = &model_embedding->output;
3476 model_embedding->super.output_size = 1;
3477 model_embedding->super.is_trainable = is_trainable;
3478 ccv_cnnp_model_copy_name(&model_embedding->super, name);
3479 model_embedding->vocab.d = CCV_NNC_NO_TENSOR_SYMBOL;
3480 model_embedding->vocab.graph = 0;
3481 assert(datatype == CCV_32F || datatype == CCV_16F || datatype == CCV_16BF)((void) sizeof ((datatype == CCV_32F || datatype == CCV_16F ||
datatype == CCV_16BF) ? 1 : 0), __extension__ ({ if (datatype
== CCV_32F || datatype == CCV_16F || datatype == CCV_16BF) ;
else __assert_fail ("datatype == CCV_32F || datatype == CCV_16F || datatype == CCV_16BF"
, "ccv_cnnp_model_addons.c", 3481, __extension__ __PRETTY_FUNCTION__
); }))
;
3482 model_embedding->datatype = datatype;
3483 assert(vocab_size > 0)((void) sizeof ((vocab_size > 0) ? 1 : 0), __extension__ (
{ if (vocab_size > 0) ; else __assert_fail ("vocab_size > 0"
, "ccv_cnnp_model_addons.c", 3483, __extension__ __PRETTY_FUNCTION__
); }))
;
3484 model_embedding->vocab_size = vocab_size;
3485 assert(embed_size > 0)((void) sizeof ((embed_size > 0) ? 1 : 0), __extension__ (
{ if (embed_size > 0) ; else __assert_fail ("embed_size > 0"
, "ccv_cnnp_model_addons.c", 3485, __extension__ __PRETTY_FUNCTION__
); }))
;
3486 model_embedding->embed_size = embed_size;
3487 return (ccv_cnnp_model_t*)model_embedding;
3488}
3489
3490static ccv_cnnp_model_t* _ccv_cnnp_embedding_copy(const ccv_cnnp_model_t* const super, void* const context)
3491{
3492 ccv_cnnp_model_embedding_t* const self = (ccv_cnnp_model_embedding_t*)super;
3493 return ccv_cnnp_embedding(self->datatype, self->vocab_size, self->embed_size, self->super.is_trainable, self->super.name);
3494}
3495
3496// MARK - Pool Layers
3497
3498typedef struct {
3499 ccv_cnnp_model_t super;
3500 ccv_nnc_tensor_symbol_t output;
3501 int type;
3502 float width_scale;
3503 float height_scale;
3504 int align_corners;
3505} ccv_cnnp_model_upsample_t;
3506
3507static void _ccv_cnnp_upsample_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
3508{
3509 PRINT(CCV_CLI_VERBOSE, "[cnnp_upsample_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_upsample_build] -\n"); fflush(stdout); } } while
(0)
;
3510 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 3510, __extension__ __PRETTY_FUNCTION__); }))
;
3511 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 3511, __extension__ __PRETTY_FUNCTION__
); }))
;
3512 ccv_cnnp_model_upsample_t* const self = (ccv_cnnp_model_upsample_t*)super;
3513 const ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
3514 ccv_nnc_cmd_t cmd = CMD_UPSAMPLE_FORWARD(self->type, self->width_scale, self->height_scale, self->align_corners)ccv_nnc_cmd(CCV_NNC_UPSAMPLE_FORWARD, 0, ((ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.upsample={.type=self->type,.width_scale
=self->width_scale,.height_scale=self->height_scale,.align_corners
=self->align_corners}}), 0)
;
3515 ccv_nnc_tensor_param_t output_params;
3516 ccv_nnc_hint_tensor_auto(cmd, &params, 1, ccv_nnc_no_hint, &output_params, 1);
3517 const ccv_nnc_tensor_symbol_t output = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
3518 ccv_nnc_graph_exec_symbol_new(graph, cmd, TENSOR_SYMBOL_LIST(inputs[0])(const ccv_nnc_tensor_symbol_t []){inputs[0]}, (1 +1 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(output)(const ccv_nnc_tensor_symbol_t []){output}, (1 +1 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, "upsample");
3519 outputs[0] = output;
3520}
3521
3522static ccv_cnnp_model_t* _ccv_cnnp_upsample_copy(const ccv_cnnp_model_t* const super, void* const context);
3523
3524static const ccv_cnnp_model_vtab_t ccv_cnnp_upsample_isa = {
3525 .build = _ccv_cnnp_upsample_build,
3526 .copy = _ccv_cnnp_upsample_copy,
3527};
3528
3529ccv_cnnp_model_t* ccv_cnnp_upsample(const int type, const float width_scale, const float height_scale, const int align_corners, const char* const name)
3530{
3531 ccv_cnnp_model_upsample_t* const model_upsample = (ccv_cnnp_model_upsample_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_upsample_t));
3532 model_upsample->super.isa = &ccv_cnnp_upsample_isa;
3533 model_upsample->super.input_size = 1;
3534 model_upsample->super.outputs = &model_upsample->output;
3535 model_upsample->super.output_size = 1;
3536 ccv_cnnp_model_copy_name(&model_upsample->super, name);
3537 assert(type == CCV_NNC_UPSAMPLE_NEAREST || type == CCV_NNC_UPSAMPLE_BILINEAR)((void) sizeof ((type == CCV_NNC_UPSAMPLE_NEAREST || type == CCV_NNC_UPSAMPLE_BILINEAR
) ? 1 : 0), __extension__ ({ if (type == CCV_NNC_UPSAMPLE_NEAREST
|| type == CCV_NNC_UPSAMPLE_BILINEAR) ; else __assert_fail (
"type == CCV_NNC_UPSAMPLE_NEAREST || type == CCV_NNC_UPSAMPLE_BILINEAR"
, "ccv_cnnp_model_addons.c", 3537, __extension__ __PRETTY_FUNCTION__
); }))
;
3538 model_upsample->type = type;
3539 model_upsample->width_scale = width_scale;
3540 model_upsample->height_scale = height_scale;
3541 model_upsample->align_corners = align_corners;
3542 return (ccv_cnnp_model_t*)model_upsample;
3543}
3544
3545static ccv_cnnp_model_t* _ccv_cnnp_upsample_copy(const ccv_cnnp_model_t* const super, void* const context)
3546{
3547 const ccv_cnnp_model_upsample_t* const self = (const ccv_cnnp_model_upsample_t*)super;
3548 return ccv_cnnp_upsample(self->type, self->width_scale, self->height_scale, self->align_corners, self->super.name);
3549}
3550
3551// MARK - Reduce Sum Layer
3552
3553typedef struct {
3554 ccv_cnnp_model_t super;
3555 int axis[CCV_NNC_MAX_DIM_ALLOC(12)];
3556 int count;
3557 ccv_nnc_tensor_symbol_t output;
3558} ccv_cnnp_model_reduce_sum_t;
3559
3560static void _ccv_cnnp_reduce_sum_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
3561{
3562 PRINT(CCV_CLI_VERBOSE, "[cnnp_reduce_sum_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_reduce_sum_build] -\n"); fflush(stdout); } }
while (0)
;
3563 const ccv_cnnp_model_reduce_sum_t* const self = (const ccv_cnnp_model_reduce_sum_t*)super;
3564 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 3564, __extension__ __PRETTY_FUNCTION__); }))
;
3565 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 3565, __extension__ __PRETTY_FUNCTION__
); }))
;
3566 ccv_nnc_tensor_param_t input_params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
3567 ccv_nnc_tensor_param_t output_params;
3568 ccv_nnc_cmd_t reduce_sum = CMD_REDUCE_SUM_FORWARD()ccv_nnc_cmd(CCV_NNC_REDUCE_SUM_FORWARD, 0, ((ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.reduce={.count=(1 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1),.axis={}}}
), 0)
;
3569 int i;
3570 for (i = 0; i < self->count; i++)
3571 reduce_sum.info.reduce.axis[i] = self->axis[i];
3572 reduce_sum.info.reduce.count = self->count;
3573 ccv_nnc_hint_tensor_auto(reduce_sum, &input_params, 1, ccv_nnc_no_hint, &output_params, 1);
3574 outputs[0] = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
3575 ccv_nnc_graph_exec_symbol_new(graph, reduce_sum, inputs, input_size, outputs, output_size, "reduce_sum");
3576}
3577
3578static ccv_cnnp_model_t* _ccv_cnnp_reduce_sum_copy(const ccv_cnnp_model_t* const self, void* const context);
3579
3580static const ccv_cnnp_model_vtab_t ccv_cnnp_reduce_sum_isa = {
3581 .build = _ccv_cnnp_reduce_sum_build,
3582 .copy = _ccv_cnnp_reduce_sum_copy,
3583};
3584
3585ccv_cnnp_model_t* ccv_cnnp_reduce_sum(const int* const axis, const int axis_count, const char* const name)
3586{
3587 ccv_cnnp_model_reduce_sum_t* const model_reduce_sum = (ccv_cnnp_model_reduce_sum_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_reduce_sum_t));
3588 model_reduce_sum->super.isa = &ccv_cnnp_reduce_sum_isa;
3589 model_reduce_sum->super.input_size = 1;
3590 model_reduce_sum->super.outputs = &model_reduce_sum->output;
3591 model_reduce_sum->super.output_size = 1;
3592 ccv_cnnp_model_copy_name(&model_reduce_sum->super, name);
3593 assert(axis_count <= CCV_NNC_MAX_DIM_ALLOC)((void) sizeof ((axis_count <= (12)) ? 1 : 0), __extension__
({ if (axis_count <= (12)) ; else __assert_fail ("axis_count <= CCV_NNC_MAX_DIM_ALLOC"
, "ccv_cnnp_model_addons.c", 3593, __extension__ __PRETTY_FUNCTION__
); }))
;
3594 int i;
3595 for (i = 0; i < axis_count; i++)
3596 model_reduce_sum->axis[i] = axis[i];
3597 model_reduce_sum->count = axis_count;
3598 return (ccv_cnnp_model_t*)model_reduce_sum;
3599}
3600
3601static ccv_cnnp_model_t* _ccv_cnnp_reduce_sum_copy(const ccv_cnnp_model_t* const super, void* const context)
3602{
3603 const ccv_cnnp_model_reduce_sum_t* const self = (const ccv_cnnp_model_reduce_sum_t*)super;
3604 return ccv_cnnp_reduce_sum(self->axis, self->count, self->super.name);
3605}
3606
3607// MARK - Reduce Mean Layer
3608
3609typedef struct {
3610 ccv_cnnp_model_t super;
3611 int axis[CCV_NNC_MAX_DIM_ALLOC(12)];
3612 int count;
3613 ccv_nnc_tensor_symbol_t output;
3614} ccv_cnnp_model_reduce_mean_t;
3615
3616static void _ccv_cnnp_reduce_mean_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
3617{
3618 PRINT(CCV_CLI_VERBOSE, "[cnnp_reduce_mean_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_reduce_mean_build] -\n"); fflush(stdout); } }
while (0)
;
3619 const ccv_cnnp_model_reduce_mean_t* const self = (const ccv_cnnp_model_reduce_mean_t*)super;
3620 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 3620, __extension__ __PRETTY_FUNCTION__); }))
;
3621 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 3621, __extension__ __PRETTY_FUNCTION__
); }))
;
3622 ccv_nnc_tensor_param_t input_params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
3623 ccv_nnc_tensor_param_t output_params;
3624 ccv_nnc_cmd_t reduce_mean = CMD_REDUCE_MEAN_FORWARD()ccv_nnc_cmd(CCV_NNC_REDUCE_MEAN_FORWARD, 0, ((ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.reduce={.count=(1 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1),.axis={}}}
), 0)
;
3625 int i;
3626 for (i = 0; i < self->count; i++)
3627 reduce_mean.info.reduce.axis[i] = self->axis[i];
3628 reduce_mean.info.reduce.count = self->count;
3629 ccv_nnc_hint_tensor_auto(reduce_mean, &input_params, 1, ccv_nnc_no_hint, &output_params, 1);
3630 outputs[0] = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
3631 ccv_nnc_graph_exec_symbol_new(graph, reduce_mean, inputs, input_size, outputs, output_size, "reduce_mean");
3632}
3633
3634static ccv_cnnp_model_t* _ccv_cnnp_reduce_mean_copy(const ccv_cnnp_model_t* const self, void* const context);
3635
3636static const ccv_cnnp_model_vtab_t ccv_cnnp_reduce_mean_isa = {
3637 .build = _ccv_cnnp_reduce_mean_build,
3638 .copy = _ccv_cnnp_reduce_mean_copy,
3639};
3640
3641ccv_cnnp_model_t* ccv_cnnp_reduce_mean(const int* const axis, const int axis_count, const char* const name)
3642{
3643 ccv_cnnp_model_reduce_mean_t* const model_reduce_mean = (ccv_cnnp_model_reduce_mean_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_reduce_mean_t));
3644 model_reduce_mean->super.isa = &ccv_cnnp_reduce_mean_isa;
3645 model_reduce_mean->super.input_size = 1;
3646 model_reduce_mean->super.outputs = &model_reduce_mean->output;
3647 model_reduce_mean->super.output_size = 1;
3648 ccv_cnnp_model_copy_name(&model_reduce_mean->super, name);
3649 assert(axis_count <= CCV_NNC_MAX_DIM_ALLOC)((void) sizeof ((axis_count <= (12)) ? 1 : 0), __extension__
({ if (axis_count <= (12)) ; else __assert_fail ("axis_count <= CCV_NNC_MAX_DIM_ALLOC"
, "ccv_cnnp_model_addons.c", 3649, __extension__ __PRETTY_FUNCTION__
); }))
;
3650 int i;
3651 for (i = 0; i < axis_count; i++)
3652 model_reduce_mean->axis[i] = axis[i];
3653 model_reduce_mean->count = axis_count;
3654 return (ccv_cnnp_model_t*)model_reduce_mean;
3655}
3656
3657static ccv_cnnp_model_t* _ccv_cnnp_reduce_mean_copy(const ccv_cnnp_model_t* const super, void* const context)
3658{
3659 const ccv_cnnp_model_reduce_mean_t* const self = (const ccv_cnnp_model_reduce_mean_t*)super;
3660 return ccv_cnnp_reduce_mean(self->axis, self->count, self->super.name);
3661}
3662
3663// MARK - Reduce Max Layer
3664
3665typedef struct {
3666 ccv_cnnp_model_t super;
3667 int axis[CCV_NNC_MAX_DIM_ALLOC(12)];
3668 int count;
3669 ccv_nnc_tensor_symbol_t output;
3670} ccv_cnnp_model_reduce_max_t;
3671
3672static void _ccv_cnnp_reduce_max_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
3673{
3674 PRINT(CCV_CLI_VERBOSE, "[cnnp_reduce_max_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_reduce_max_build] -\n"); fflush(stdout); } }
while (0)
;
3675 const ccv_cnnp_model_reduce_max_t* const self = (const ccv_cnnp_model_reduce_max_t*)super;
3676 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 3676, __extension__ __PRETTY_FUNCTION__); }))
;
3677 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 3677, __extension__ __PRETTY_FUNCTION__
); }))
;
3678 ccv_nnc_tensor_param_t input_params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
3679 ccv_nnc_tensor_param_t output_params;
3680 ccv_nnc_cmd_t reduce_max = CMD_REDUCE_MAX_FORWARD()ccv_nnc_cmd(CCV_NNC_REDUCE_MAX_FORWARD, 0, ((ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.reduce={.count=(1 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1),.axis={}}}
), 0)
;
3681 int i;
3682 for (i = 0; i < self->count; i++)
3683 reduce_max.info.reduce.axis[i] = self->axis[i];
3684 reduce_max.info.reduce.count = self->count;
3685 ccv_nnc_hint_tensor_auto(reduce_max, &input_params, 1, ccv_nnc_no_hint, &output_params, 1);
3686 outputs[0] = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
3687 ccv_nnc_graph_exec_symbol_new(graph, reduce_max, inputs, input_size, outputs, output_size, "reduce_max");
3688}
3689
3690static ccv_cnnp_model_t* _ccv_cnnp_reduce_max_copy(const ccv_cnnp_model_t* const self, void* const context);
3691
3692static const ccv_cnnp_model_vtab_t ccv_cnnp_reduce_max_isa = {
3693 .build = _ccv_cnnp_reduce_max_build,
3694 .copy = _ccv_cnnp_reduce_max_copy,
3695};
3696
3697ccv_cnnp_model_t* ccv_cnnp_reduce_max(const int* const axis, const int axis_count, const char* const name)
3698{
3699 ccv_cnnp_model_reduce_max_t* const model_reduce_max = (ccv_cnnp_model_reduce_max_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_reduce_max_t));
3700 model_reduce_max->super.isa = &ccv_cnnp_reduce_max_isa;
3701 model_reduce_max->super.input_size = 1;
3702 model_reduce_max->super.outputs = &model_reduce_max->output;
3703 model_reduce_max->super.output_size = 1;
3704 ccv_cnnp_model_copy_name(&model_reduce_max->super, name);
3705 assert(axis_count <= CCV_NNC_MAX_DIM_ALLOC)((void) sizeof ((axis_count <= (12)) ? 1 : 0), __extension__
({ if (axis_count <= (12)) ; else __assert_fail ("axis_count <= CCV_NNC_MAX_DIM_ALLOC"
, "ccv_cnnp_model_addons.c", 3705, __extension__ __PRETTY_FUNCTION__
); }))
;
3706 int i;
3707 for (i = 0; i < axis_count; i++)
3708 model_reduce_max->axis[i] = axis[i];
3709 model_reduce_max->count = axis_count;
3710 return (ccv_cnnp_model_t*)model_reduce_max;
3711}
3712
3713static ccv_cnnp_model_t* _ccv_cnnp_reduce_max_copy(const ccv_cnnp_model_t* const super, void* const context)
3714{
3715 const ccv_cnnp_model_reduce_max_t* const self = (const ccv_cnnp_model_reduce_max_t*)super;
3716 return ccv_cnnp_reduce_max(self->axis, self->count, self->super.name);
3717}
3718
3719// MARK - Reduce Min Layer
3720
3721typedef struct {
3722 ccv_cnnp_model_t super;
3723 int axis[CCV_NNC_MAX_DIM_ALLOC(12)];
3724 int count;
3725 ccv_nnc_tensor_symbol_t output;
3726} ccv_cnnp_model_reduce_min_t;
3727
3728static void _ccv_cnnp_reduce_min_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
3729{
3730 PRINT(CCV_CLI_VERBOSE, "[cnnp_reduce_min_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_reduce_min_build] -\n"); fflush(stdout); } }
while (0)
;
3731 const ccv_cnnp_model_reduce_min_t* const self = (const ccv_cnnp_model_reduce_min_t*)super;
3732 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 3732, __extension__ __PRETTY_FUNCTION__); }))
;
3733 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 3733, __extension__ __PRETTY_FUNCTION__
); }))
;
3734 ccv_nnc_tensor_param_t input_params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
3735 ccv_nnc_tensor_param_t output_params;
3736 ccv_nnc_cmd_t reduce_min = CMD_REDUCE_MIN_FORWARD()ccv_nnc_cmd(CCV_NNC_REDUCE_MIN_FORWARD, 0, ((ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.reduce={.count=(1 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1),.axis={}}}
), 0)
;
3737 int i;
3738 for (i = 0; i < self->count; i++)
3739 reduce_min.info.reduce.axis[i] = self->axis[i];
3740 reduce_min.info.reduce.count = self->count;
3741 ccv_nnc_hint_tensor_auto(reduce_min, &input_params, 1, ccv_nnc_no_hint, &output_params, 1);
3742 outputs[0] = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
3743 ccv_nnc_graph_exec_symbol_new(graph, reduce_min, inputs, input_size, outputs, output_size, "reduce_min");
3744}
3745
3746static ccv_cnnp_model_t* _ccv_cnnp_reduce_min_copy(const ccv_cnnp_model_t* const self, void* const context);
3747
3748static const ccv_cnnp_model_vtab_t ccv_cnnp_reduce_min_isa = {
3749 .build = _ccv_cnnp_reduce_min_build,
3750 .copy = _ccv_cnnp_reduce_min_copy,
3751};
3752
3753ccv_cnnp_model_t* ccv_cnnp_reduce_min(const int* const axis, const int axis_count, const char* const name)
3754{
3755 ccv_cnnp_model_reduce_min_t* const model_reduce_min = (ccv_cnnp_model_reduce_min_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_reduce_min_t));
3756 model_reduce_min->super.isa = &ccv_cnnp_reduce_min_isa;
3757 model_reduce_min->super.input_size = 1;
3758 model_reduce_min->super.outputs = &model_reduce_min->output;
3759 model_reduce_min->super.output_size = 1;
3760 ccv_cnnp_model_copy_name(&model_reduce_min->super, name);
3761 assert(axis_count <= CCV_NNC_MAX_DIM_ALLOC)((void) sizeof ((axis_count <= (12)) ? 1 : 0), __extension__
({ if (axis_count <= (12)) ; else __assert_fail ("axis_count <= CCV_NNC_MAX_DIM_ALLOC"
, "ccv_cnnp_model_addons.c", 3761, __extension__ __PRETTY_FUNCTION__
); }))
;
3762 int i;
3763 for (i = 0; i < axis_count; i++)
3764 model_reduce_min->axis[i] = axis[i];
3765 model_reduce_min->count = axis_count;
3766 return (ccv_cnnp_model_t*)model_reduce_min;
3767}
3768
3769static ccv_cnnp_model_t* _ccv_cnnp_reduce_min_copy(const ccv_cnnp_model_t* const super, void* const context)
3770{
3771 const ccv_cnnp_model_reduce_min_t* const self = (const ccv_cnnp_model_reduce_min_t*)super;
3772 return ccv_cnnp_reduce_min(self->axis, self->count, self->super.name);
3773}
3774
3775// MARK - Reduce Norm2 Layer
3776
3777typedef struct {
3778 ccv_cnnp_model_t super;
3779 int axis[CCV_NNC_MAX_DIM_ALLOC(12)];
3780 int count;
3781 ccv_nnc_tensor_symbol_t output;
3782} ccv_cnnp_model_reduce_norm2_t;
3783
3784static void _ccv_cnnp_reduce_norm2_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
3785{
3786 const ccv_cnnp_model_reduce_norm2_t* const self = (const ccv_cnnp_model_reduce_norm2_t*)super;
3787 PRINT(CCV_CLI_VERBOSE, "[cnnp_reduce_norm2_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_reduce_norm2_build] -\n"); fflush(stdout); }
} while (0)
;
3788 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 3788, __extension__ __PRETTY_FUNCTION__); }))
;
3789 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 3789, __extension__ __PRETTY_FUNCTION__
); }))
;
3790 ccv_nnc_tensor_param_t input_params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
3791 ccv_nnc_tensor_param_t output_params;
3792 ccv_nnc_cmd_t reduce_norm2 = CMD_REDUCE_NORM2_FORWARD()ccv_nnc_cmd(CCV_NNC_REDUCE_NORM2_FORWARD, 0, ((ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.reduce={.count=(1 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1),.axis={}}}
), 0)
;
3793 int i;
3794 for (i = 0; i < self->count; i++)
3795 reduce_norm2.info.reduce.axis[i] = self->axis[i];
3796 reduce_norm2.info.reduce.count = self->count;
3797 ccv_nnc_hint_tensor_auto(reduce_norm2, &input_params, 1, ccv_nnc_no_hint, &output_params, 1);
3798 outputs[0] = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
3799 ccv_nnc_graph_exec_symbol_new(graph, reduce_norm2, inputs, input_size, outputs, output_size, "reduce_norm2");
3800}
3801
3802static ccv_cnnp_model_t* _ccv_cnnp_reduce_norm2_copy(const ccv_cnnp_model_t* const self, void* const context);
3803
3804static const ccv_cnnp_model_vtab_t ccv_cnnp_reduce_norm2_isa = {
3805 .build = _ccv_cnnp_reduce_norm2_build,
3806 .copy = _ccv_cnnp_reduce_norm2_copy,
3807};
3808
3809ccv_cnnp_model_t* ccv_cnnp_reduce_norm2(const int* const axis, const int axis_count, const char* const name)
3810{
3811 ccv_cnnp_model_reduce_norm2_t* const model_reduce_norm2 = (ccv_cnnp_model_reduce_norm2_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_reduce_norm2_t));
3812 model_reduce_norm2->super.isa = &ccv_cnnp_reduce_norm2_isa;
3813 model_reduce_norm2->super.input_size = 1;
3814 model_reduce_norm2->super.outputs = &model_reduce_norm2->output;
3815 model_reduce_norm2->super.output_size = 1;
3816 ccv_cnnp_model_copy_name(&model_reduce_norm2->super, name);
3817 assert(axis_count <= CCV_NNC_MAX_DIM_ALLOC)((void) sizeof ((axis_count <= (12)) ? 1 : 0), __extension__
({ if (axis_count <= (12)) ; else __assert_fail ("axis_count <= CCV_NNC_MAX_DIM_ALLOC"
, "ccv_cnnp_model_addons.c", 3817, __extension__ __PRETTY_FUNCTION__
); }))
;
3818 int i;
3819 for (i = 0; i < axis_count; i++)
3820 model_reduce_norm2->axis[i] = axis[i];
3821 model_reduce_norm2->count = axis_count;
3822 return (ccv_cnnp_model_t*)model_reduce_norm2;
3823}
3824
3825static ccv_cnnp_model_t* _ccv_cnnp_reduce_norm2_copy(const ccv_cnnp_model_t* const super, void* const context)
3826{
3827 const ccv_cnnp_model_reduce_norm2_t* const self = (const ccv_cnnp_model_reduce_norm2_t*)super;
3828 return ccv_cnnp_reduce_norm2(self->axis, self->count, self->super.name);
3829}
3830
3831// MARK - Argmax Layer
3832
3833typedef struct {
3834 ccv_cnnp_model_t super;
3835 int axis;
3836 ccv_nnc_tensor_symbol_t output;
3837} ccv_cnnp_model_argmax_t;
3838
3839static void _ccv_cnnp_argmax_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
3840{
3841 const ccv_cnnp_model_argmax_t* const self = (const ccv_cnnp_model_argmax_t*)super;
3842 PRINT(CCV_CLI_VERBOSE, "[cnnp_argmax_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_argmax_build] -\n"); fflush(stdout); } } while
(0)
;
3843 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 3843, __extension__ __PRETTY_FUNCTION__); }))
;
3844 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 3844, __extension__ __PRETTY_FUNCTION__
); }))
;
3845 ccv_nnc_tensor_param_t input_params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
3846 ccv_nnc_tensor_param_t output_params;
3847 ccv_nnc_cmd_t argmax = CMD_ARGMAX_FORWARD()ccv_nnc_cmd(CCV_NNC_ARGMAX_FORWARD, 0, ((ccv_nnc_cmd_param_t)
{.size={.dim={1,1,1}},.reduce={.count=(1 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1),.axis={}}})
, 0)
;
3848 argmax.info.reduce.axis[0] = self->axis;
3849 argmax.info.reduce.count = 1;
3850 ccv_nnc_hint_tensor_auto(argmax, &input_params, 1, ccv_nnc_no_hint, &output_params, 1);
3851 outputs[0] = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
3852 ccv_nnc_graph_exec_symbol_new(graph, argmax, inputs, input_size, outputs, output_size, "argmax");
3853}
3854
3855static ccv_cnnp_model_t* _ccv_cnnp_argmax_copy(const ccv_cnnp_model_t* const self, void* const context);
3856
3857static const ccv_cnnp_model_vtab_t ccv_cnnp_argmax_isa = {
3858 .build = _ccv_cnnp_argmax_build,
3859 .copy = _ccv_cnnp_argmax_copy,
3860};
3861
3862ccv_cnnp_model_t* ccv_cnnp_argmax(const int axis, const char* const name)
3863{
3864 ccv_cnnp_model_argmax_t* const model_argmax = (ccv_cnnp_model_argmax_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_argmax_t));
3865 model_argmax->super.isa = &ccv_cnnp_argmax_isa;
3866 model_argmax->super.input_size = 1;
3867 model_argmax->super.outputs = &model_argmax->output;
3868 model_argmax->super.output_size = 1;
3869 ccv_cnnp_model_copy_name(&model_argmax->super, name);
3870 model_argmax->axis = axis;
3871 return (ccv_cnnp_model_t*)model_argmax;
3872}
3873
3874static ccv_cnnp_model_t* _ccv_cnnp_argmax_copy(const ccv_cnnp_model_t* const super, void* const context)
3875{
3876 const ccv_cnnp_model_argmax_t* const self = (const ccv_cnnp_model_argmax_t*)super;
3877 return ccv_cnnp_argmax(self->axis, self->super.name);
3878}
3879
3880// MARK - Argmin Layer
3881
3882typedef struct {
3883 ccv_cnnp_model_t super;
3884 int axis;
3885 ccv_nnc_tensor_symbol_t output;
3886} ccv_cnnp_model_argmin_t;
3887
3888static void _ccv_cnnp_argmin_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
3889{
3890 const ccv_cnnp_model_argmin_t* const self = (const ccv_cnnp_model_argmin_t*)super;
3891 PRINT(CCV_CLI_VERBOSE, "[cnnp_argmin_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_argmin_build] -\n"); fflush(stdout); } } while
(0)
;
3892 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 3892, __extension__ __PRETTY_FUNCTION__); }))
;
3893 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 3893, __extension__ __PRETTY_FUNCTION__
); }))
;
3894 ccv_nnc_tensor_param_t input_params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
3895 ccv_nnc_tensor_param_t output_params;
3896 ccv_nnc_cmd_t argmin = CMD_ARGMIN_FORWARD()ccv_nnc_cmd(CCV_NNC_ARGMIN_FORWARD, 0, ((ccv_nnc_cmd_param_t)
{.size={.dim={1,1,1}},.reduce={.count=(1 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1),.axis={}}})
, 0)
;
3897 argmin.info.reduce.axis[0] = self->axis;
3898 argmin.info.reduce.count = 1;
3899 ccv_nnc_hint_tensor_auto(argmin, &input_params, 1, ccv_nnc_no_hint, &output_params, 1);
3900 outputs[0] = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
3901 ccv_nnc_graph_exec_symbol_new(graph, argmin, inputs, input_size, outputs, output_size, "argmin");
3902}
3903
3904static ccv_cnnp_model_t* _ccv_cnnp_argmin_copy(const ccv_cnnp_model_t* const self, void* const context);
3905
3906static const ccv_cnnp_model_vtab_t ccv_cnnp_argmin_isa = {
3907 .build = _ccv_cnnp_argmin_build,
3908 .copy = _ccv_cnnp_argmin_copy,
3909};
3910
3911ccv_cnnp_model_t* ccv_cnnp_argmin(const int axis, const char* const name)
3912{
3913 ccv_cnnp_model_argmin_t* const model_argmin = (ccv_cnnp_model_argmin_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_argmin_t));
3914 model_argmin->super.isa = &ccv_cnnp_argmin_isa;
3915 model_argmin->super.input_size = 1;
3916 model_argmin->super.outputs = &model_argmin->output;
3917 model_argmin->super.output_size = 1;
3918 ccv_cnnp_model_copy_name(&model_argmin->super, name);
3919 model_argmin->axis = axis;
3920 return (ccv_cnnp_model_t*)model_argmin;
3921}
3922
3923static ccv_cnnp_model_t* _ccv_cnnp_argmin_copy(const ccv_cnnp_model_t* const super, void* const context)
3924{
3925 const ccv_cnnp_model_argmin_t* const self = (const ccv_cnnp_model_argmin_t*)super;
3926 return ccv_cnnp_argmin(self->axis, self->super.name);
3927}
3928
3929// MARK - Min Layer
3930
3931typedef struct {
3932 ccv_cnnp_model_t super;
3933 ccv_nnc_tensor_symbol_t output;
3934} ccv_cnnp_model_min_t;
3935
3936static void _ccv_cnnp_min_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
3937{
3938 PRINT(CCV_CLI_VERBOSE, "[cnnp_min_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_min_build] -\n"); fflush(stdout); } } while (
0)
;
3939 assert(input_size == 2)((void) sizeof ((input_size == 2) ? 1 : 0), __extension__ ({ if
(input_size == 2) ; else __assert_fail ("input_size == 2", "ccv_cnnp_model_addons.c"
, 3939, __extension__ __PRETTY_FUNCTION__); }))
;
3940 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 3940, __extension__ __PRETTY_FUNCTION__
); }))
;
3941 ccv_nnc_tensor_param_t input_params[2];
3942 int i;
3943 for (i = 0; i < 2; i++)
3944 input_params[i] = ccv_nnc_tensor_symbol_params(graph, inputs[i]);
3945 ccv_nnc_tensor_param_t output_params;
3946 const ccv_nnc_cmd_t min = CMD_MIN_FORWARD()ccv_nnc_cmd(CCV_NNC_MIN_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}}}, 0)
;
3947 ccv_nnc_hint_tensor_auto(min, input_params, 2, ccv_nnc_no_hint, &output_params, 1);
3948 outputs[0] = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
3949 ccv_nnc_graph_exec_symbol_new(graph, min, inputs, input_size, outputs, output_size, "min");
3950}
3951
3952static ccv_cnnp_model_t* _ccv_cnnp_min_copy(const ccv_cnnp_model_t* const self, void* const context);
3953
3954static const ccv_cnnp_model_vtab_t ccv_cnnp_min_isa = {
3955 .build = _ccv_cnnp_min_build,
3956 .copy = _ccv_cnnp_min_copy,
3957};
3958
3959ccv_cnnp_model_t* ccv_cnnp_min(const char* const name)
3960{
3961 ccv_cnnp_model_min_t* const model_min = (ccv_cnnp_model_min_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_min_t));
3962 model_min->super.isa = &ccv_cnnp_min_isa;
3963 model_min->super.input_size = 2;
3964 model_min->super.outputs = &model_min->output;
3965 model_min->super.output_size = 1;
3966 ccv_cnnp_model_copy_name(&model_min->super, name);
3967 return (ccv_cnnp_model_t*)model_min;
3968}
3969
3970static ccv_cnnp_model_t* _ccv_cnnp_min_copy(const ccv_cnnp_model_t* const super, void* const context)
3971{
3972 const ccv_cnnp_model_min_t* const self = (const ccv_cnnp_model_min_t*)super;
3973 return ccv_cnnp_min(self->super.name);
3974}
3975
3976// MARK - Max Layer
3977
3978typedef struct {
3979 ccv_cnnp_model_t super;
3980 ccv_nnc_tensor_symbol_t output;
3981} ccv_cnnp_model_max_t;
3982
3983static void _ccv_cnnp_max_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
3984{
3985 PRINT(CCV_CLI_VERBOSE, "[cnnp_max_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_max_build] -\n"); fflush(stdout); } } while (
0)
;
3986 assert(input_size == 2)((void) sizeof ((input_size == 2) ? 1 : 0), __extension__ ({ if
(input_size == 2) ; else __assert_fail ("input_size == 2", "ccv_cnnp_model_addons.c"
, 3986, __extension__ __PRETTY_FUNCTION__); }))
;
3987 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 3987, __extension__ __PRETTY_FUNCTION__
); }))
;
3988 ccv_nnc_tensor_param_t input_params[2];
3989 int i;
3990 for (i = 0; i < 2; i++)
3991 input_params[i] = ccv_nnc_tensor_symbol_params(graph, inputs[i]);
3992 ccv_nnc_tensor_param_t output_params;
3993 const ccv_nnc_cmd_t max = CMD_MAX_FORWARD()ccv_nnc_cmd(CCV_NNC_MAX_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}}}, 0)
;
3994 ccv_nnc_hint_tensor_auto(max, input_params, 2, ccv_nnc_no_hint, &output_params, 1);
3995 outputs[0] = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
3996 ccv_nnc_graph_exec_symbol_new(graph, max, inputs, input_size, outputs, output_size, "max");
3997}
3998
3999static ccv_cnnp_model_t* _ccv_cnnp_max_copy(const ccv_cnnp_model_t* const self, void* const context);
4000
4001static const ccv_cnnp_model_vtab_t ccv_cnnp_max_isa = {
4002 .build = _ccv_cnnp_max_build,
4003 .copy = _ccv_cnnp_max_copy,
4004};
4005
4006ccv_cnnp_model_t* ccv_cnnp_max(const char* const name)
4007{
4008 ccv_cnnp_model_max_t* const model_max = (ccv_cnnp_model_max_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_max_t));
4009 model_max->super.isa = &ccv_cnnp_max_isa;
4010 model_max->super.input_size = 2;
4011 model_max->super.outputs = &model_max->output;
4012 model_max->super.output_size = 1;
4013 ccv_cnnp_model_copy_name(&model_max->super, name);
4014 return (ccv_cnnp_model_t*)model_max;
4015}
4016
4017static ccv_cnnp_model_t* _ccv_cnnp_max_copy(const ccv_cnnp_model_t* const super, void* const context)
4018{
4019 const ccv_cnnp_model_max_t* const self = (const ccv_cnnp_model_max_t*)super;
4020 return ccv_cnnp_max(self->super.name);
4021}
4022
4023// MARK - LSTM Layer
4024
4025typedef struct {
4026 ccv_cnnp_model_t super;
4027 int masked;
4028 ccv_nnc_tensor_symbol_t output;
4029 ccv_nnc_tensor_symbol_t weights;
4030 ccv_nnc_tensor_symbol_t reserves;
4031 ccv_nnc_cmd_param_t params;
4032 ccv_nnc_graph_exec_symbol_t lstm;
4033} ccv_cnnp_model_lstm_t;
4034
4035static int _ccv_cnnp_lstm_weight_dim(int bidirectional, int num_layers, int input_size, int hidden_size, int proj_size, int bias)
4036{
4037 const int D = !!bidirectional + 1;
4038 if (hidden_size == proj_size)
4039 return (num_layers * (bias ? 8 : 0) + (num_layers - 1) * (hidden_size * 4 * D + hidden_size * 4) + input_size * 4 + hidden_size * 4) * D;
4040 else
4041 return (num_layers * (bias ? 8 : 0) + (num_layers - 1) * (proj_size * 4 * D + proj_size * 4) + (proj_size * 4 + input_size * 4) + num_layers * proj_size) * D;
4042}
4043
4044static void _ccv_cnnp_lstm_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
4045{
4046 ccv_cnnp_model_lstm_t* const self = (ccv_cnnp_model_lstm_t*)super;
4047 PRINT(CCV_CLI_VERBOSE, "[cnnp_lstm_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_lstm_build] -\n"); fflush(stdout); } } while
(0)
;
4048 assert(input_size == self->super.input_size)((void) sizeof ((input_size == self->super.input_size) ? 1
: 0), __extension__ ({ if (input_size == self->super.input_size
) ; else __assert_fail ("input_size == self->super.input_size"
, "ccv_cnnp_model_addons.c", 4048, __extension__ __PRETTY_FUNCTION__
); }))
;
4049 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 4049, __extension__ __PRETTY_FUNCTION__
); }))
;
4050 const int proj_size = self->params.rnn.proj_size == 0 ? self->params.rnn.hidden_size : self->params.rnn.proj_size;
4051 ccv_nnc_tensor_param_t input_params[5];
4052 input_params[0]= ccv_nnc_tensor_symbol_params(graph, inputs[0]);
4053 if (input_size == 2)
4054 input_params[1] = ccv_nnc_tensor_symbol_params(graph, inputs[1]);
4055 input_params[4] = input_params[0];
4056 memset(input_params[4].dim, 0, sizeof(input_params[4].dim));
4057 const int x_nd = ccv_nnc_tensor_nd(input_params[0].dim);
4058 const int feature_count = input_params[0].dim[x_nd - 1];
4059 input_params[4].dim[0] = _ccv_cnnp_lstm_weight_dim(self->params.rnn.bidirectional, self->params.rnn.num_layers, feature_count, self->params.rnn.hidden_size, proj_size, self->params.rnn.bias);
4060 input_params[4].dim[1] = self->params.rnn.hidden_size;
4061 const ccv_nnc_cmd_t lstm = ccv_nnc_cmd(CCV_NNC_LSTM_FORWARD, 0, self->params, 0);
4062 ccv_nnc_tensor_param_t output_params[4];
4063 ccv_nnc_hint_tensor_auto(lstm, input_params, 5, ccv_nnc_no_hint, output_params, 4);
4064 outputs[0] = ccv_nnc_tensor_symbol_new(graph, output_params[0], 0);
4065 if (!self->weights.graph)
4066 self->weights = ccv_nnc_tensor_symbol_new(graph, input_params[4], "weights");
4067 assert(self->weights.graph == graph)((void) sizeof ((self->weights.graph == graph) ? 1 : 0), __extension__
({ if (self->weights.graph == graph) ; else __assert_fail
("self->weights.graph == graph", "ccv_cnnp_model_addons.c"
, 4067, __extension__ __PRETTY_FUNCTION__); }))
;
4068 const ccv_nnc_tensor_symbol_t weights = ccv_cnnp_model_get_symbol(super, self->weights);
4069 if (!self->reserves.graph)
4070 self->reserves = ccv_nnc_tensor_symbol_new(graph, output_params[3], "reserves");
4071 assert(self->reserves.graph == graph)((void) sizeof ((self->reserves.graph == graph) ? 1 : 0), __extension__
({ if (self->reserves.graph == graph) ; else __assert_fail
("self->reserves.graph == graph", "ccv_cnnp_model_addons.c"
, 4071, __extension__ __PRETTY_FUNCTION__); }))
;
4072 const ccv_nnc_tensor_symbol_t reserves = ccv_cnnp_model_get_symbol(super, self->reserves);
4073 const ccv_nnc_tensor_symbol_t mask = input_size == 2 ? inputs[1] : NO_TENSOR_SYMBOL(const ccv_nnc_tensor_symbol_t){.d = CCV_NNC_NO_TENSOR_SYMBOL
}
;
4074 self->lstm = ccv_nnc_graph_exec_symbol_new(graph, lstm, TENSOR_SYMBOL_LIST(inputs[0], mask, NO_TENSOR_SYMBOL, NO_TENSOR_SYMBOL, weights)(const ccv_nnc_tensor_symbol_t []){inputs[0], mask, (const ccv_nnc_tensor_symbol_t
){.d = CCV_NNC_NO_TENSOR_SYMBOL}, (const ccv_nnc_tensor_symbol_t
){.d = CCV_NNC_NO_TENSOR_SYMBOL}, weights}, (1 +1 +1 +1 +1 +1
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(outputs[0], NO_TENSOR_SYMBOL, NO_TENSOR_SYMBOL, reserves)(const ccv_nnc_tensor_symbol_t []){outputs[0], (const ccv_nnc_tensor_symbol_t
){.d = CCV_NNC_NO_TENSOR_SYMBOL}, (const ccv_nnc_tensor_symbol_t
){.d = CCV_NNC_NO_TENSOR_SYMBOL}, reserves}, (1 +1 +1 +1 +1 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, "lstm");
4075}
4076
4077static void _ccv_cnnp_lstm_init_states(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_cnnp_state_initializer_f initializer, void* const context)
4078{
4079 ccv_cnnp_model_lstm_t* const self = (ccv_cnnp_model_lstm_t*)super;
4080 if (self->weights.graph)
4081 {
4082 const float stdv = 1.0 / sqrt(self->params.rnn.hidden_size);
4083 initializer(context, CMD_RANDOM_UNIFORM_FORWARD(-stdv, stdv)ccv_nnc_cmd(CCV_NNC_RANDOM_UNIFORM_FORWARD, 0, (ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.blas={.a={-stdv, stdv}}}, 0)
, ccv_nnc_no_hint, 0, 0, self->weights);
4084 }
4085}
4086
4087static void _ccv_cnnp_lstm_add_to_parameter(ccv_cnnp_model_t* const super, const ccv_cnnp_add_to_array_f add_to_array, void* const parameters, const int is_trainable)
4088{
4089 ccv_cnnp_model_lstm_t* const self = (ccv_cnnp_model_lstm_t*)super;
4090 if (self->weights.graph)
4091 add_to_array(parameters, self->weights, is_trainable);
4092}
4093
4094static void _ccv_cnnp_lstm_set_is_test(ccv_cnnp_model_t* const super, const int is_test, const ccv_cnnp_cmd_updater_f updater, void* const context)
4095{
4096 ccv_cnnp_model_lstm_t* const self = (ccv_cnnp_model_lstm_t*)super;
4097 if (self->lstm.graph)
4098 {
4099 self->params.rnn.is_test = is_test;
4100 updater(context, self->lstm, ccv_nnc_cmd(CCV_NNC_LSTM_FORWARD, 0, self->params, 0), ccv_nnc_no_hint);
4101 }
4102}
4103
4104static ccv_cnnp_model_t* _ccv_cnnp_lstm_copy(const ccv_cnnp_model_t* const self, void* const context);
4105
4106static const ccv_cnnp_model_vtab_t ccv_cnnp_lstm_isa = {
4107 .build = _ccv_cnnp_lstm_build,
4108 .init_states = _ccv_cnnp_lstm_init_states,
4109 .add_to_parameter = _ccv_cnnp_lstm_add_to_parameter,
4110 .copy = _ccv_cnnp_lstm_copy,
4111 .set_is_test = _ccv_cnnp_lstm_set_is_test,
4112};
4113
4114ccv_cnnp_model_t* ccv_cnnp_lstm(const int masked, const int hidden_size, const int proj_size, const int num_layers, const int bias, const int batch_first, const int bidirectional, const float dropout, const int is_trainable, const char* const name)
4115{
4116 ccv_cnnp_model_lstm_t* const model_lstm = (ccv_cnnp_model_lstm_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_lstm_t));
4117 model_lstm->super.isa = &ccv_cnnp_lstm_isa;
4118 model_lstm->super.input_size = masked ? 2 : 1;
4119 model_lstm->super.outputs = &model_lstm->output;
4120 model_lstm->super.output_size = 1;
4121 model_lstm->super.is_trainable = is_trainable;
4122 ccv_cnnp_model_copy_name(&model_lstm->super, name);
4123 model_lstm->masked = masked;
4124 model_lstm->weights.d = CCV_NNC_NO_TENSOR_SYMBOL;
4125 model_lstm->weights.graph = 0;
4126 model_lstm->params.rnn.hidden_size = hidden_size;
4127 model_lstm->params.rnn.proj_size = proj_size;
4128 model_lstm->params.rnn.num_layers = num_layers;
4129 model_lstm->params.rnn.bias = bias;
4130 model_lstm->params.rnn.batch_first = batch_first;
4131 model_lstm->params.rnn.bidirectional = bidirectional;
4132 model_lstm->params.rnn.dropout = dropout;
4133 return (ccv_cnnp_model_t*)model_lstm;
4134}
4135
4136static ccv_cnnp_model_t* _ccv_cnnp_lstm_copy(const ccv_cnnp_model_t* const super, void* const context)
4137{
4138 const ccv_cnnp_model_lstm_t* const self = (const ccv_cnnp_model_lstm_t*)super;
4139 return ccv_cnnp_lstm(self->masked, self->params.rnn.hidden_size, self->params.rnn.proj_size, self->params.rnn.num_layers, self->params.rnn.bias, self->params.rnn.batch_first, self->params.rnn.bidirectional, self->params.rnn.dropout, self->super.is_trainable, self->super.name);
4140}
4141
4142/// MARK - Datatype conversion layer.
4143
4144typedef struct {
4145 ccv_cnnp_model_t super;
4146 ccv_nnc_tensor_symbol_t output;
4147 int datatype;
4148 int ref_to_last;
4149} ccv_cnnp_model_datatype_conversion_t;
4150
4151static void _ccv_cnnp_datatype_conversion_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
4152{
4153 ccv_cnnp_model_datatype_conversion_t* const self = (ccv_cnnp_model_datatype_conversion_t*)super;
4154 PRINT(CCV_CLI_VERBOSE, "[cnnp_datatype_conversion_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_datatype_conversion_build] -\n"); fflush(stdout
); } } while (0)
;
4155 ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
4156 if (self->ref_to_last)
4157 {
4158 assert(input_size > 1)((void) sizeof ((input_size > 1) ? 1 : 0), __extension__ (
{ if (input_size > 1) ; else __assert_fail ("input_size > 1"
, "ccv_cnnp_model_addons.c", 4158, __extension__ __PRETTY_FUNCTION__
); }))
;
4159 const ccv_nnc_tensor_param_t last_params = ccv_nnc_tensor_symbol_params(graph, inputs[input_size - 1]);
4160 params.datatype = last_params.datatype;
4161 } else
4162 params.datatype = self->datatype;
4163 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 4163, __extension__ __PRETTY_FUNCTION__
); }))
;
4164 outputs[0] = ccv_nnc_tensor_symbol_new(graph, params, 0);
4165 ccv_nnc_graph_exec_symbol_new(graph, CMD_DATATYPE_CONVERSION_FORWARD()ccv_nnc_cmd(CCV_NNC_DATATYPE_CONVERSION_FORWARD, 0, ccv_nnc_cmd_auto
, 0)
, inputs, output_size /* intentional */, outputs, output_size, 0);
4166}
4167
4168static ccv_cnnp_model_t* _ccv_cnnp_datatype_conversion_copy(const ccv_cnnp_model_t* const self, void* const context);
4169
4170static const ccv_cnnp_model_vtab_t ccv_cnnp_datatype_conversion_isa = {
4171 .build = _ccv_cnnp_datatype_conversion_build,
4172 .copy = _ccv_cnnp_datatype_conversion_copy,
4173};
4174
4175ccv_cnnp_model_t* ccv_cnnp_datatype_conversion(const int datatype, const int ref_to_last, const char* const name)
4176{
4177 ccv_cnnp_model_datatype_conversion_t* const model_datatype_conversion = (ccv_cnnp_model_datatype_conversion_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_datatype_conversion_t));
4178 model_datatype_conversion->super.isa = &ccv_cnnp_datatype_conversion_isa;
4179 model_datatype_conversion->super.input_size = 0;
4180 model_datatype_conversion->super.outputs = &model_datatype_conversion->output;
4181 model_datatype_conversion->super.output_size = 1;
4182 model_datatype_conversion->datatype = datatype;
4183 model_datatype_conversion->ref_to_last = ref_to_last;
4184 ccv_cnnp_model_copy_name(&model_datatype_conversion->super, name);
4185 return (ccv_cnnp_model_t*)model_datatype_conversion;
4186}
4187
4188static ccv_cnnp_model_t* _ccv_cnnp_datatype_conversion_copy(const ccv_cnnp_model_t* const super, void* const context)
4189{
4190 ccv_cnnp_model_datatype_conversion_t* const self = (ccv_cnnp_model_datatype_conversion_t*)super;
4191 return ccv_cnnp_datatype_conversion(self->datatype, self->ref_to_last, self->super.name);
4192}
4193
4194/// MARK - Clamp layer.
4195
4196typedef struct {
4197 ccv_cnnp_model_t super;
4198 ccv_nnc_tensor_symbol_t output;
4199 float min;
4200 float max;
4201} ccv_cnnp_model_clamp_t;
4202
4203static void _ccv_cnnp_clamp_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
4204{
4205 ccv_cnnp_model_clamp_t* const self = (ccv_cnnp_model_clamp_t*)super;
4206 PRINT(CCV_CLI_VERBOSE, "[cnnp_clamp_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_clamp_build] -\n"); fflush(stdout); } } while
(0)
;
4207 ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
4208 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 4208, __extension__ __PRETTY_FUNCTION__
); }))
;
4209 outputs[0] = ccv_nnc_tensor_symbol_new(graph, params, 0);
4210 ccv_nnc_graph_exec_symbol_new(graph, CMD_CLAMP_FORWARD(self->min, self->max)ccv_nnc_cmd(CCV_NNC_CLAMP_FORWARD, 0, (ccv_nnc_cmd_param_t){.
size={.dim={1,1,1}},.clamp={.min=self->min,.max=self->max
}}, 0)
, inputs, output_size /* intentional */, outputs, output_size, 0);
4211}
4212
4213static ccv_cnnp_model_t* _ccv_cnnp_clamp_copy(const ccv_cnnp_model_t* const self, void* const context);
4214
4215static const ccv_cnnp_model_vtab_t ccv_cnnp_clamp_isa = {
4216 .build = _ccv_cnnp_clamp_build,
4217 .copy = _ccv_cnnp_clamp_copy,
4218};
4219
4220ccv_cnnp_model_t* ccv_cnnp_clamp(const float min, const float max, const char* const name)
4221{
4222 ccv_cnnp_model_clamp_t* const model_clamp = (ccv_cnnp_model_clamp_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_clamp_t));
4223 model_clamp->super.isa = &ccv_cnnp_clamp_isa;
4224 model_clamp->super.input_size = 0;
4225 model_clamp->super.outputs = &model_clamp->output;
4226 model_clamp->super.output_size = 1;
4227 model_clamp->min = min;
4228 model_clamp->max = max;
4229 ccv_cnnp_model_copy_name(&model_clamp->super, name);
4230 return (ccv_cnnp_model_t*)model_clamp;
4231}
4232
4233static ccv_cnnp_model_t* _ccv_cnnp_clamp_copy(const ccv_cnnp_model_t* const super, void* const context)
4234{
4235 ccv_cnnp_model_clamp_t* const self = (ccv_cnnp_model_clamp_t*)super;
4236 return ccv_cnnp_clamp(self->min, self->max, self->super.name);
4237}
4238
4239// MARK - Parameter Layer
4240
4241typedef struct {
4242 ccv_cnnp_model_t super;
4243 float init_bound;
4244 ccv_nnc_tensor_symbol_t weights;
4245 ccv_nnc_tensor_param_t weights_params;
4246 ccv_nnc_tensor_symbol_t output;
4247} ccv_cnnp_model_parameter_t;
4248
4249static void _ccv_cnnp_parameter_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
4250{
4251 PRINT(CCV_CLI_VERBOSE, "[cnnp_parameter_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_parameter_build] -\n"); fflush(stdout); } } while
(0)
;
4252 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 4252, __extension__ __PRETTY_FUNCTION__
); }))
;
4253 ccv_cnnp_model_parameter_t* const self = (ccv_cnnp_model_parameter_t*)super;
4254 if (!self->weights.graph)
4255 self->weights = ccv_nnc_tensor_symbol_new(graph, self->weights_params, "weights");
4256 assert(self->weights.graph == graph)((void) sizeof ((self->weights.graph == graph) ? 1 : 0), __extension__
({ if (self->weights.graph == graph) ; else __assert_fail
("self->weights.graph == graph", "ccv_cnnp_model_addons.c"
, 4256, __extension__ __PRETTY_FUNCTION__); }))
;
4257 outputs[0] = ccv_cnnp_model_get_symbol(super, self->weights);
4258}
4259
4260static void _ccv_cnnp_parameter_init_states(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_cnnp_state_initializer_f initializer, void* const context)
4261{
4262 ccv_cnnp_model_parameter_t* const self = (ccv_cnnp_model_parameter_t*)super;
4263 if (self->init_bound > 0)
4264 initializer(context, CMD_RANDOM_UNIFORM_FORWARD(-self->init_bound, self->init_bound)ccv_nnc_cmd(CCV_NNC_RANDOM_UNIFORM_FORWARD, 0, (ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.blas={.a={-self->init_bound, self->
init_bound}}}, 0)
, ccv_nnc_no_hint, 0, 0, self->weights);
4265 else
4266 initializer(context, CMD_SET_FORWARD(0)ccv_nnc_cmd(CCV_NNC_SET_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={0,}}}, 0)
, ccv_nnc_no_hint, 0, 0, self->weights);
4267}
4268
4269static void _ccv_cnnp_parameter_add_to_parameter(ccv_cnnp_model_t* const super, const ccv_cnnp_add_to_array_f add_to_array, void* const parameters, const int is_trainable)
4270{
4271 ccv_cnnp_model_parameter_t* const self = (ccv_cnnp_model_parameter_t*)super;
4272 add_to_array(parameters, self->weights, is_trainable);
4273}
4274
4275static ccv_cnnp_model_t* _ccv_cnnp_parameter_copy(const ccv_cnnp_model_t* const super, void* const context);
4276
4277static const ccv_cnnp_model_vtab_t ccv_cnnp_parameter_isa = {
4278 .build = _ccv_cnnp_parameter_build,
4279 .init_states = _ccv_cnnp_parameter_init_states,
4280 .add_to_parameter = _ccv_cnnp_parameter_add_to_parameter,
4281 .copy = _ccv_cnnp_parameter_copy,
4282};
4283
4284ccv_cnnp_model_t* ccv_cnnp_parameter(const ccv_nnc_tensor_param_t params, const float init_bound, const int is_trainable, const char* const name)
4285{
4286 ccv_cnnp_model_parameter_t* const model_parameter = (ccv_cnnp_model_parameter_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_parameter_t));
4287 model_parameter->super.isa = &ccv_cnnp_parameter_isa;
4288 model_parameter->super.input_size = 0;
4289 model_parameter->super.outputs = &model_parameter->output;
4290 model_parameter->super.output_size = 1;
4291 model_parameter->super.is_trainable = is_trainable;
4292 ccv_cnnp_model_copy_name(&model_parameter->super, name);
4293 model_parameter->weights.d = CCV_NNC_NO_TENSOR_SYMBOL;
4294 model_parameter->weights.graph = 0;
4295 model_parameter->weights_params = params;
4296 return (ccv_cnnp_model_t*)model_parameter;
4297}
4298
4299static ccv_cnnp_model_t* _ccv_cnnp_parameter_copy(const ccv_cnnp_model_t* const super, void* const context)
4300{
4301 const ccv_cnnp_model_parameter_t* const self = (const ccv_cnnp_model_parameter_t*)super;
4302 return ccv_cnnp_parameter(self->weights_params, self->init_bound, self->super.is_trainable, self->super.name);
4303}
4304
4305// MARK - Scalar Layer
4306
4307typedef struct {
4308 ccv_cnnp_model_t super;
4309 int type;
4310 int format;
4311 int datatype;
4312 float value;
4313 ccv_nnc_tensor_symbol_t output;
4314} ccv_cnnp_model_scalar_t;
4315
4316static void _ccv_cnnp_scalar_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
4317{
4318 PRINT(CCV_CLI_VERBOSE, "[cnnp_scalar_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_scalar_build] -\n"); fflush(stdout); } } while
(0)
;
4319 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 4319, __extension__ __PRETTY_FUNCTION__
); }))
;
4320 ccv_cnnp_model_scalar_t* const self = (ccv_cnnp_model_scalar_t*)super;
4321 ccv_nnc_tensor_param_t params = {
4322 .type = self->type,
4323 .format = self->format,
4324 .datatype = self->datatype,
4325 .dim = {
4326 1
4327 }
4328 };
4329 if (input_size > 0)
4330 {
4331 ccv_nnc_tensor_param_t input_params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
4332 params.type = input_params.type;
4333 params.format = input_params.format;
4334 params.datatype = input_params.datatype;
4335 }
4336 outputs[0] = ccv_nnc_tensor_symbol_new(graph, params, 0);
4337 ccv_nnc_graph_exec_symbol_new(graph, CMD_SET_FORWARD(self->value)ccv_nnc_cmd(CCV_NNC_SET_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={self->value,}}}, 0)
, 0, 0, outputs, 1, 0);
4338}
4339
4340static ccv_cnnp_model_t* _ccv_cnnp_scalar_copy(const ccv_cnnp_model_t* const super, void* const context);
4341
4342static const ccv_cnnp_model_vtab_t ccv_cnnp_scalar_isa = {
4343 .build = _ccv_cnnp_scalar_build,
4344 .copy = _ccv_cnnp_scalar_copy,
4345};
4346
4347ccv_cnnp_model_t* ccv_cnnp_scalar(const int type, const int format, const int datatype, const float value, const char* const name)
4348{
4349 ccv_cnnp_model_scalar_t* const model_scalar = (ccv_cnnp_model_scalar_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_scalar_t));
4350 model_scalar->super.isa = &ccv_cnnp_scalar_isa;
4351 model_scalar->super.input_size = 0;
4352 model_scalar->super.outputs = &model_scalar->output;
4353 model_scalar->super.output_size = 1;
4354 ccv_cnnp_model_copy_name(&model_scalar->super, name);
4355 model_scalar->type = type;
4356 model_scalar->format = format;
4357 model_scalar->datatype = datatype;
4358 model_scalar->value = value;
4359 return (ccv_cnnp_model_t*)model_scalar;
4360}
4361
4362static ccv_cnnp_model_t* _ccv_cnnp_scalar_copy(const ccv_cnnp_model_t* const super, void* const context)
4363{
4364 const ccv_cnnp_model_scalar_t* const self = (const ccv_cnnp_model_scalar_t*)super;
4365 return ccv_cnnp_scalar(self->type, self->format, self->datatype, self->value, self->super.name);
4366}
4367
4368// MARK - Variable Layer
4369
4370typedef struct {
4371 ccv_cnnp_model_t super;
4372 ccv_nnc_tensor_param_t params;
4373 ccv_nnc_tensor_symbol_t output;
4374} ccv_cnnp_model_variable_t;
4375
4376static void _ccv_cnnp_variable_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
4377{
4378 PRINT(CCV_CLI_VERBOSE, "[cnnp_variable_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_variable_build] -\n"); fflush(stdout); } } while
(0)
;
4379 assert(input_size == 0)((void) sizeof ((input_size == 0) ? 1 : 0), __extension__ ({ if
(input_size == 0) ; else __assert_fail ("input_size == 0", "ccv_cnnp_model_addons.c"
, 4379, __extension__ __PRETTY_FUNCTION__); }))
;
4380 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 4380, __extension__ __PRETTY_FUNCTION__
); }))
;
4381 ccv_cnnp_model_variable_t* const self = (ccv_cnnp_model_variable_t*)super;
4382 outputs[0] = ccv_nnc_tensor_symbol_new(graph, self->params, 0);
4383}
4384
4385static ccv_cnnp_model_t* _ccv_cnnp_variable_copy(const ccv_cnnp_model_t* const super, void* const context);
4386
4387static const ccv_cnnp_model_vtab_t ccv_cnnp_variable_isa = {
4388 .build = _ccv_cnnp_variable_build,
4389 .copy = _ccv_cnnp_variable_copy,
4390};
4391
4392ccv_cnnp_model_t* ccv_cnnp_variable(const ccv_nnc_tensor_param_t params, const char* const name)
4393{
4394 ccv_cnnp_model_variable_t* const model_variable = (ccv_cnnp_model_variable_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_variable_t));
4395 model_variable->super.isa = &ccv_cnnp_variable_isa;
4396 model_variable->super.input_size = 0;
4397 model_variable->super.outputs = &model_variable->output;
4398 model_variable->super.output_size = 1;
4399 ccv_cnnp_model_copy_name(&model_variable->super, name);
4400 model_variable->params = params;
4401 return (ccv_cnnp_model_t*)model_variable;
4402}
4403
4404static ccv_cnnp_model_t* _ccv_cnnp_variable_copy(const ccv_cnnp_model_t* const super, void* const context)
4405{
4406 const ccv_cnnp_model_variable_t* const self = (const ccv_cnnp_model_variable_t*)super;
4407 return ccv_cnnp_variable(self->params, self->super.name);
4408}
4409
4410// MARK - Send Layer
4411
4412typedef struct {
4413 ccv_cnnp_model_t super;
4414 int device_id;
4415 ccv_nnc_tensor_symbol_t output;
4416} ccv_cnnp_model_send_t;
4417
4418static void _ccv_cnnp_send_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
4419{
4420 ccv_cnnp_model_send_t* const self = (ccv_cnnp_model_send_t*)super;
4421 PRINT(CCV_CLI_VERBOSE, "[cnnp_send_build] - device_id: %d\n", self->device_id)do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_send_build] - device_id: %d\n", self->device_id
); fflush(stdout); } } while (0)
;
4422 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 4422, __extension__ __PRETTY_FUNCTION__); }))
;
4423 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 4423, __extension__ __PRETTY_FUNCTION__
); }))
;
4424 ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
4425 params.type = (params.type & ~0x3) | CCV_TENSOR_GPU_MEMORY;
4426 CCV_TENSOR_SET_DEVICE_ID(params.type, self->device_id)(params.type) = (((params.type) & ~0xfff00) | (((self->
device_id) & 0xfff) << 8))
;
4427 outputs[0] = ccv_nnc_tensor_symbol_new(graph, params, 0);
4428 ccv_nnc_graph_exec_symbol_new(graph, CMD_DATA_TRANSFER_FORWARD()ccv_nnc_cmd(CCV_NNC_DATA_TRANSFER_FORWARD, 0, ccv_nnc_cmd_auto
, 0)
, inputs, 1, outputs, 1, "send");
4429}
4430
4431static ccv_cnnp_model_t* _ccv_cnnp_send_copy(const ccv_cnnp_model_t* const super, void* const context);
4432
4433static const ccv_cnnp_model_vtab_t ccv_cnnp_send_isa = {
4434 .build = _ccv_cnnp_send_build,
4435 .copy = _ccv_cnnp_send_copy,
4436};
4437
4438ccv_cnnp_model_t* ccv_cnnp_send(const int device_id, const char* const name)
4439{
4440 assert(device_id >= 0)((void) sizeof ((device_id >= 0) ? 1 : 0), __extension__ (
{ if (device_id >= 0) ; else __assert_fail ("device_id >= 0"
, "ccv_cnnp_model_addons.c", 4440, __extension__ __PRETTY_FUNCTION__
); }))
;
4441 ccv_cnnp_model_send_t* const model_send = (ccv_cnnp_model_send_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_send_t));
4442 model_send->super.isa = &ccv_cnnp_send_isa;
4443 model_send->super.input_size = 1;
4444 model_send->super.outputs = &model_send->output;
4445 model_send->super.output_size = 1;
4446 ccv_cnnp_model_copy_name(&model_send->super, name);
4447 model_send->device_id = device_id;
4448 return (ccv_cnnp_model_t*)model_send;
4449}
4450
4451static ccv_cnnp_model_t* _ccv_cnnp_send_copy(const ccv_cnnp_model_t* const super, void* const context)
4452{
4453 const ccv_cnnp_model_send_t* const self = (const ccv_cnnp_model_send_t*)super;
4454 return ccv_cnnp_send(self->device_id, self->super.name);
4455}
4456
4457// MARK - Move Layer
4458
4459typedef struct {
4460 ccv_cnnp_model_t super;
4461 ccv_nnc_tensor_symbol_t output;
4462} ccv_cnnp_model_move_t;
4463
4464static void _ccv_cnnp_move_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
4465{
4466 PRINT(CCV_CLI_VERBOSE, "[cnnp_move_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_move_build] -\n"); fflush(stdout); } } while
(0)
;
4467 assert(input_size == 2)((void) sizeof ((input_size == 2) ? 1 : 0), __extension__ ({ if
(input_size == 2) ; else __assert_fail ("input_size == 2", "ccv_cnnp_model_addons.c"
, 4467, __extension__ __PRETTY_FUNCTION__); }))
;
4468 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 4468, __extension__ __PRETTY_FUNCTION__
); }))
;
4469 outputs[0] = inputs[1];
4470 ccv_nnc_graph_exec_symbol_new(graph, CMD_FORMAT_TRANSFORM_FORWARD()ccv_nnc_cmd(CCV_NNC_FORMAT_TRANSFORM_FORWARD, 0, ccv_nnc_cmd_auto
, 0)
, inputs, 1, outputs, 1, "move");
4471}
4472
4473static ccv_cnnp_model_t* _ccv_cnnp_move_copy(const ccv_cnnp_model_t* const super, void* const context);
4474
4475static const ccv_cnnp_model_vtab_t ccv_cnnp_move_isa = {
4476 .build = _ccv_cnnp_move_build,
4477 .copy = _ccv_cnnp_move_copy,
4478};
4479
4480ccv_cnnp_model_t* ccv_cnnp_move(const char* const name)
4481{
4482 ccv_cnnp_model_move_t* const model_move = (ccv_cnnp_model_move_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_move_t));
4483 model_move->super.isa = &ccv_cnnp_move_isa;
4484 model_move->super.input_size = 2;
4485 model_move->super.outputs = &model_move->output;
4486 model_move->super.output_size = 1;
4487 ccv_cnnp_model_copy_name(&model_move->super, name);
4488 return (ccv_cnnp_model_t*)model_move;
4489}
4490
4491static ccv_cnnp_model_t* _ccv_cnnp_move_copy(const ccv_cnnp_model_t* const super, void* const context)
4492{
4493 const ccv_cnnp_model_move_t* const self = (const ccv_cnnp_model_move_t*)super;
4494 return ccv_cnnp_move(self->super.name);
4495}
4496
4497// MARK - "Making" Contiguous Layer
4498
4499typedef struct {
4500 ccv_cnnp_model_t super;
4501 ccv_nnc_tensor_symbol_t output;
4502} ccv_cnnp_model_contiguous_t;
4503
4504static void _ccv_cnnp_contiguous_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
4505{
4506 PRINT(CCV_CLI_VERBOSE, "[cnnp_contiguous_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_contiguous_build] -\n"); fflush(stdout); } }
while (0)
;
4507 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 4507, __extension__ __PRETTY_FUNCTION__); }))
;
4508 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 4508, __extension__ __PRETTY_FUNCTION__
); }))
;
4509 ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
4510 ccv_nnc_tensor_symbol_t to = ccv_nnc_tensor_symbol_alias_to(graph, inputs[0]);
4511 if (to.d == CCV_NNC_NO_TENSOR_SYMBOL) // If we are not reshape an alias, it is straightforward.
4512 {
4513 outputs[0] = inputs[0];
4514 return;
4515 }
4516 // Otherwise, we need to check its stride to know if it is contiguous.
4517 int old_stride[CCV_NNC_MAX_DIM_ALLOC(12)];
4518 ccv_nnc_tensor_symbol_alias_params(graph, inputs[0], 0, old_stride);
4519 // We identify permute by checking if the stride is not in descending order.
4520 // This also covered "permute" through reshape, rather than using ccv_cnnp_permute directly.
4521 if (ccv_nnc_is_tensor_stride_packed(old_stride, params.dim))
4522 {
4523 outputs[0] = inputs[0];
4524 return;
4525 }
4526 outputs[0] = ccv_nnc_tensor_symbol_new(graph, params, 0);
4527 ccv_nnc_graph_exec_symbol_t make_contiguous = ccv_nnc_graph_exec_symbol_new(graph, CMD_FORMAT_TRANSFORM_FORWARD()ccv_nnc_cmd(CCV_NNC_FORMAT_TRANSFORM_FORWARD, 0, ccv_nnc_cmd_auto
, 0)
, inputs, 1, outputs, 1, "contiguous");
4528 ccv_nnc_graph_exec_symbol_set_flags(graph, make_contiguous, CCV_NNC_GRAPH_EXEC_DISABLE_OPT);
4529}
4530
4531static ccv_cnnp_model_t* _ccv_cnnp_contiguous_copy(const ccv_cnnp_model_t* const super, void* const context);
4532
4533static const ccv_cnnp_model_vtab_t ccv_cnnp_contiguous_isa = {
4534 .build = _ccv_cnnp_contiguous_build,
4535 .copy = _ccv_cnnp_contiguous_copy,
4536};
4537
4538ccv_cnnp_model_t* ccv_cnnp_contiguous(const char* const name)
4539{
4540 ccv_cnnp_model_contiguous_t* const model_contiguous = (ccv_cnnp_model_contiguous_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_contiguous_t));
4541 model_contiguous->super.isa = &ccv_cnnp_contiguous_isa;
4542 model_contiguous->super.input_size = 1;
4543 model_contiguous->super.outputs = &model_contiguous->output;
4544 model_contiguous->super.output_size = 1;
4545 ccv_cnnp_model_copy_name(&model_contiguous->super, name);
4546 return (ccv_cnnp_model_t*)model_contiguous;
4547}
4548
4549static ccv_cnnp_model_t* _ccv_cnnp_contiguous_copy(const ccv_cnnp_model_t* const super, void* const context)
4550{
4551 const ccv_cnnp_model_contiguous_t* const self = (const ccv_cnnp_model_contiguous_t*)super;
4552 return ccv_cnnp_contiguous(self->super.name);
4553}
4554
4555// MARK - "Making" Copy Layer
4556
4557typedef struct {
4558 ccv_cnnp_model_t super;
4559 ccv_nnc_tensor_symbol_t output;
4560} ccv_cnnp_model_copy_t;
4561
4562static void _ccv_cnnp_copy_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
4563{
4564 PRINT(CCV_CLI_VERBOSE, "[cnnp_copy_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_copy_build] -\n"); fflush(stdout); } } while
(0)
;
4565 assert(input_size == 1)((void) sizeof ((input_size == 1) ? 1 : 0), __extension__ ({ if
(input_size == 1) ; else __assert_fail ("input_size == 1", "ccv_cnnp_model_addons.c"
, 4565, __extension__ __PRETTY_FUNCTION__); }))
;
4566 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 4566, __extension__ __PRETTY_FUNCTION__
); }))
;
4567 ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
4568 ccv_nnc_tensor_symbol_t to = ccv_nnc_tensor_symbol_alias_to(graph, inputs[0]);
4569 if (to.d == CCV_NNC_NO_TENSOR_SYMBOL) // If we are not reshape an alias, it is straightforward.
4570 {
4571 outputs[0] = inputs[0];
4572 return;
4573 }
4574 outputs[0] = ccv_nnc_tensor_symbol_new(graph, params, 0);
4575 ccv_nnc_graph_exec_symbol_t make_contiguous = ccv_nnc_graph_exec_symbol_new(graph, CMD_FORMAT_TRANSFORM_FORWARD()ccv_nnc_cmd(CCV_NNC_FORMAT_TRANSFORM_FORWARD, 0, ccv_nnc_cmd_auto
, 0)
, inputs, 1, outputs, 1, "contiguous");
4576 ccv_nnc_graph_exec_symbol_set_flags(graph, make_contiguous, CCV_NNC_GRAPH_EXEC_DISABLE_OPT);
4577}
4578
4579static ccv_cnnp_model_t* _ccv_cnnp_copy_copy(const ccv_cnnp_model_t* const super, void* const context);
4580
4581static const ccv_cnnp_model_vtab_t ccv_cnnp_copy_isa = {
4582 .build = _ccv_cnnp_copy_build,
4583 .copy = _ccv_cnnp_copy_copy,
4584};
4585
4586ccv_cnnp_model_t* ccv_cnnp_copy(const char* const name)
4587{
4588 ccv_cnnp_model_copy_t* const model_copy = (ccv_cnnp_model_copy_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_copy_t));
4589 model_copy->super.isa = &ccv_cnnp_copy_isa;
4590 model_copy->super.input_size = 1;
4591 model_copy->super.outputs = &model_copy->output;
4592 model_copy->super.output_size = 1;
4593 ccv_cnnp_model_copy_name(&model_copy->super, name);
4594 return (ccv_cnnp_model_t*)model_copy;
4595}
4596
4597static ccv_cnnp_model_t* _ccv_cnnp_copy_copy(const ccv_cnnp_model_t* const super, void* const context)
4598{
4599 const ccv_cnnp_model_copy_t* const self = (const ccv_cnnp_model_copy_t*)super;
4600 return ccv_cnnp_copy(self->super.name);
4601}
4602
4603// MARK - All-To-All Layer
4604
4605typedef struct {
4606 ccv_cnnp_model_t super;
4607 int axis;
4608 ccv_nnc_tensor_symbol_t outputs[1];
4609} ccv_cnnp_model_all_to_all_t;
4610
4611static void _ccv_cnnp_all_to_all_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
4612{
4613 ccv_cnnp_model_all_to_all_t* const self = (ccv_cnnp_model_all_to_all_t*)super;
4614 PRINT(CCV_CLI_VERBOSE, "[cnnp_all_to_all_build] - axis: %d\n", self->axis)do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_all_to_all_build] - axis: %d\n", self->axis
); fflush(stdout); } } while (0)
;
4615 assert(input_size == self->super.input_size)((void) sizeof ((input_size == self->super.input_size) ? 1
: 0), __extension__ ({ if (input_size == self->super.input_size
) ; else __assert_fail ("input_size == self->super.input_size"
, "ccv_cnnp_model_addons.c", 4615, __extension__ __PRETTY_FUNCTION__
); }))
;
4616 assert(output_size == self->super.output_size)((void) sizeof ((output_size == self->super.output_size) ?
1 : 0), __extension__ ({ if (output_size == self->super.output_size
) ; else __assert_fail ("output_size == self->super.output_size"
, "ccv_cnnp_model_addons.c", 4616, __extension__ __PRETTY_FUNCTION__
); }))
;
4617 assert(input_size == output_size)((void) sizeof ((input_size == output_size) ? 1 : 0), __extension__
({ if (input_size == output_size) ; else __assert_fail ("input_size == output_size"
, "ccv_cnnp_model_addons.c", 4617, __extension__ __PRETTY_FUNCTION__
); }))
;
4618 assert(input_size > 0)((void) sizeof ((input_size > 0) ? 1 : 0), __extension__ (
{ if (input_size > 0) ; else __assert_fail ("input_size > 0"
, "ccv_cnnp_model_addons.c", 4618, __extension__ __PRETTY_FUNCTION__
); }))
;
4619 const ccv_nnc_tensor_param_t input_params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
4620 const int nd = ccv_nnc_tensor_nd(input_params.dim);
4621 assert(self->axis >= 0 && self->axis < nd)((void) sizeof ((self->axis >= 0 && self->axis
< nd) ? 1 : 0), __extension__ ({ if (self->axis >= 0
&& self->axis < nd) ; else __assert_fail ("self->axis >= 0 && self->axis < nd"
, "ccv_cnnp_model_addons.c", 4621, __extension__ __PRETTY_FUNCTION__
); }))
;
4622 assert(input_params.dim[self->axis] % input_size == 0)((void) sizeof ((input_params.dim[self->axis] % input_size
== 0) ? 1 : 0), __extension__ ({ if (input_params.dim[self->
axis] % input_size == 0) ; else __assert_fail ("input_params.dim[self->axis] % input_size == 0"
, "ccv_cnnp_model_addons.c", 4622, __extension__ __PRETTY_FUNCTION__
); }))
;
4623 int i;
4624 for (i = 0; i < input_size; i++)
4625 {
4626 const ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[i]);
4627 assert(params.format == input_params.format)((void) sizeof ((params.format == input_params.format) ? 1 : 0
), __extension__ ({ if (params.format == input_params.format)
; else __assert_fail ("params.format == input_params.format"
, "ccv_cnnp_model_addons.c", 4627, __extension__ __PRETTY_FUNCTION__
); }))
;
4628 assert(params.datatype == input_params.datatype)((void) sizeof ((params.datatype == input_params.datatype) ? 1
: 0), __extension__ ({ if (params.datatype == input_params.datatype
) ; else __assert_fail ("params.datatype == input_params.datatype"
, "ccv_cnnp_model_addons.c", 4628, __extension__ __PRETTY_FUNCTION__
); }))
;
4629 assert(CCV_TENSOR_GET_MEMORY(params.type) == CCV_TENSOR_GET_MEMORY(input_params.type))((void) sizeof ((((params.type) & 0x3) == ((input_params.
type) & 0x3)) ? 1 : 0), __extension__ ({ if (((params.type
) & 0x3) == ((input_params.type) & 0x3)) ; else __assert_fail
("CCV_TENSOR_GET_MEMORY(params.type) == CCV_TENSOR_GET_MEMORY(input_params.type)"
, "ccv_cnnp_model_addons.c", 4629, __extension__ __PRETTY_FUNCTION__
); }))
;
4630 assert(memcmp(params.dim, input_params.dim, sizeof(input_params.dim)) == 0)((void) sizeof ((memcmp(params.dim, input_params.dim, sizeof(
input_params.dim)) == 0) ? 1 : 0), __extension__ ({ if (memcmp
(params.dim, input_params.dim, sizeof(input_params.dim)) == 0
) ; else __assert_fail ("memcmp(params.dim, input_params.dim, sizeof(input_params.dim)) == 0"
, "ccv_cnnp_model_addons.c", 4630, __extension__ __PRETTY_FUNCTION__
); }))
;
4631 outputs[i] = ccv_nnc_tensor_symbol_new(graph, params, 0);
4632 }
4633 ccv_nnc_graph_exec_symbol_new(graph, CMD_COMM_ALL_TO_ALL_FORWARD(self->axis)ccv_nnc_cmd(CCV_NNC_COMM_ALL_TO_ALL_FORWARD, 0, ((ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.all_to_all={.axis=self->axis}}), 0
)
, inputs, input_size, outputs, output_size, "all_to_all");
4634}
4635
4636static ccv_cnnp_model_t* _ccv_cnnp_all_to_all_copy(const ccv_cnnp_model_t* const super, void* const context);
4637
4638static const ccv_cnnp_model_vtab_t ccv_cnnp_all_to_all_isa = {
4639 .build = _ccv_cnnp_all_to_all_build,
4640 .copy = _ccv_cnnp_all_to_all_copy,
4641};
4642
4643ccv_cnnp_model_t* ccv_cnnp_all_to_all(const int count, const int axis, const char* const name)
4644{
4645 assert(count > 0)((void) sizeof ((count > 0) ? 1 : 0), __extension__ ({ if (
count > 0) ; else __assert_fail ("count > 0", "ccv_cnnp_model_addons.c"
, 4645, __extension__ __PRETTY_FUNCTION__); }))
;
4646 assert(axis >= 0)((void) sizeof ((axis >= 0) ? 1 : 0), __extension__ ({ if (
axis >= 0) ; else __assert_fail ("axis >= 0", "ccv_cnnp_model_addons.c"
, 4646, __extension__ __PRETTY_FUNCTION__); }))
;
4647 ccv_cnnp_model_all_to_all_t* const model_all_to_all = (ccv_cnnp_model_all_to_all_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_all_to_all_t) + sizeof(ccv_nnc_tensor_symbol_t) * (count - 1));
4648 model_all_to_all->super.isa = &ccv_cnnp_all_to_all_isa;
4649 model_all_to_all->super.input_size = count;
4650 model_all_to_all->super.outputs = model_all_to_all->outputs;
4651 model_all_to_all->super.output_size = count;
4652 model_all_to_all->axis = axis;
4653 ccv_cnnp_model_copy_name(&model_all_to_all->super, name);
4654 return (ccv_cnnp_model_t*)model_all_to_all;
4655}
4656
4657static ccv_cnnp_model_t* _ccv_cnnp_all_to_all_copy(const ccv_cnnp_model_t* const super, void* const context)
4658{
4659 const ccv_cnnp_model_all_to_all_t* const self = (const ccv_cnnp_model_all_to_all_t*)super;
4660 return ccv_cnnp_all_to_all(self->super.output_size, self->axis, self->super.name);
4661}
4662
4663// MARK - Scaled-Dot Product Attention Layer
4664
4665typedef struct {
4666 ccv_cnnp_model_t super;
4667 ccv_nnc_tensor_symbol_t output;
4668 ccv_nnc_tensor_symbol_t weights;
4669 ccv_nnc_tensor_symbol_t bias;
4670 float scale;
4671 int is_causal;
4672 int has_attn_mask;
4673 int is_varlen;
4674 int max_seqlen_q;
4675 int max_seqlen_kv;
4676 int flags;
4677 int fused_unify_head_weights;
4678 int no_bias;
4679} ccv_cnnp_model_scaled_dot_product_attention_t;
4680
4681static void _ccv_cnnp_scaled_dot_product_attention_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
4682{
4683 PRINT(CCV_CLI_VERBOSE, "[cnnp_scaled_dot_product_attention_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_scaled_dot_product_attention_build] -\n"); fflush
(stdout); } } while (0)
;
4684 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 4684, __extension__ __PRETTY_FUNCTION__
); }))
;
4685 ccv_cnnp_model_scaled_dot_product_attention_t* const self = (ccv_cnnp_model_scaled_dot_product_attention_t*)super;
4686 assert(input_size == (self->is_varlen ? 5 : (self->has_attn_mask ? 4 : 3)))((void) sizeof ((input_size == (self->is_varlen ? 5 : (self
->has_attn_mask ? 4 : 3))) ? 1 : 0), __extension__ ({ if (
input_size == (self->is_varlen ? 5 : (self->has_attn_mask
? 4 : 3))) ; else __assert_fail ("input_size == (self->is_varlen ? 5 : (self->has_attn_mask ? 4 : 3))"
, "ccv_cnnp_model_addons.c", 4686, __extension__ __PRETTY_FUNCTION__
); }))
;
4687 assert(!self->is_varlen || !self->has_attn_mask)((void) sizeof ((!self->is_varlen || !self->has_attn_mask
) ? 1 : 0), __extension__ ({ if (!self->is_varlen || !self
->has_attn_mask) ; else __assert_fail ("!self->is_varlen || !self->has_attn_mask"
, "ccv_cnnp_model_addons.c", 4687, __extension__ __PRETTY_FUNCTION__
); }))
;
4688 assert(!self->is_varlen || !self->fused_unify_head_weights)((void) sizeof ((!self->is_varlen || !self->fused_unify_head_weights
) ? 1 : 0), __extension__ ({ if (!self->is_varlen || !self
->fused_unify_head_weights) ; else __assert_fail ("!self->is_varlen || !self->fused_unify_head_weights"
, "ccv_cnnp_model_addons.c", 4688, __extension__ __PRETTY_FUNCTION__
); }))
;
4689 const ccv_nnc_tensor_param_t q_params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
4690 const ccv_nnc_tensor_param_t k_params = ccv_nnc_tensor_symbol_params(graph, inputs[1]);
4691 const ccv_nnc_tensor_param_t v_params = ccv_nnc_tensor_symbol_params(graph, inputs[2]);
4692 const ccv_nnc_tensor_param_t q_seq_offsets_params = self->is_varlen ? ccv_nnc_tensor_symbol_params(graph, inputs[3]) : (ccv_nnc_tensor_param_t){};
4693 const ccv_nnc_tensor_param_t kv_seq_offsets_params = self->is_varlen ? ccv_nnc_tensor_symbol_params(graph, inputs[4]) : (ccv_nnc_tensor_param_t){};
4694 const int v_nd = ccv_nnc_tensor_nd(v_params.dim);
4695 assert(v_nd == 3 || v_nd == 4)((void) sizeof ((v_nd == 3 || v_nd == 4) ? 1 : 0), __extension__
({ if (v_nd == 3 || v_nd == 4) ; else __assert_fail ("v_nd == 3 || v_nd == 4"
, "ccv_cnnp_model_addons.c", 4695, __extension__ __PRETTY_FUNCTION__
); }))
;
4696 const int hEv = (v_nd == 3 ? 1 : v_params.dim[2]) * v_params.dim[v_nd - 1];
4697 ccv_nnc_tensor_param_t weights_params = q_params;
4698 memset(weights_params.dim, 0, sizeof(weights_params.dim));
4699 weights_params.dim[0] = hEv;
4700 weights_params.dim[1] = hEv;
4701 ccv_nnc_tensor_param_t bias_params = q_params;
4702 memset(bias_params.dim, 0, sizeof(bias_params.dim));
4703 bias_params.dim[0] = hEv;
4704 ccv_nnc_cmd_t cmd = {0};
4705 cmd.cmd = CCV_NNC_SCALED_DOT_PRODUCT_ATTENTION_FORWARD;
4706 cmd.info.scaled_dot_product_attention.scale = self->scale;
4707 cmd.info.scaled_dot_product_attention.is_causal = self->is_causal;
4708 cmd.info.scaled_dot_product_attention.is_varlen = self->is_varlen;
4709 cmd.info.scaled_dot_product_attention.max_seqlen_q = self->max_seqlen_q;
4710 cmd.info.scaled_dot_product_attention.max_seqlen_kv = self->max_seqlen_kv;
4711 cmd.info.scaled_dot_product_attention.flags = self->flags;
4712 ccv_nnc_tensor_param_t output_params[3];
4713 ccv_nnc_tensor_symbol_t output;
4714 ccv_nnc_tensor_symbol_t saved_softmax_lse;
4715 ccv_nnc_tensor_symbol_t saved_v_proj = NO_TENSOR_SYMBOL(const ccv_nnc_tensor_symbol_t){.d = CCV_NNC_NO_TENSOR_SYMBOL
}
;
4716 ccv_nnc_tensor_symbol_t attn_mask = NO_TENSOR_SYMBOL(const ccv_nnc_tensor_symbol_t){.d = CCV_NNC_NO_TENSOR_SYMBOL
}
;
4717 ccv_nnc_tensor_symbol_t weights = NO_TENSOR_SYMBOL(const ccv_nnc_tensor_symbol_t){.d = CCV_NNC_NO_TENSOR_SYMBOL
}
;
4718 ccv_nnc_tensor_symbol_t bias = NO_TENSOR_SYMBOL(const ccv_nnc_tensor_symbol_t){.d = CCV_NNC_NO_TENSOR_SYMBOL
}
;
4719 if (self->has_attn_mask)
4720 attn_mask = inputs[3];
4721 if (self->is_varlen)
4722 {
4723 ccv_nnc_hint_tensor_auto(cmd, (ccv_nnc_tensor_param_t []){
4724 q_params,
4725 k_params,
4726 v_params,
4727 (ccv_nnc_tensor_param_t){},
4728 (ccv_nnc_tensor_param_t){},
4729 (ccv_nnc_tensor_param_t){},
4730 q_seq_offsets_params,
4731 kv_seq_offsets_params,
4732 }, 8, ccv_nnc_no_hint, output_params, 2);
4733 output = ccv_nnc_tensor_symbol_new(graph, output_params[0], 0);
4734 saved_softmax_lse = ccv_nnc_tensor_symbol_new(graph, output_params[1], 0);
4735 ccv_nnc_graph_exec_symbol_new(graph, cmd, TENSOR_SYMBOL_LIST(inputs[0], inputs[1], inputs[2], NO_TENSOR_SYMBOL, NO_TENSOR_SYMBOL, NO_TENSOR_SYMBOL, inputs[3], inputs[4])(const ccv_nnc_tensor_symbol_t []){inputs[0], inputs[1], inputs
[2], (const ccv_nnc_tensor_symbol_t){.d = CCV_NNC_NO_TENSOR_SYMBOL
}, (const ccv_nnc_tensor_symbol_t){.d = CCV_NNC_NO_TENSOR_SYMBOL
}, (const ccv_nnc_tensor_symbol_t){.d = CCV_NNC_NO_TENSOR_SYMBOL
}, inputs[3], inputs[4]}, (1 +1 +1 +1 +1 +1 +1 +1 +1 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(output, saved_softmax_lse, saved_v_proj)(const ccv_nnc_tensor_symbol_t []){output, saved_softmax_lse,
saved_v_proj}, (1 +1 +1 +1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 -1)
, "scaled_dot_product_attention");
4736 } else if (self->fused_unify_head_weights)
4737 {
4738 if (!self->weights.graph)
4739 self->weights = ccv_nnc_tensor_symbol_new(graph, weights_params, "weights");
4740 assert(self->weights.graph == graph)((void) sizeof ((self->weights.graph == graph) ? 1 : 0), __extension__
({ if (self->weights.graph == graph) ; else __assert_fail
("self->weights.graph == graph", "ccv_cnnp_model_addons.c"
, 4740, __extension__ __PRETTY_FUNCTION__); }))
;
4741 weights = ccv_cnnp_model_get_symbol(super, self->weights);
4742 if (!self->no_bias)
4743 {
4744 if (!self->bias.graph)
4745 self->bias = ccv_nnc_tensor_symbol_new(graph, bias_params, "bias");
4746 assert(self->bias.graph == graph)((void) sizeof ((self->bias.graph == graph) ? 1 : 0), __extension__
({ if (self->bias.graph == graph) ; else __assert_fail ("self->bias.graph == graph"
, "ccv_cnnp_model_addons.c", 4746, __extension__ __PRETTY_FUNCTION__
); }))
;
4747 bias = ccv_cnnp_model_get_symbol(super, self->bias);
4748 }
4749 ccv_nnc_hint_tensor_auto(cmd, (ccv_nnc_tensor_param_t []){
4750 q_params,
4751 k_params,
4752 v_params,
4753 (ccv_nnc_tensor_param_t){},
4754 weights_params,
4755 bias_params,
4756 }, 6, ccv_nnc_no_hint, output_params, 3);
4757 output = ccv_nnc_tensor_symbol_new(graph, output_params[0], 0);
4758 saved_softmax_lse = ccv_nnc_tensor_symbol_new(graph, output_params[1], 0);
4759 saved_v_proj = ccv_nnc_tensor_symbol_new(graph, output_params[2], 0);
4760 ccv_nnc_graph_exec_symbol_new(graph, cmd, TENSOR_SYMBOL_LIST(inputs[0], inputs[1], inputs[2], attn_mask, weights, bias)(const ccv_nnc_tensor_symbol_t []){inputs[0], inputs[1], inputs
[2], attn_mask, weights, bias}, (1 +1 +1 +1 +1 +1 +1 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(output, saved_softmax_lse, saved_v_proj)(const ccv_nnc_tensor_symbol_t []){output, saved_softmax_lse,
saved_v_proj}, (1 +1 +1 +1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 -1)
, "scaled_dot_product_attention");
4761 } else {
4762 ccv_nnc_hint_tensor_auto(cmd, (ccv_nnc_tensor_param_t []){
4763 q_params,
4764 k_params,
4765 v_params,
4766 }, 3, ccv_nnc_no_hint, output_params, 2);
4767 output = ccv_nnc_tensor_symbol_new(graph, output_params[0], 0);
4768 saved_softmax_lse = ccv_nnc_tensor_symbol_new(graph, output_params[1], 0);
4769 ccv_nnc_graph_exec_symbol_new(graph, cmd, TENSOR_SYMBOL_LIST(inputs[0], inputs[1], inputs[2], attn_mask, weights, bias)(const ccv_nnc_tensor_symbol_t []){inputs[0], inputs[1], inputs
[2], attn_mask, weights, bias}, (1 +1 +1 +1 +1 +1 +1 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(output, saved_softmax_lse, saved_v_proj)(const ccv_nnc_tensor_symbol_t []){output, saved_softmax_lse,
saved_v_proj}, (1 +1 +1 +1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 -1)
, "scaled_dot_product_attention");
4770 }
4771 outputs[0] = output;
4772}
4773
4774static void _ccv_cnnp_scaled_dot_product_attention_init_states(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_cnnp_state_initializer_f initializer, void* const context)
4775{
4776 ccv_cnnp_model_scaled_dot_product_attention_t* const self = (ccv_cnnp_model_scaled_dot_product_attention_t*)super;
4777 if (self->weights.graph)
4778 {
4779 assert(self->fused_unify_head_weights)((void) sizeof ((self->fused_unify_head_weights) ? 1 : 0),
__extension__ ({ if (self->fused_unify_head_weights) ; else
__assert_fail ("self->fused_unify_head_weights", "ccv_cnnp_model_addons.c"
, 4779, __extension__ __PRETTY_FUNCTION__); }))
;
4780 const ccv_nnc_tensor_param_t weight_params = ccv_nnc_tensor_symbol_params(graph, self->weights);
4781 const int c = weight_params.dim[1];
4782 const float std = sqrtf(2) / sqrtf(c);
4783 const float bound = sqrtf(3) * std;
4784 initializer(context, CMD_RANDOM_UNIFORM_FORWARD(-bound, bound)ccv_nnc_cmd(CCV_NNC_RANDOM_UNIFORM_FORWARD, 0, (ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.blas={.a={-bound, bound}}}, 0)
, ccv_nnc_no_hint, 0, 0, self->weights);
4785 if (self->bias.graph)
4786 initializer(context, CMD_SET_FORWARD(0)ccv_nnc_cmd(CCV_NNC_SET_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={0,}}}, 0)
, ccv_nnc_no_hint, 0, 0, self->bias);
4787 }
4788}
4789
4790static void _ccv_cnnp_scaled_dot_product_attention_add_to_parameter(ccv_cnnp_model_t* const super, const ccv_cnnp_add_to_array_f add_to_array, void* const parameters, const int is_trainable)
4791{
4792 ccv_cnnp_model_scaled_dot_product_attention_t* const self = (ccv_cnnp_model_scaled_dot_product_attention_t*)super;
4793 if (self->weights.graph)
4794 {
4795 assert(self->fused_unify_head_weights)((void) sizeof ((self->fused_unify_head_weights) ? 1 : 0),
__extension__ ({ if (self->fused_unify_head_weights) ; else
__assert_fail ("self->fused_unify_head_weights", "ccv_cnnp_model_addons.c"
, 4795, __extension__ __PRETTY_FUNCTION__); }))
;
4796 add_to_array(parameters, self->weights, is_trainable);
4797 if (self->bias.graph)
4798 add_to_array(parameters, self->bias, is_trainable);
4799 }
4800}
4801
4802static ccv_cnnp_model_t* _ccv_cnnp_scaled_dot_product_attention_copy(const ccv_cnnp_model_t* const super, void* const context);
4803
4804static const ccv_cnnp_model_vtab_t ccv_cnnp_scaled_dot_product_attention_isa = {
4805 .build = _ccv_cnnp_scaled_dot_product_attention_build,
4806 .copy = _ccv_cnnp_scaled_dot_product_attention_copy,
4807};
4808
4809static const ccv_cnnp_model_vtab_t ccv_cnnp_scaled_dot_product_attention_fused_isa = {
4810 .build = _ccv_cnnp_scaled_dot_product_attention_build,
4811 .init_states = _ccv_cnnp_scaled_dot_product_attention_init_states,
4812 .add_to_parameter = _ccv_cnnp_scaled_dot_product_attention_add_to_parameter,
4813 .copy = _ccv_cnnp_scaled_dot_product_attention_copy,
4814};
4815
4816ccv_cnnp_model_t* ccv_cnnp_scaled_dot_product_attention(const float scale, const int is_causal, const int has_attn_mask, const int is_varlen, const int max_seqlen_q, const int max_seqlen_kv, const int flags, const int fused_unify_head_weights, const int no_bias, const int is_trainable, const char* const name)
4817{
4818 assert(!is_varlen || !has_attn_mask)((void) sizeof ((!is_varlen || !has_attn_mask) ? 1 : 0), __extension__
({ if (!is_varlen || !has_attn_mask) ; else __assert_fail ("!is_varlen || !has_attn_mask"
, "ccv_cnnp_model_addons.c", 4818, __extension__ __PRETTY_FUNCTION__
); }))
;
4819 assert(!is_varlen || !fused_unify_head_weights)((void) sizeof ((!is_varlen || !fused_unify_head_weights) ? 1
: 0), __extension__ ({ if (!is_varlen || !fused_unify_head_weights
) ; else __assert_fail ("!is_varlen || !fused_unify_head_weights"
, "ccv_cnnp_model_addons.c", 4819, __extension__ __PRETTY_FUNCTION__
); }))
;
4820 ccv_cnnp_model_scaled_dot_product_attention_t* const model_scaled_dot_product_attention = (ccv_cnnp_model_scaled_dot_product_attention_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_scaled_dot_product_attention_t));
4821 model_scaled_dot_product_attention->super.isa = fused_unify_head_weights ? &ccv_cnnp_scaled_dot_product_attention_fused_isa : &ccv_cnnp_scaled_dot_product_attention_isa;
4822 model_scaled_dot_product_attention->super.input_size = is_varlen ? 5 : (has_attn_mask ? 4 : 3);
4823 model_scaled_dot_product_attention->super.outputs = &model_scaled_dot_product_attention->output;
4824 model_scaled_dot_product_attention->super.output_size = 1;
4825 model_scaled_dot_product_attention->super.is_trainable = is_trainable;
4826 ccv_cnnp_model_copy_name(&model_scaled_dot_product_attention->super, name);
4827 model_scaled_dot_product_attention->weights.d = CCV_NNC_NO_TENSOR_SYMBOL;
4828 model_scaled_dot_product_attention->weights.graph = 0;
4829 model_scaled_dot_product_attention->bias.d = CCV_NNC_NO_TENSOR_SYMBOL;
4830 model_scaled_dot_product_attention->bias.graph = 0;
4831 model_scaled_dot_product_attention->scale = scale;
4832 model_scaled_dot_product_attention->is_causal = is_causal;
4833 model_scaled_dot_product_attention->has_attn_mask = has_attn_mask;
4834 model_scaled_dot_product_attention->is_varlen = is_varlen;
4835 model_scaled_dot_product_attention->max_seqlen_q = max_seqlen_q;
4836 model_scaled_dot_product_attention->max_seqlen_kv = max_seqlen_kv;
4837 model_scaled_dot_product_attention->flags = flags;
4838 model_scaled_dot_product_attention->fused_unify_head_weights = fused_unify_head_weights;
4839 model_scaled_dot_product_attention->no_bias = no_bias;
4840 return (ccv_cnnp_model_t*)model_scaled_dot_product_attention;
4841}
4842
4843static ccv_cnnp_model_t* _ccv_cnnp_scaled_dot_product_attention_copy(const ccv_cnnp_model_t* const super, void* const context)
4844{
4845 const ccv_cnnp_model_scaled_dot_product_attention_t* const self = (const ccv_cnnp_model_scaled_dot_product_attention_t*)super;
4846 return ccv_cnnp_scaled_dot_product_attention(self->scale, self->is_causal, self->has_attn_mask, self->is_varlen, self->max_seqlen_q, self->max_seqlen_kv, self->flags, self->fused_unify_head_weights, self->no_bias, self->super.is_trainable, self->super.name);
4847}
4848
4849// MARK - Debug Layer
4850
4851typedef struct {
4852 ccv_cnnp_model_t super;
4853 ccv_nnc_tensor_symbol_t output;
4854 ccv_cnnp_model_debug_f debugger;
4855 ccv_cnnp_model_debug_context_deinit_f debug_deinit;
4856 ccv_cnnp_model_debug_context_copy_f debug_copy;
4857 void* debug_context;
4858} ccv_cnnp_model_debug_t;
4859
4860static int _ccv_cnnp_debug_exec(const ccv_nnc_cmd_t cmd, const ccv_nnc_hint_t hint, const int flags, ccv_nnc_tensor_t* const* const inputs, const int input_size, ccv_nnc_tensor_t* const* const outputs, const int output_size, ccv_nnc_stream_context_t* const stream_context)
4861{
4862 if (cmd.cmd == CCV_NNC_CUSTOM_BACKWARD)
4863 {
4864 assert(0 && "don't support debug backward pass yet")((void) sizeof ((0 && "don't support debug backward pass yet"
) ? 1 : 0), __extension__ ({ if (0 && "don't support debug backward pass yet"
) ; else __assert_fail ("0 && \"don't support debug backward pass yet\""
, "ccv_cnnp_model_addons.c", 4864, __extension__ __PRETTY_FUNCTION__
); }))
;
4865 }
4866 ccv_cnnp_model_debug_t* const self = (ccv_cnnp_model_debug_t*)cmd.data;
4867 self->debugger(inputs, input_size, stream_context, self->debug_context);
4868 return CCV_NNC_EXEC_SUCCESS;
4869}
4870
4871static ccv_nnc_cmd_vtab_t ccv_cnnp_debug_exec_isa = {
4872 .exec = _ccv_cnnp_debug_exec
4873};
4874
4875static void _ccv_cnnp_debug_build(ccv_cnnp_model_t* const self, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
4876{
4877 PRINT(CCV_CLI_VERBOSE, "[cnnp_debug_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_debug_build] -\n"); fflush(stdout); } } while
(0)
;
4878 assert(input_size >= 1)((void) sizeof ((input_size >= 1) ? 1 : 0), __extension__ (
{ if (input_size >= 1) ; else __assert_fail ("input_size >= 1"
, "ccv_cnnp_model_addons.c", 4878, __extension__ __PRETTY_FUNCTION__
); }))
;
4879 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 4879, __extension__ __PRETTY_FUNCTION__
); }))
;
4880 ccv_nnc_tensor_symbol_t to = ccv_nnc_tensor_symbol_alias_to(graph, inputs[0]);
4881 ccv_nnc_tensor_param_t output_params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
4882 if (to.d == CCV_NNC_NO_TENSOR_SYMBOL) // If we are not reshape an alias, it is straightforward.
4883 {
4884 int ofs[CCV_NNC_MAX_DIM_ALLOC(12)] = {0};
4885 int stride[CCV_NNC_MAX_DIM_ALLOC(12)];
4886 ccv_nnc_tensor_get_stride(output_params.dim, stride);
4887 outputs[0] = ccv_nnc_tensor_symbol_alias_new(graph, inputs[0], ofs, stride, output_params, 0);
4888 } else {
4889 int old_ofs[CCV_NNC_MAX_DIM_ALLOC(12)];
4890 int old_stride[CCV_NNC_MAX_DIM_ALLOC(12)];
4891 ccv_nnc_tensor_symbol_alias_params(graph, inputs[0], old_ofs, old_stride);
4892 outputs[0] = ccv_nnc_tensor_symbol_alias_new(graph, to, old_ofs, old_stride, output_params, 0);
4893 }
4894 ccv_nnc_cmd_t cmd = ccv_nnc_cmd(CCV_NNC_CUSTOM_FORWARD, (ccv_nnc_cmd_vtab_t*)&ccv_cnnp_debug_exec_isa, (ccv_nnc_cmd_param_t){}, 0);
4895 cmd.data = self;
4896 ccv_nnc_graph_exec_symbol_t make_debug = ccv_nnc_graph_exec_symbol_new(graph, cmd, inputs, input_size, outputs, 1, "debug");
4897 // Disable any optimizations.
4898 ccv_nnc_graph_exec_symbol_set_flags(graph, make_debug, CCV_NNC_GRAPH_EXEC_DISABLE_OPT);
4899}
4900
4901static void _ccv_cnnp_debug_deinit(ccv_cnnp_model_t* const super)
4902{
4903 const ccv_cnnp_model_debug_t* const self = (const ccv_cnnp_model_debug_t*)super;
4904 if (self->debug_deinit && self->debug_context)
4905 self->debug_deinit(self->debug_context);
4906}
4907
4908static ccv_cnnp_model_t* _ccv_cnnp_debug_copy(const ccv_cnnp_model_t* const super, void* const context);
4909
4910static const ccv_cnnp_model_vtab_t ccv_cnnp_debug_isa = {
4911 .build = _ccv_cnnp_debug_build,
4912 .deinit = _ccv_cnnp_debug_deinit,
4913 .copy = _ccv_cnnp_debug_copy,
4914};
4915
4916ccv_cnnp_model_t* ccv_cnnp_debug(ccv_cnnp_model_debug_f func, void* const context, ccv_cnnp_model_debug_context_deinit_f deinit, ccv_cnnp_model_debug_context_copy_f copy, const char* const name)
4917{
4918 ccv_cnnp_model_debug_t* const model_debug = (ccv_cnnp_model_debug_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_debug_t));
4919 model_debug->super.isa = &ccv_cnnp_debug_isa;
4920 model_debug->super.input_size = 0;
4921 model_debug->super.outputs = &model_debug->output;
4922 model_debug->super.output_size = 1;
4923 model_debug->debugger = func;
4924 model_debug->debug_context = context;
4925 model_debug->debug_deinit = deinit;
4926 model_debug->debug_copy = copy;
4927 ccv_cnnp_model_copy_name(&model_debug->super, name);
4928 return (ccv_cnnp_model_t*)model_debug;
4929}
4930
4931static ccv_cnnp_model_t* _ccv_cnnp_debug_copy(const ccv_cnnp_model_t* const super, void* const context)
4932{
4933 const ccv_cnnp_model_debug_t* const self = (const ccv_cnnp_model_debug_t*)super;
4934 void* debug_context = self->debug_context;
4935 if (self->debug_copy && self->debug_context)
4936 debug_context = self->debug_copy(self->debug_context);
4937 return ccv_cnnp_debug(self->debugger, debug_context, self->debug_deinit, self->debug_copy, self->super.name);
4938}
4939
4940/// MARK - Sort layer.
4941
4942typedef struct {
4943 ccv_cnnp_model_t super;
4944 ccv_nnc_tensor_symbol_t outputs[2];
4945 int along_axis;
4946 int descending;
4947} ccv_cnnp_model_sort_t;
4948
4949static void _ccv_cnnp_sort_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
4950{
4951 ccv_cnnp_model_sort_t* const self = (ccv_cnnp_model_sort_t*)super;
4952 PRINT(CCV_CLI_VERBOSE, "[cnnp_sort_build] - along_axis: %d, descending: %d\n", self->along_axis, self->descending)do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_sort_build] - along_axis: %d, descending: %d\n"
, self->along_axis, self->descending); fflush(stdout); }
} while (0)
;
4953 ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
4954 assert(output_size == 2)((void) sizeof ((output_size == 2) ? 1 : 0), __extension__ ({
if (output_size == 2) ; else __assert_fail ("output_size == 2"
, "ccv_cnnp_model_addons.c", 4954, __extension__ __PRETTY_FUNCTION__
); }))
;
4955 outputs[0] = ccv_nnc_tensor_symbol_new(graph, params, 0);
4956 params.datatype = CCV_32S;
4957 outputs[1] = ccv_nnc_tensor_symbol_new(graph, params, 0);
4958 ccv_nnc_graph_exec_symbol_new(graph, CMD_SORT_FORWARD(self->along_axis, self->descending)ccv_nnc_cmd(CCV_NNC_SORT_FORWARD, 0, ((ccv_nnc_cmd_param_t){.
size={.dim={1,1,1}},.sort={.along_axis=self->along_axis,.descending
=self->descending}}), 0)
, inputs, input_size, outputs, output_size, "sort");
4959}
4960
4961static ccv_cnnp_model_t* _ccv_cnnp_sort_copy(const ccv_cnnp_model_t* const self, void* const context);
4962
4963static const ccv_cnnp_model_vtab_t ccv_cnnp_sort_isa = {
4964 .build = _ccv_cnnp_sort_build,
4965 .copy = _ccv_cnnp_sort_copy,
4966};
4967
4968ccv_cnnp_model_t* ccv_cnnp_sort(const int along_axis, const int descending, const char* const name)
4969{
4970 ccv_cnnp_model_sort_t* const model_sort = (ccv_cnnp_model_sort_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_sort_t));
4971 model_sort->super.isa = &ccv_cnnp_sort_isa;
4972 model_sort->super.input_size = 0;
4973 model_sort->super.outputs = model_sort->outputs;
4974 model_sort->super.output_size = 2;
4975 model_sort->along_axis = along_axis;
4976 model_sort->descending = descending;
4977 ccv_cnnp_model_copy_name(&model_sort->super, name);
4978 return (ccv_cnnp_model_t*)model_sort;
4979}
4980
4981static ccv_cnnp_model_t* _ccv_cnnp_sort_copy(const ccv_cnnp_model_t* const super, void* const context)
4982{
4983 ccv_cnnp_model_sort_t* const self = (ccv_cnnp_model_sort_t*)super;
4984 return ccv_cnnp_sort(self->along_axis, self->descending, self->super.name);
4985}
4986
4987/// MARK - Partition layer.
4988
4989typedef struct {
4990 ccv_cnnp_model_t super;
4991 ccv_nnc_tensor_symbol_t outputs[2];
4992 int kth;
4993 int along_axis;
4994 int descending;
4995} ccv_cnnp_model_partition_t;
4996
4997static void _ccv_cnnp_partition_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
4998{
4999 ccv_cnnp_model_partition_t* const self = (ccv_cnnp_model_partition_t*)super;
5000 PRINT(CCV_CLI_VERBOSE, "[cnnp_partition_build] - kth: %d, along_axis: %d, descending: %d\n", self->kth, self->along_axis, self->descending)do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_partition_build] - kth: %d, along_axis: %d, descending: %d\n"
, self->kth, self->along_axis, self->descending); fflush
(stdout); } } while (0)
;
5001 ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
5002 assert(output_size == 2)((void) sizeof ((output_size == 2) ? 1 : 0), __extension__ ({
if (output_size == 2) ; else __assert_fail ("output_size == 2"
, "ccv_cnnp_model_addons.c", 5002, __extension__ __PRETTY_FUNCTION__
); }))
;
5003 if (self->kth > 0)
5004 params.dim[self->along_axis] = self->kth;
5005 outputs[0] = ccv_nnc_tensor_symbol_new(graph, params, 0);
5006 params.datatype = CCV_32S;
5007 outputs[1] = ccv_nnc_tensor_symbol_new(graph, params, 0);
5008 ccv_nnc_graph_exec_symbol_new(graph, CMD_PARTITION_FORWARD(self->kth, self->along_axis, self->descending)ccv_nnc_cmd(CCV_NNC_PARTITION_FORWARD, 0, ((ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.partition={.kth=self->kth,.along_axis
=self->along_axis,.descending=self->descending}}), 0)
, inputs, input_size, outputs, output_size, "partition");
5009}
5010
5011static ccv_cnnp_model_t* _ccv_cnnp_partition_copy(const ccv_cnnp_model_t* const self, void* const context);
5012
5013static const ccv_cnnp_model_vtab_t ccv_cnnp_partition_isa = {
5014 .build = _ccv_cnnp_partition_build,
5015 .copy = _ccv_cnnp_partition_copy,
5016};
5017
5018ccv_cnnp_model_t* ccv_cnnp_partition(const int kth, const int along_axis, const int descending, const char* const name)
5019{
5020 ccv_cnnp_model_partition_t* const model_partition = (ccv_cnnp_model_partition_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_partition_t));
5021 model_partition->super.isa = &ccv_cnnp_partition_isa;
5022 model_partition->super.input_size = 0;
5023 model_partition->super.outputs = model_partition->outputs;
5024 model_partition->super.output_size = 2;
5025 model_partition->kth = kth;
5026 model_partition->along_axis = along_axis;
5027 model_partition->descending = descending;
5028 ccv_cnnp_model_copy_name(&model_partition->super, name);
5029 return (ccv_cnnp_model_t*)model_partition;
5030}
5031
5032static ccv_cnnp_model_t* _ccv_cnnp_partition_copy(const ccv_cnnp_model_t* const super, void* const context)
5033{
5034 ccv_cnnp_model_partition_t* const self = (ccv_cnnp_model_partition_t*)super;
5035 return ccv_cnnp_partition(self->kth, self->along_axis, self->descending, self->super.name);
5036}
5037
5038/// MARK - Unique consecutive layer.
5039
5040typedef struct {
5041 ccv_cnnp_model_t super;
5042 ccv_nnc_tensor_symbol_t outputs[2];
5043 int bincount;
5044} ccv_cnnp_model_unique_consecutive_t;
5045
5046static void _ccv_cnnp_unique_consecutive_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
5047{
5048 ccv_cnnp_model_unique_consecutive_t* const self = (ccv_cnnp_model_unique_consecutive_t*)super;
5049 PRINT(CCV_CLI_VERBOSE, "[cnnp_unique_consecutive_build] - bincount: %d\n", self->bincount)do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_unique_consecutive_build] - bincount: %d\n",
self->bincount); fflush(stdout); } } while (0)
;
5050 ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
5051 assert(output_size == 2)((void) sizeof ((output_size == 2) ? 1 : 0), __extension__ ({
if (output_size == 2) ; else __assert_fail ("output_size == 2"
, "ccv_cnnp_model_addons.c", 5051, __extension__ __PRETTY_FUNCTION__
); }))
;
5052 if (self->bincount > 0)
5053 params.dim[0] = ccv_min(params.dim[0], self->bincount)({ typeof (params.dim[0]) _a = (params.dim[0]); typeof (self->
bincount) _b = (self->bincount); (_a < _b) ? _a : _b; }
)
;
5054 outputs[0] = ccv_nnc_tensor_symbol_new(graph, params, 0);
5055 params.datatype = CCV_32S;
5056 outputs[1] = ccv_nnc_tensor_symbol_new(graph, params, 0);
5057 ccv_nnc_graph_exec_symbol_new(graph, CMD_UNIQUE_CONSECUTIVE_FORWARD(self->bincount)ccv_nnc_cmd(CCV_NNC_UNIQUE_CONSECUTIVE_FORWARD, 0, ((ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.unique_consecutive={.bincount=self->
bincount}}), 0)
, inputs, input_size, outputs, output_size, "unique_consecutive");
5058}
5059
5060static ccv_cnnp_model_t* _ccv_cnnp_unique_consecutive_copy(const ccv_cnnp_model_t* const self, void* const context);
5061
5062static const ccv_cnnp_model_vtab_t ccv_cnnp_unique_consecutive_isa = {
5063 .build = _ccv_cnnp_unique_consecutive_build,
5064 .copy = _ccv_cnnp_unique_consecutive_copy,
5065};
5066
5067ccv_cnnp_model_t* ccv_cnnp_unique_consecutive(const int bincount, const char* const name)
5068{
5069 ccv_cnnp_model_unique_consecutive_t* const model_unique_consecutive = (ccv_cnnp_model_unique_consecutive_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_unique_consecutive_t));
5070 model_unique_consecutive->super.isa = &ccv_cnnp_unique_consecutive_isa;
5071 model_unique_consecutive->super.input_size = 0;
5072 model_unique_consecutive->super.outputs = model_unique_consecutive->outputs;
5073 model_unique_consecutive->super.output_size = 2;
5074 model_unique_consecutive->bincount = bincount;
5075 ccv_cnnp_model_copy_name(&model_unique_consecutive->super, name);
5076 return (ccv_cnnp_model_t*)model_unique_consecutive;
5077}
5078
5079static ccv_cnnp_model_t* _ccv_cnnp_unique_consecutive_copy(const ccv_cnnp_model_t* const super, void* const context)
5080{
5081 ccv_cnnp_model_unique_consecutive_t* const self = (ccv_cnnp_model_unique_consecutive_t*)super;
5082 return ccv_cnnp_unique_consecutive(self->bincount, self->super.name);
5083}
5084
5085/// MARK - Scatter add layer.
5086
5087typedef struct {
5088 ccv_cnnp_model_t super;
5089 ccv_nnc_tensor_symbol_t output;
5090 int bincount;
5091} ccv_cnnp_model_scatter_add_t;
5092
5093static void _ccv_cnnp_scatter_add_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
5094{
5095 ccv_cnnp_model_scatter_add_t* const self = (ccv_cnnp_model_scatter_add_t*)super;
5096 PRINT(CCV_CLI_VERBOSE, "[cnnp_scatter_add_build] - bincount: %d\n", self->bincount)do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_scatter_add_build] - bincount: %d\n", self->
bincount); fflush(stdout); } } while (0)
;
5097 ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
5098 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 5098, __extension__ __PRETTY_FUNCTION__
); }))
;
5099 assert(self->bincount > 0)((void) sizeof ((self->bincount > 0) ? 1 : 0), __extension__
({ if (self->bincount > 0) ; else __assert_fail ("self->bincount > 0"
, "ccv_cnnp_model_addons.c", 5099, __extension__ __PRETTY_FUNCTION__
); }))
;
5100 params.dim[0] = self->bincount;
5101 outputs[0] = ccv_nnc_tensor_symbol_new(graph, params, 0);
5102 ccv_nnc_graph_exec_symbol_new(graph, CMD_SCATTER_ADD_FORWARD(self->bincount)ccv_nnc_cmd(CCV_NNC_SCATTER_ADD_FORWARD, 0, ((ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.scatter_add={.bincount=self->bincount
}}), 0)
, inputs, input_size, outputs, output_size, "scatter_add");
5103}
5104
5105static ccv_cnnp_model_t* _ccv_cnnp_scatter_add_copy(const ccv_cnnp_model_t* const self, void* const context);
5106
5107static const ccv_cnnp_model_vtab_t ccv_cnnp_scatter_add_isa = {
5108 .build = _ccv_cnnp_scatter_add_build,
5109 .copy = _ccv_cnnp_scatter_add_copy,
5110};
5111
5112ccv_cnnp_model_t* ccv_cnnp_scatter_add(const int bincount, const char* const name)
5113{
5114 assert(bincount > 0)((void) sizeof ((bincount > 0) ? 1 : 0), __extension__ ({ if
(bincount > 0) ; else __assert_fail ("bincount > 0", "ccv_cnnp_model_addons.c"
, 5114, __extension__ __PRETTY_FUNCTION__); }))
;
5115 ccv_cnnp_model_scatter_add_t* const model_scatter_add = (ccv_cnnp_model_scatter_add_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_scatter_add_t));
5116 model_scatter_add->super.isa = &ccv_cnnp_scatter_add_isa;
5117 model_scatter_add->super.input_size = 0;
5118 model_scatter_add->super.outputs = &model_scatter_add->output;
5119 model_scatter_add->super.output_size = 1;
5120 model_scatter_add->bincount = bincount;
5121 ccv_cnnp_model_copy_name(&model_scatter_add->super, name);
5122 return (ccv_cnnp_model_t*)model_scatter_add;
5123}
5124
5125static ccv_cnnp_model_t* _ccv_cnnp_scatter_add_copy(const ccv_cnnp_model_t* const super, void* const context)
5126{
5127 ccv_cnnp_model_scatter_add_t* const self = (ccv_cnnp_model_scatter_add_t*)super;
5128 return ccv_cnnp_scatter_add(self->bincount, self->super.name);
5129}
5130
5131// MARK - Segmented Dense Layer
5132
5133typedef struct {
5134 ccv_cnnp_model_t super;
5135 ccv_nnc_tensor_symbol_t output;
5136 ccv_nnc_tensor_symbol_t weights;
5137 ccv_nnc_tensor_symbol_t bias;
5138 int segments;
5139 int count;
5140 int no_bias;
5141 int flags;
5142} ccv_cnnp_model_segmented_dense_t;
5143
5144static void _ccv_cnnp_segmented_dense_build(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_nnc_tensor_symbol_t* const inputs, const int input_size, ccv_nnc_tensor_symbol_t* const outputs, const int output_size)
5145{
5146 ccv_cnnp_model_segmented_dense_t* const self = (ccv_cnnp_model_segmented_dense_t*)super;
5147 PRINT(CCV_CLI_VERBOSE, "[cnnp_segmented_dense_build] -\n")do { if ((CCV_CLI_VERBOSE & ccv_cli_get_output_levels()))
{ printf("[cnnp_segmented_dense_build] -\n"); fflush(stdout)
; } } while (0)
;
5148 assert(input_size == 3)((void) sizeof ((input_size == 3) ? 1 : 0), __extension__ ({ if
(input_size == 3) ; else __assert_fail ("input_size == 3", "ccv_cnnp_model_addons.c"
, 5148, __extension__ __PRETTY_FUNCTION__); }))
;
5149 assert(output_size == 1)((void) sizeof ((output_size == 1) ? 1 : 0), __extension__ ({
if (output_size == 1) ; else __assert_fail ("output_size == 1"
, "ccv_cnnp_model_addons.c", 5149, __extension__ __PRETTY_FUNCTION__
); }))
;
5150 const ccv_nnc_tensor_param_t params = ccv_nnc_tensor_symbol_params(graph, inputs[0]);
5151 const ccv_nnc_tensor_param_t indices_params = ccv_nnc_tensor_symbol_params(graph, inputs[1]);
5152 const ccv_nnc_tensor_param_t counts_params = ccv_nnc_tensor_symbol_params(graph, inputs[2]);
5153 ccv_nnc_tensor_param_t weights_params = params;
5154 memset(weights_params.dim, 0, sizeof(weights_params.dim));
5155 weights_params.dim[0] = self->segments;
5156 weights_params.dim[1] = self->count;
5157 weights_params.dim[2] = params.dim[ccv_nnc_tensor_nd(params.dim) - 1];
5158 if (!self->weights.graph)
5159 self->weights = ccv_nnc_tensor_symbol_new(graph, weights_params, "weights");
5160 assert(self->weights.graph == graph)((void) sizeof ((self->weights.graph == graph) ? 1 : 0), __extension__
({ if (self->weights.graph == graph) ; else __assert_fail
("self->weights.graph == graph", "ccv_cnnp_model_addons.c"
, 5160, __extension__ __PRETTY_FUNCTION__); }))
;
5161 const ccv_nnc_tensor_symbol_t weights = ccv_cnnp_model_get_symbol(super, self->weights);
5162 ccv_nnc_tensor_param_t bias_params = params;
5163 memset(bias_params.dim, 0, sizeof(bias_params.dim));
5164 bias_params.dim[0] = self->segments;
5165 bias_params.dim[1] = self->count;
5166 ccv_nnc_cmd_t cmd = {0};
5167 cmd.cmd = CCV_NNC_SEGMENTED_GEMM_FORWARD;
5168 cmd.info.blas.a[0] = 1;
5169 cmd.info.blas.a[1] = 1;
5170 cmd.info.blas.transpose_b[0] = 1;
5171 cmd.info.blas.transpose_b[1] = 2;
5172 cmd.info.blas.flags = self->flags;
5173 ccv_nnc_tensor_param_t output_params;
5174 ccv_nnc_hint_tensor_auto(cmd, (ccv_nnc_tensor_param_t []){
5175 params, indices_params, counts_params,
5176 weights_params,
5177 bias_params,
5178 }, 5, ccv_nnc_no_hint, &output_params, 1);
5179 const ccv_nnc_tensor_symbol_t output = ccv_nnc_tensor_symbol_new(graph, output_params, 0);
5180 if (self->no_bias)
5181 ccv_nnc_graph_exec_symbol_new(graph, cmd, TENSOR_SYMBOL_LIST(inputs[0], inputs[1], inputs[2], weights)(const ccv_nnc_tensor_symbol_t []){inputs[0], inputs[1], inputs
[2], weights}, (1 +1 +1 +1 +1 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(output)(const ccv_nnc_tensor_symbol_t []){output}, (1 +1 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, "segmented_dense");
5182 else {
5183 if (!self->bias.graph)
5184 self->bias = ccv_nnc_tensor_symbol_new(graph, bias_params, "bias");
5185 const ccv_nnc_tensor_symbol_t bias = ccv_cnnp_model_get_symbol(super, self->bias);
5186 ccv_nnc_graph_exec_symbol_new(graph, cmd, TENSOR_SYMBOL_LIST(inputs[0], inputs[1], inputs[2], weights, bias)(const ccv_nnc_tensor_symbol_t []){inputs[0], inputs[1], inputs
[2], weights, bias}, (1 +1 +1 +1 +1 +1 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, TENSOR_SYMBOL_LIST(output)(const ccv_nnc_tensor_symbol_t []){output}, (1 +1 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +
0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0
+0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 -1)
, "segmented_dense");
5187 }
5188 outputs[0] = output;
5189}
5190
5191static void _ccv_cnnp_segmented_dense_init_states(ccv_cnnp_model_t* const super, ccv_nnc_symbolic_graph_t* const graph, const ccv_cnnp_state_initializer_f initializer, void* const context)
5192{
5193 ccv_cnnp_model_segmented_dense_t* const self = (ccv_cnnp_model_segmented_dense_t*)super;
5194 const ccv_nnc_tensor_param_t weight_params = ccv_nnc_tensor_symbol_params(graph, self->weights);
5195 const int c = weight_params.dim[1];
5196 const float std = sqrtf(2) / sqrtf(c);
5197 const float bound = sqrtf(3) * std;
5198 initializer(context, CMD_RANDOM_UNIFORM_FORWARD(-bound, bound)ccv_nnc_cmd(CCV_NNC_RANDOM_UNIFORM_FORWARD, 0, (ccv_nnc_cmd_param_t
){.size={.dim={1,1,1}},.blas={.a={-bound, bound}}}, 0)
, ccv_nnc_no_hint, 0, 0, self->weights);
5199 if (self->bias.graph)
5200 initializer(context, CMD_SET_FORWARD(0)ccv_nnc_cmd(CCV_NNC_SET_FORWARD, 0, (ccv_nnc_cmd_param_t){.size
={.dim={1,1,1}},.blas={.a={0,}}}, 0)
, ccv_nnc_no_hint, 0, 0, self->bias);
5201}
5202
5203static void _ccv_cnnp_segmented_dense_add_to_parameter(ccv_cnnp_model_t* const super, const ccv_cnnp_add_to_array_f add_to_array, void* const parameters, const int is_trainable)
5204{
5205 ccv_cnnp_model_segmented_dense_t* const self = (ccv_cnnp_model_segmented_dense_t*)super;
5206 add_to_array(parameters, self->weights, is_trainable);
5207 if (self->bias.graph)
5208 add_to_array(parameters, self->bias, is_trainable);
5209}
5210
5211static ccv_cnnp_model_t* _ccv_cnnp_segmented_dense_copy(const ccv_cnnp_model_t* const super, void* const context);
5212
5213static const ccv_cnnp_model_vtab_t ccv_cnnp_segmented_dense_isa = {
5214 .build = _ccv_cnnp_segmented_dense_build,
5215 .init_states = _ccv_cnnp_segmented_dense_init_states,
5216 .add_to_parameter = _ccv_cnnp_segmented_dense_add_to_parameter,
5217 .copy = _ccv_cnnp_segmented_dense_copy,
5218};
5219
5220ccv_cnnp_model_t* ccv_cnnp_segmented_dense(const int segments, const int count, const int no_bias, const int flags, const int is_trainable, const char* const name)
5221{
5222 ccv_cnnp_model_segmented_dense_t* const model_segmented_dense = (ccv_cnnp_model_segmented_dense_t*)cccalloccalloc(1, sizeof(ccv_cnnp_model_segmented_dense_t));
5223 model_segmented_dense->super.isa = &ccv_cnnp_segmented_dense_isa;
5224 model_segmented_dense->super.input_size = 3;
5225 model_segmented_dense->super.outputs = &model_segmented_dense->output;
5226 model_segmented_dense->super.output_size = 1;
5227 model_segmented_dense->super.is_trainable = is_trainable;
5228 ccv_cnnp_model_copy_name(&model_segmented_dense->super, name);
5229 model_segmented_dense->weights.d = CCV_NNC_NO_TENSOR_SYMBOL;
5230 model_segmented_dense->weights.graph = 0;
5231 model_segmented_dense->bias.d = CCV_NNC_NO_TENSOR_SYMBOL;
5232 model_segmented_dense->bias.graph = 0;
5233 model_segmented_dense->segments = segments;
5234 model_segmented_dense->count = count;
5235 model_segmented_dense->no_bias = no_bias;
5236 model_segmented_dense->flags = flags;
5237 return (ccv_cnnp_model_t*)model_segmented_dense;
5238}
5239
5240static ccv_cnnp_model_t* _ccv_cnnp_segmented_dense_copy(const ccv_cnnp_model_t* const super, void* const context)
5241{
5242 const ccv_cnnp_model_segmented_dense_t* const self = (const ccv_cnnp_model_segmented_dense_t*)super;
5243 return ccv_cnnp_segmented_dense(self->segments, self->count, self->no_bias, self->flags, self->super.is_trainable, self->super.name);
5244}