Convolution CL Codes
vstore2 and vload2 functions
__kernel void default_function_kernel0(__global float* restrict A, __global float* restrict W, __global float* restrict B) {
float B_local[64];
__local float Apad_shared[8];
__local float W_shared[128];
float Apad_shared_local[8];
float W_shared_local[8];
for (int ff_c_init = 0; ff_c_init < 4; ++ff_c_init) {