Sha256: cbdcba7dfdff0966e752c224239119cdc2544a642c1dc1e917b75603517d1388
Contents?: true
Size: 1.81 KB
Versions: 1
Compression:
Stored size: 1.81 KB
Contents
static void <%=c_iter%>(na_loop_t *const lp) { size_t n; size_t p1, p3; ssize_t s1, s3; size_t *idx1, *idx3; int o1, l1, r1, len; BIT_DIGIT *a1, *a3; BIT_DIGIT x; // TODO(sonots): CUDA kernelize SHOW_SYNCHRONIZE_FIXME_WARNING_ONCE("<%=name%>", "<%=type_name%>"); cumo_cuda_runtime_check_status(cudaDeviceSynchronize()); INIT_COUNTER(lp, n); INIT_PTR_BIT_IDX(lp, 0, a3, p3, s3, idx3); INIT_PTR_BIT_IDX(lp, 1, a1, p1, s1, idx1); if (s1!=1 || s3!=1 || idx1 || idx3) { for (; n--;) { LOAD_BIT_STEP(a1, p1, s1, idx1, x); STORE_BIT_STEP(a3, p3, s3, idx3, x); } } else { o1 = p1 % NB; o1 -= p3; l1 = NB+o1; r1 = NB-o1; if (p3>0 || n<NB) { len = NB - p3; if ((int)n<len) len=n; if (o1>=0) x = *a1>>o1; else x = *a1<<-o1; if (p1+len>NB) x |= *(a1+1)<<r1; a1++; *a3 = (x & (SLB(len)<<p3)) | (*a3 & ~(SLB(len)<<p3)); a3++; n -= len; } if (o1==0) { for (; n>=NB; n-=NB) { x = *(a1++); *(a3++) = x; } } else { for (; n>=NB; n-=NB) { x = *a1>>o1; if (o1<0) x |= *(a1-1)>>l1; if (o1>0) x |= *(a1+1)<<r1; a1++; *(a3++) = x; } } if (n>0) { x = *a1>>o1; if (o1<0) x |= *(a1-1)>>l1; *a3 = (x & SLB(n)) | (*a3 & BALL<<n); } } } static VALUE <%=c_func(:nodef)%>(VALUE self, VALUE obj) { ndfunc_arg_in_t ain[2] = {{OVERWRITE,0},{Qnil,0}}; ndfunc_t ndf = {<%=c_iter%>, FULL_LOOP, 2,0, ain,0}; na_ndloop(&ndf, 2, self, obj); return self; }
Version data entries
1 entries across 1 versions & 1 rubygems
Version | Path |
---|---|
cumo-0.1.0 | ext/cumo/narray/gen/tmpl_bit/store_bit.c |